LLVM 23.0.0git
ConstantFolding.cpp
Go to the documentation of this file.
1//===-- ConstantFolding.cpp - Fold instructions into constants ------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines routines for folding instructions into constants.
10//
11// Also, to supplement the basic IR ConstantExpr simplifications,
12// this file defines some additional folding routines that can make use of
13// DataLayout information. These functions cannot go in IR due to library
14// dependency issues.
15//
16//===----------------------------------------------------------------------===//
17
19#include "llvm/ADT/APFloat.h"
20#include "llvm/ADT/APInt.h"
21#include "llvm/ADT/APSInt.h"
22#include "llvm/ADT/ArrayRef.h"
23#include "llvm/ADT/DenseMap.h"
24#include "llvm/ADT/STLExtras.h"
27#include "llvm/ADT/StringRef.h"
32#include "llvm/Config/config.h"
33#include "llvm/IR/Constant.h"
35#include "llvm/IR/Constants.h"
36#include "llvm/IR/DataLayout.h"
38#include "llvm/IR/Function.h"
39#include "llvm/IR/GlobalValue.h"
41#include "llvm/IR/InstrTypes.h"
42#include "llvm/IR/Instruction.h"
45#include "llvm/IR/Intrinsics.h"
46#include "llvm/IR/IntrinsicsAArch64.h"
47#include "llvm/IR/IntrinsicsAMDGPU.h"
48#include "llvm/IR/IntrinsicsARM.h"
49#include "llvm/IR/IntrinsicsNVPTX.h"
50#include "llvm/IR/IntrinsicsWebAssembly.h"
51#include "llvm/IR/IntrinsicsX86.h"
53#include "llvm/IR/Operator.h"
54#include "llvm/IR/Type.h"
55#include "llvm/IR/Value.h"
60#include <cassert>
61#include <cerrno>
62#include <cfenv>
63#include <cmath>
64#include <cstdint>
65
66using namespace llvm;
67
69 "disable-fp-call-folding",
70 cl::desc("Disable constant-folding of FP intrinsics and libcalls."),
71 cl::init(false), cl::Hidden);
72
73namespace {
74
75//===----------------------------------------------------------------------===//
76// Constant Folding internal helper functions
77//===----------------------------------------------------------------------===//
78
79static Constant *foldConstVectorToAPInt(APInt &Result, Type *DestTy,
80 Constant *C, Type *SrcEltTy,
81 unsigned NumSrcElts,
82 const DataLayout &DL) {
83 // Now that we know that the input value is a vector of integers, just shift
84 // and insert them into our result.
85 unsigned BitShift = DL.getTypeSizeInBits(SrcEltTy);
86 for (unsigned i = 0; i != NumSrcElts; ++i) {
87 Constant *Element;
88 if (DL.isLittleEndian())
89 Element = C->getAggregateElement(NumSrcElts - i - 1);
90 else
91 Element = C->getAggregateElement(i);
92
93 if (isa_and_nonnull<UndefValue>(Element)) {
94 Result <<= BitShift;
95 continue;
96 }
97
98 auto *ElementCI = dyn_cast_or_null<ConstantInt>(Element);
99 if (!ElementCI)
100 return ConstantExpr::getBitCast(C, DestTy);
101
102 Result <<= BitShift;
103 Result |= ElementCI->getValue().zext(Result.getBitWidth());
104 }
105
106 return nullptr;
107}
108
109/// Check whether folding this bitcast into a byte vector would mix poison and
110/// non-poison bits in the same output lane. While integer types track poison on
111/// a per-value basis, byte types track it on a per-bit basis. However,
112/// `ConstantByte` cannot represent values with both poison and non-poison bits.
113///
114/// Source elements are grouped by the output lane they map to. Returns true if
115/// any group contains both poison and non-poison elements.
116static bool foldMixesPoisonBits(Constant *C, unsigned NumSrcElt,
117 unsigned NumDstElt) {
118 // If element counts don't divide evenly, bail out if a poison source element
119 // might span multiple destination lanes.
120 if (NumSrcElt % NumDstElt != 0)
121 return C->containsPoisonElement();
122 unsigned Ratio = NumSrcElt / NumDstElt;
123 for (unsigned i = 0; i != NumSrcElt; i += Ratio) {
124 bool HasPoison = false;
125 bool HasNonPoison = false;
126 for (unsigned j = 0; j != Ratio; ++j) {
127 Constant *Src = C->getAggregateElement(i + j);
128 // Conservatively bail out.
129 if (!Src)
130 return true;
131 if (isa<PoisonValue>(Src))
132 HasPoison = true;
133 else
134 HasNonPoison = true;
135 }
136 if (HasPoison && HasNonPoison)
137 return true;
138 }
139 return false;
140}
141
142/// Track which destination lanes of a bitcast are produced from poison bytes.
143/// A destination lane is marked if any source element mapped to it is poison.
144/// Returns false if an aggregate element cannot be inspected. The caller should
145/// bail out of folding.
146static bool computePoisonDstLanes(Constant *C, unsigned NumSrcElt,
147 unsigned NumDstElt,
148 SmallBitVector &PoisonDstElts) {
149 // If element counts don't divide evenly, bail out if a poison source element
150 // might span multiple destination lanes.
151 if ((NumDstElt < NumSrcElt ? NumSrcElt % NumDstElt : NumDstElt % NumSrcElt))
152 return !C->containsPoisonElement();
153 if (NumDstElt < NumSrcElt) {
154 unsigned Ratio = NumSrcElt / NumDstElt;
155 for (unsigned i = 0; i != NumDstElt; ++i) {
156 for (unsigned j = 0; j != Ratio; ++j) {
157 Constant *Src = C->getAggregateElement(i * Ratio + j);
158 if (!Src)
159 return false;
160 if (isa<PoisonValue>(Src)) {
161 PoisonDstElts[i] = true;
162 break;
163 }
164 }
165 }
166 } else {
167 unsigned Ratio = NumDstElt / NumSrcElt;
168 for (unsigned i = 0; i != NumSrcElt; ++i) {
169 Constant *Src = C->getAggregateElement(i);
170 if (!Src)
171 return false;
172 if (isa<PoisonValue>(Src))
173 PoisonDstElts.set(i * Ratio, (i + 1) * Ratio);
174 }
175 }
176 return true;
177}
178
179/// Constant fold bitcast, symbolically evaluating it with DataLayout.
180/// This always returns a non-null constant, but it may be a
181/// ConstantExpr if unfoldable.
182Constant *FoldBitCast(Constant *C, Type *DestTy, const DataLayout &DL) {
183 assert(CastInst::castIsValid(Instruction::BitCast, C, DestTy) &&
184 "Invalid constantexpr bitcast!");
185
186 // Catch the obvious splat cases.
187 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
188 return Res;
189
190 if (auto *VTy = dyn_cast<VectorType>(C->getType())) {
191 // Handle a vector->scalar integer/fp cast.
192 if (isa<IntegerType>(DestTy) || DestTy->isFloatingPointTy()) {
193 unsigned NumSrcElts = cast<FixedVectorType>(VTy)->getNumElements();
194 Type *SrcEltTy = VTy->getElementType();
195
196 // Bitcasting a byte containing any poison bit to an integer or fp type
197 // yields poison.
198 if (SrcEltTy->isByteTy() && C->containsPoisonElement())
199 return PoisonValue::get(DestTy);
200
201 // If the vector is a vector of floating point or bytes, convert it to a
202 // vector of int to simplify things.
203 if (SrcEltTy->isFloatingPointTy() || SrcEltTy->isByteTy()) {
204 unsigned Width = SrcEltTy->getPrimitiveSizeInBits();
205 auto *SrcIVTy = FixedVectorType::get(
206 IntegerType::get(C->getContext(), Width), NumSrcElts);
207 // Ask IR to do the conversion now that #elts line up.
208 C = ConstantExpr::getBitCast(C, SrcIVTy);
209 }
210
211 APInt Result(DL.getTypeSizeInBits(DestTy), 0);
212 if (Constant *CE = foldConstVectorToAPInt(Result, DestTy, C,
213 SrcEltTy, NumSrcElts, DL))
214 return CE;
215
216 if (isa<IntegerType>(DestTy))
217 return ConstantInt::get(DestTy, Result);
218
219 APFloat FP(DestTy->getFltSemantics(), Result);
220 return ConstantFP::get(DestTy->getContext(), FP);
221 }
222 }
223
224 // The code below only handles casts to vectors currently.
225 auto *DestVTy = dyn_cast<VectorType>(DestTy);
226 if (!DestVTy)
227 return ConstantExpr::getBitCast(C, DestTy);
228
229 // If this is a scalar -> vector cast, convert the input into a <1 x scalar>
230 // vector so the code below can handle it uniformly.
231 if (!isa<VectorType>(C->getType()) &&
233 Constant *Ops = C; // don't take the address of C!
234 return FoldBitCast(ConstantVector::get(Ops), DestTy, DL);
235 }
236
237 // Some of what follows may extend to cover scalable vectors but the current
238 // implementation is fixed length specific.
239 if (!isa<FixedVectorType>(C->getType()))
240 return ConstantExpr::getBitCast(C, DestTy);
241
242 // If this is a bitcast from constant vector -> vector, fold it.
245 return ConstantExpr::getBitCast(C, DestTy);
246
247 // If the element types match, IR can fold it.
248 unsigned NumDstElt = cast<FixedVectorType>(DestVTy)->getNumElements();
249 unsigned NumSrcElt = cast<FixedVectorType>(C->getType())->getNumElements();
250 if (NumDstElt == NumSrcElt)
251 return ConstantExpr::getBitCast(C, DestTy);
252
253 Type *SrcEltTy = cast<VectorType>(C->getType())->getElementType();
254 Type *DstEltTy = DestVTy->getElementType();
255
256 // Otherwise, we're changing the number of elements in a vector, which
257 // requires endianness information to do the right thing. For example,
258 // bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
259 // folds to (little endian):
260 // <4 x i32> <i32 0, i32 0, i32 1, i32 0>
261 // and to (big endian):
262 // <4 x i32> <i32 0, i32 0, i32 0, i32 1>
263
264 // First thing is first. We only want to think about integer here, so if
265 // we have something in FP form, recast it as integer.
266 if (DstEltTy->isFloatingPointTy()) {
267 // Fold to an vector of integers with same size as our FP type.
268 unsigned FPWidth = DstEltTy->getPrimitiveSizeInBits();
269 auto *DestIVTy = FixedVectorType::get(
270 IntegerType::get(C->getContext(), FPWidth), NumDstElt);
271 // Recursively handle this integer conversion, if possible.
272 C = FoldBitCast(C, DestIVTy, DL);
273
274 // Finally, IR can handle this now that #elts line up.
275 return ConstantExpr::getBitCast(C, DestTy);
276 }
277
278 // Handle byte destination type by folding through integers.
279 if (DstEltTy->isByteTy()) {
280 // When combining elements into larger byte values, bail out if the fold
281 // mixes poison and non-poison bits in the same destination element. Byte
282 // types track poison per bit, and no constant value can represent that.
283 if (NumDstElt < NumSrcElt && foldMixesPoisonBits(C, NumSrcElt, NumDstElt))
284 return ConstantExpr::getBitCast(C, DestTy);
285
286 // Fold to a vector of integers with same size as the byte type.
287 unsigned ByteWidth = DstEltTy->getPrimitiveSizeInBits();
288 auto *DestIVTy = FixedVectorType::get(
289 IntegerType::get(C->getContext(), ByteWidth), NumDstElt);
290 C = FoldBitCast(C, DestIVTy, DL);
291 return ConstantExpr::getBitCast(C, DestTy);
292 }
293
294 // Okay, we know the destination is integer, if the input is FP, convert
295 // it to integer first.
296 if (SrcEltTy->isFloatingPointTy()) {
297 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
298 auto *SrcIVTy = FixedVectorType::get(
299 IntegerType::get(C->getContext(), FPWidth), NumSrcElt);
300 // Ask IR to do the conversion now that #elts line up.
301 C = ConstantExpr::getBitCast(C, SrcIVTy);
302 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
304 "Constant folding cannot fail for plain fp->int bitcast!");
305 }
306
307 // Handle byte source type by folding through integers. Byte types track
308 // poison per bit, so any poison bit makes the destination lane poison.
309 // Record which destination lanes contain poison bits, before the generic
310 // fold below refines them to undef/zero, so they can be restored.
311 SmallBitVector PoisonDstElts(NumDstElt);
312 if (SrcEltTy->isByteTy()) {
313 if (!computePoisonDstLanes(C, NumSrcElt, NumDstElt, PoisonDstElts))
314 return ConstantExpr::getBitCast(C, DestTy);
315
316 unsigned ByteWidth = SrcEltTy->getPrimitiveSizeInBits();
317 auto *SrcIVTy = FixedVectorType::get(
318 IntegerType::get(C->getContext(), ByteWidth), NumSrcElt);
319 // Ask IR to do the conversion now that #elts line up.
320 C = ConstantExpr::getBitCast(C, SrcIVTy);
321 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
323 "Constant folding cannot fail for plain byte->int bitcast!");
324 }
325
326 // Now we know that the input and output vectors are both integer vectors
327 // of the same size, and that their #elements is not the same.
328 // Use data buffer for easy non-integer element ratio vectors handling,
329 // For example: <4 x i24> to <3 x i32>.
330 bool isLittleEndian = DL.isLittleEndian();
331 unsigned SrcBitSize = SrcEltTy->getPrimitiveSizeInBits();
332 unsigned DstBitSize = DstEltTy->getPrimitiveSizeInBits();
334 unsigned SrcElt = 0;
335
336 APInt Buffer(2 * std::max(SrcBitSize, DstBitSize), 0);
337 APInt UndefMask(Buffer.getBitWidth(), 0);
338 APInt PoisonMask(Buffer.getBitWidth(), 0);
339 unsigned BufferBitSize = 0;
340
341 while (Result.size() != NumDstElt) {
342 // Load SrcElts into Buffer.
343 while (BufferBitSize < DstBitSize) {
344 Constant *Element = C->getAggregateElement(SrcElt++);
345 if (!Element) // Reject constantexpr elements
346 return ConstantExpr::getBitCast(C, DestTy);
347
348 // Shift Buffer & Masks to fit next SrcElt.
349 if (!isLittleEndian) {
350 Buffer <<= SrcBitSize;
351 UndefMask <<= SrcBitSize;
352 PoisonMask <<= SrcBitSize;
353 }
354
355 APInt SrcValue;
356 unsigned BitPosition = isLittleEndian ? BufferBitSize : 0;
357 if (isa<UndefValue>(Element)) {
358 // Set masks fragments bits.
359 UndefMask.setBits(BitPosition, BitPosition + SrcBitSize);
360 if (isa<PoisonValue>(Element))
361 PoisonMask.setBits(BitPosition, BitPosition + SrcBitSize);
362 SrcValue = APInt::getZero(DstBitSize);
363 } else {
364 auto *Src = dyn_cast<ConstantInt>(Element);
365 if (!Src)
366 return ConstantExpr::getBitCast(C, DestTy);
367 SrcValue = Src->getValue();
368 }
369
370 // Insert src element bits into Buffer on correct position.
371 Buffer.insertBits(SrcValue, BitPosition);
372 BufferBitSize += SrcBitSize;
373 }
374
375 // Create DstElts from Buffer.
376 while (BufferBitSize >= DstBitSize) {
377 unsigned ShiftAmt = isLittleEndian ? 0 : BufferBitSize - DstBitSize;
378 // Emit undef/poison, if all undef mask fragment bits are set.
379 if (UndefMask.extractBits(DstBitSize, ShiftAmt).isAllOnes()) {
380 // Push poison, if any bit in poison mask fragment is set.
381 if (!PoisonMask.extractBits(DstBitSize, ShiftAmt).isZero()) {
382 Result.push_back(PoisonValue::get(DstEltTy));
383 } else {
384 Result.push_back(UndefValue::get(DstEltTy));
385 }
386 } else {
387 // Create and push DstElt.
388 APInt Elt = Buffer.extractBits(DstBitSize, ShiftAmt);
389 Result.push_back(ConstantInt::get(DstEltTy, Elt));
390 }
391
392 // Shift unused Buffer fragment to lower bits.
393 if (isLittleEndian) {
394 Buffer.lshrInPlace(DstBitSize);
395 UndefMask.lshrInPlace(DstBitSize);
396 PoisonMask.lshrInPlace(DstBitSize);
397 }
398 BufferBitSize -= DstBitSize;
399 }
400 }
401
402 // Restore destination lanes whose source bytes contained poison bits.
403 for (unsigned I : PoisonDstElts.set_bits())
404 Result[I] = PoisonValue::get(DstEltTy);
405
406 return ConstantVector::get(Result);
407}
408
409} // end anonymous namespace
410
411/// If this constant is a constant offset from a global, return the global and
412/// the constant. Because of constantexprs, this function is recursive.
414 APInt &Offset, const DataLayout &DL,
415 DSOLocalEquivalent **DSOEquiv) {
416 if (DSOEquiv)
417 *DSOEquiv = nullptr;
418
419 // Trivial case, constant is the global.
420 if ((GV = dyn_cast<GlobalValue>(C))) {
421 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
422 Offset = APInt(BitWidth, 0);
423 return true;
424 }
425
426 if (auto *FoundDSOEquiv = dyn_cast<DSOLocalEquivalent>(C)) {
427 if (DSOEquiv)
428 *DSOEquiv = FoundDSOEquiv;
429 GV = FoundDSOEquiv->getGlobalValue();
430 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
431 Offset = APInt(BitWidth, 0);
432 return true;
433 }
434
435 // Otherwise, if this isn't a constant expr, bail out.
436 auto *CE = dyn_cast<ConstantExpr>(C);
437 if (!CE) return false;
438
439 // Look through ptr->int and ptr->ptr casts.
440 if (CE->getOpcode() == Instruction::PtrToInt ||
441 CE->getOpcode() == Instruction::PtrToAddr)
442 return IsConstantOffsetFromGlobal(CE->getOperand(0), GV, Offset, DL,
443 DSOEquiv);
444
445 // i32* getelementptr ([5 x i32]* @a, i32 0, i32 5)
446 auto *GEP = dyn_cast<GEPOperator>(CE);
447 if (!GEP)
448 return false;
449
450 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
451 APInt TmpOffset(BitWidth, 0);
452
453 // If the base isn't a global+constant, we aren't either.
454 if (!IsConstantOffsetFromGlobal(CE->getOperand(0), GV, TmpOffset, DL,
455 DSOEquiv))
456 return false;
457
458 // Otherwise, add any offset that our operands provide.
459 if (!GEP->accumulateConstantOffset(DL, TmpOffset))
460 return false;
461
462 Offset = TmpOffset;
463 return true;
464}
465
467 const DataLayout &DL) {
468 do {
469 Type *SrcTy = C->getType();
470 if (SrcTy == DestTy)
471 return C;
472
473 TypeSize DestSize = DL.getTypeSizeInBits(DestTy);
474 TypeSize SrcSize = DL.getTypeSizeInBits(SrcTy);
475 if (!TypeSize::isKnownGE(SrcSize, DestSize))
476 return nullptr;
477
478 // Catch the obvious splat cases (since all-zeros can coerce non-integral
479 // pointers legally).
480 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
481 return Res;
482
483 // If the type sizes are the same and a cast is legal, just directly
484 // cast the constant.
485 // But be careful not to coerce non-integral pointers illegally.
486 if (SrcSize == DestSize &&
487 DL.isNonIntegralPointerType(SrcTy->getScalarType()) ==
488 DL.isNonIntegralPointerType(DestTy->getScalarType())) {
489 Instruction::CastOps Cast = Instruction::BitCast;
490 // If we are going from a pointer to int or vice versa, we spell the cast
491 // differently.
492 if (SrcTy->isIntegerTy() && DestTy->isPointerTy())
493 Cast = Instruction::IntToPtr;
494 else if (SrcTy->isPointerTy() && DestTy->isIntegerTy())
495 Cast = Instruction::PtrToInt;
496
497 if (CastInst::castIsValid(Cast, C, DestTy))
498 return ConstantFoldCastOperand(Cast, C, DestTy, DL);
499 }
500
501 // If this isn't an aggregate type, there is nothing we can do to drill down
502 // and find a bitcastable constant.
503 if (!SrcTy->isAggregateType() && !SrcTy->isVectorTy())
504 return nullptr;
505
506 // We're simulating a load through a pointer that was bitcast to point to
507 // a different type, so we can try to walk down through the initial
508 // elements of an aggregate to see if some part of the aggregate is
509 // castable to implement the "load" semantic model.
510 if (SrcTy->isStructTy()) {
511 // Struct types might have leading zero-length elements like [0 x i32],
512 // which are certainly not what we are looking for, so skip them.
513 unsigned Elem = 0;
514 Constant *ElemC;
515 do {
516 ElemC = C->getAggregateElement(Elem++);
517 } while (ElemC && DL.getTypeSizeInBits(ElemC->getType()).isZero());
518 C = ElemC;
519 } else {
520 // For non-byte-sized vector elements, the first element is not
521 // necessarily located at the vector base address.
522 if (auto *VT = dyn_cast<VectorType>(SrcTy))
523 if (!DL.typeSizeEqualsStoreSize(VT->getElementType()))
524 return nullptr;
525
526 C = C->getAggregateElement(0u);
527 }
528 } while (C);
529
530 return nullptr;
531}
532
533namespace {
534
535/// Recursive helper to read bits out of global. C is the constant being copied
536/// out of. ByteOffset is an offset into C. CurPtr is the pointer to copy
537/// results into and BytesLeft is the number of bytes left in
538/// the CurPtr buffer. DL is the DataLayout.
539bool ReadDataFromGlobal(Constant *C, uint64_t ByteOffset, unsigned char *CurPtr,
540 unsigned BytesLeft, const DataLayout &DL) {
541 assert(ByteOffset <= DL.getTypeAllocSize(C->getType()) &&
542 "Out of range access");
543
544 // Reading type padding, return zero.
545 if (ByteOffset >= DL.getTypeStoreSize(C->getType()))
546 return true;
547
548 // If this element is zero or undefined, we can just return since *CurPtr is
549 // zero initialized.
551 return true;
552
553 auto *CI = dyn_cast<ConstantInt>(C);
554 if (CI && CI->getType()->isIntegerTy()) {
555 if ((CI->getBitWidth() & 7) != 0)
556 return false;
557 const APInt &Val = CI->getValue();
558 unsigned IntBytes = unsigned(CI->getBitWidth()/8);
559
560 for (unsigned i = 0; i != BytesLeft && ByteOffset != IntBytes; ++i) {
561 unsigned n = ByteOffset;
562 if (!DL.isLittleEndian())
563 n = IntBytes - n - 1;
564 CurPtr[i] = Val.extractBits(8, n * 8).getZExtValue();
565 ++ByteOffset;
566 }
567 return true;
568 }
569
570 auto *CFP = dyn_cast<ConstantFP>(C);
571 if (CFP && CFP->getType()->isFloatingPointTy()) {
572 if (CFP->getType()->isDoubleTy()) {
573 C = FoldBitCast(C, Type::getInt64Ty(C->getContext()), DL);
574 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
575 }
576 if (CFP->getType()->isFloatTy()){
577 C = FoldBitCast(C, Type::getInt32Ty(C->getContext()), DL);
578 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
579 }
580 if (CFP->getType()->isHalfTy()){
581 C = FoldBitCast(C, Type::getInt16Ty(C->getContext()), DL);
582 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
583 }
584 return false;
585 }
586
587 if (auto *CS = dyn_cast<ConstantStruct>(C)) {
588 const StructLayout *SL = DL.getStructLayout(CS->getType());
589 unsigned Index = SL->getElementContainingOffset(ByteOffset);
590 uint64_t CurEltOffset = SL->getElementOffset(Index);
591 ByteOffset -= CurEltOffset;
592
593 while (true) {
594 // If the element access is to the element itself and not to tail padding,
595 // read the bytes from the element.
596 uint64_t EltSize = DL.getTypeAllocSize(CS->getOperand(Index)->getType());
597
598 if (ByteOffset < EltSize &&
599 !ReadDataFromGlobal(CS->getOperand(Index), ByteOffset, CurPtr,
600 BytesLeft, DL))
601 return false;
602
603 ++Index;
604
605 // Check to see if we read from the last struct element, if so we're done.
606 if (Index == CS->getType()->getNumElements())
607 return true;
608
609 // If we read all of the bytes we needed from this element we're done.
610 uint64_t NextEltOffset = SL->getElementOffset(Index);
611
612 if (BytesLeft <= NextEltOffset - CurEltOffset - ByteOffset)
613 return true;
614
615 // Move to the next element of the struct.
616 CurPtr += NextEltOffset - CurEltOffset - ByteOffset;
617 BytesLeft -= NextEltOffset - CurEltOffset - ByteOffset;
618 ByteOffset = 0;
619 CurEltOffset = NextEltOffset;
620 }
621 // not reached.
622 }
623
627 uint64_t NumElts, EltSize;
628 Type *EltTy;
629 if (auto *AT = dyn_cast<ArrayType>(C->getType())) {
630 NumElts = AT->getNumElements();
631 EltTy = AT->getElementType();
632 EltSize = DL.getTypeAllocSize(EltTy);
633 } else {
634 NumElts = cast<FixedVectorType>(C->getType())->getNumElements();
635 EltTy = cast<FixedVectorType>(C->getType())->getElementType();
636 // TODO: For non-byte-sized vectors, current implementation assumes there is
637 // padding to the next byte boundary between elements.
638 if (!DL.typeSizeEqualsStoreSize(EltTy))
639 return false;
640
641 EltSize = DL.getTypeStoreSize(EltTy);
642 }
643 uint64_t Index = ByteOffset / EltSize;
644 uint64_t Offset = ByteOffset - Index * EltSize;
645
646 for (; Index != NumElts; ++Index) {
647 if (!ReadDataFromGlobal(C->getAggregateElement(Index), Offset, CurPtr,
648 BytesLeft, DL))
649 return false;
650
651 uint64_t BytesWritten = EltSize - Offset;
652 assert(BytesWritten <= EltSize && "Not indexing into this element?");
653 if (BytesWritten >= BytesLeft)
654 return true;
655
656 Offset = 0;
657 BytesLeft -= BytesWritten;
658 CurPtr += BytesWritten;
659 }
660 return true;
661 }
662
663 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
664 if (CE->getOpcode() == Instruction::IntToPtr &&
665 CE->getOperand(0)->getType() == DL.getIntPtrType(CE->getType())) {
666 return ReadDataFromGlobal(CE->getOperand(0), ByteOffset, CurPtr,
667 BytesLeft, DL);
668 }
669 }
670
671 // Otherwise, unknown initializer type.
672 return false;
673}
674
675/// OrigLoadTy is the original type being loaded, while LoadTy is the type
676/// currently being folded (which may be integer type mapped from OrigLoadTy).
677Constant *FoldReinterpretLoadFromConst(Constant *C, Type *LoadTy,
678 Type *OrigLoadTy, int64_t Offset,
679 const DataLayout &DL) {
680 // Bail out early. Not expect to load from scalable global variable.
681 if (isa<ScalableVectorType>(LoadTy))
682 return nullptr;
683
684 auto *IntType = dyn_cast<IntegerType>(LoadTy);
685
686 // If this isn't an integer load we can't fold it directly.
687 if (!IntType) {
688 // If this is a non-integer load, we can try folding it as an int load and
689 // then bitcast the result. This can be useful for union cases. Note
690 // that address spaces don't matter here since we're not going to result in
691 // an actual new load.
692 if (!LoadTy->isFloatingPointTy() && !LoadTy->isPointerTy() &&
693 !LoadTy->isVectorTy())
694 return nullptr;
695
696 Type *MapTy = Type::getIntNTy(C->getContext(),
697 DL.getTypeSizeInBits(LoadTy).getFixedValue());
698 if (Constant *Res =
699 FoldReinterpretLoadFromConst(C, MapTy, OrigLoadTy, Offset, DL)) {
700 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
701 // Materializing a zero can be done trivially without a bitcast
702 return Constant::getNullValue(LoadTy);
703 Type *CastTy = LoadTy->isPtrOrPtrVectorTy() ? DL.getIntPtrType(LoadTy) : LoadTy;
704 Res = FoldBitCast(Res, CastTy, DL);
705 if (LoadTy->isPtrOrPtrVectorTy()) {
706 // For vector of pointer, we needed to first convert to a vector of integer, then do vector inttoptr
707 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
708 return Constant::getNullValue(LoadTy);
709 if (DL.isNonIntegralPointerType(LoadTy->getScalarType()))
710 // Be careful not to replace a load of an addrspace value with an inttoptr here
711 return nullptr;
712 Res = ConstantExpr::getIntToPtr(Res, LoadTy);
713 }
714 return Res;
715 }
716 return nullptr;
717 }
718
719 unsigned BytesLoaded = (IntType->getBitWidth() + 7) / 8;
720 // Allow folding of large type loads (e.g. <16 x double>).
721 if (BytesLoaded > 128 || BytesLoaded == 0)
722 return nullptr;
723
724 // For scalar integer load, use smaller limit to avoid regression during
725 // memcmp expansion. Codegen may generate inefficient string operations.
726 if (BytesLoaded > 32 && OrigLoadTy->isIntegerTy())
727 return nullptr;
728
729 // If we're not accessing anything in this constant, the result is undefined.
730 if (Offset <= -1 * static_cast<int64_t>(BytesLoaded))
731 return PoisonValue::get(IntType);
732
733 // TODO: We should be able to support scalable types.
734 TypeSize InitializerSize = DL.getTypeAllocSize(C->getType());
735 if (InitializerSize.isScalable())
736 return nullptr;
737
738 // If we're not accessing anything in this constant, the result is undefined.
739 if (Offset >= (int64_t)InitializerSize.getFixedValue())
740 return PoisonValue::get(IntType);
741
742 SmallVector<unsigned char, 64> RawBytes(BytesLoaded);
743 unsigned char *CurPtr = RawBytes.data();
744 unsigned BytesLeft = BytesLoaded;
745
746 // If we're loading off the beginning of the global, some bytes may be valid.
747 if (Offset < 0) {
748 CurPtr += -Offset;
749 BytesLeft += Offset;
750 Offset = 0;
751 }
752
753 if (!ReadDataFromGlobal(C, Offset, CurPtr, BytesLeft, DL))
754 return nullptr;
755
756 APInt ResultVal = APInt(IntType->getBitWidth(), 0);
757 if (DL.isLittleEndian()) {
758 ResultVal = RawBytes[BytesLoaded - 1];
759 for (unsigned i = 1; i != BytesLoaded; ++i) {
760 ResultVal <<= 8;
761 ResultVal |= RawBytes[BytesLoaded - 1 - i];
762 }
763 } else {
764 ResultVal = RawBytes[0];
765 for (unsigned i = 1; i != BytesLoaded; ++i) {
766 ResultVal <<= 8;
767 ResultVal |= RawBytes[i];
768 }
769 }
770
771 return ConstantInt::get(IntType->getContext(), ResultVal);
772}
773
774} // anonymous namespace
775
776// If GV is a constant with an initializer read its representation starting
777// at Offset and return it as a constant array of unsigned char. Otherwise
778// return null.
781 if (!GV->isConstant() || !GV->hasDefinitiveInitializer())
782 return nullptr;
783
784 const DataLayout &DL = GV->getDataLayout();
785 Constant *Init = const_cast<Constant *>(GV->getInitializer());
786 TypeSize InitSize = DL.getTypeAllocSize(Init->getType());
787 if (InitSize < Offset)
788 return nullptr;
789
790 uint64_t NBytes = InitSize - Offset;
791 if (NBytes > UINT16_MAX)
792 // Bail for large initializers in excess of 64K to avoid allocating
793 // too much memory.
794 // Offset is assumed to be less than or equal than InitSize (this
795 // is enforced in ReadDataFromGlobal).
796 return nullptr;
797
798 SmallVector<unsigned char, 256> RawBytes(static_cast<size_t>(NBytes));
799 unsigned char *CurPtr = RawBytes.data();
800
801 if (!ReadDataFromGlobal(Init, Offset, CurPtr, NBytes, DL))
802 return nullptr;
803
804 return ConstantDataArray::get(GV->getContext(), RawBytes);
805}
806
807/// If this Offset points exactly to the start of an aggregate element, return
808/// that element, otherwise return nullptr.
810 const DataLayout &DL) {
811 if (Offset.isZero())
812 return Base;
813
815 return nullptr;
816
817 Type *ElemTy = Base->getType();
818 SmallVector<APInt> Indices = DL.getGEPIndicesForOffset(ElemTy, Offset);
819 if (!Offset.isZero() || !Indices[0].isZero())
820 return nullptr;
821
822 Constant *C = Base;
823 for (const APInt &Index : drop_begin(Indices)) {
824 if (Index.isNegative() || Index.getActiveBits() >= 32)
825 return nullptr;
826
827 C = C->getAggregateElement(Index.getZExtValue());
828 if (!C)
829 return nullptr;
830 }
831
832 return C;
833}
834
836 const APInt &Offset,
837 const DataLayout &DL) {
838 if (Constant *AtOffset = getConstantAtOffset(C, Offset, DL))
839 if (Constant *Result = ConstantFoldLoadThroughBitcast(AtOffset, Ty, DL))
840 return Result;
841
842 // Explicitly check for out-of-bounds access, so we return poison even if the
843 // constant is a uniform value.
844 TypeSize Size = DL.getTypeAllocSize(C->getType());
845 if (!Size.isScalable() && Offset.sge(Size.getFixedValue()))
846 return PoisonValue::get(Ty);
847
848 // Try an offset-independent fold of a uniform value.
849 if (Constant *Result = ConstantFoldLoadFromUniformValue(C, Ty, DL))
850 return Result;
851
852 // Try hard to fold loads from bitcasted strange and non-type-safe things.
853 if (Offset.getSignificantBits() <= 64)
854 if (Constant *Result =
855 FoldReinterpretLoadFromConst(C, Ty, Ty, Offset.getSExtValue(), DL))
856 return Result;
857
858 return nullptr;
859}
860
865
868 const DataLayout &DL) {
869 // We can only fold loads from constant globals with a definitive initializer.
870 // Check this upfront, to skip expensive offset calculations.
872 if (!GV || !GV->isConstant() || !GV->hasDefinitiveInitializer())
873 return nullptr;
874
875 C = cast<Constant>(C->stripAndAccumulateConstantOffsets(
876 DL, Offset, /* AllowNonInbounds */ true));
877
878 if (C == GV)
879 if (Constant *Result = ConstantFoldLoadFromConst(GV->getInitializer(), Ty,
880 Offset, DL))
881 return Result;
882
883 // If this load comes from anywhere in a uniform constant global, the value
884 // is always the same, regardless of the loaded offset.
885 return ConstantFoldLoadFromUniformValue(GV->getInitializer(), Ty, DL);
886}
887
889 const DataLayout &DL) {
890 APInt Offset(DL.getIndexTypeSizeInBits(C->getType()), 0);
891 return ConstantFoldLoadFromConstPtr(C, Ty, std::move(Offset), DL);
892}
893
895 const DataLayout &DL) {
896 if (isa<PoisonValue>(C))
897 return PoisonValue::get(Ty);
898 if (isa<UndefValue>(C))
899 return UndefValue::get(Ty);
900 // If padding is needed when storing C to memory, then it isn't considered as
901 // uniform.
902 if (!DL.typeSizeEqualsStoreSize(C->getType()))
903 return nullptr;
904 if (C->isNullValue() && !Ty->isX86_AMXTy())
905 return Constant::getNullValue(Ty);
906 if (C->isAllOnesValue() &&
907 (Ty->isIntOrIntVectorTy() || Ty->isFPOrFPVectorTy()))
908 return Constant::getAllOnesValue(Ty);
909 return nullptr;
910}
911
912namespace {
913
914/// One of Op0/Op1 is a constant expression.
915/// Attempt to symbolically evaluate the result of a binary operator merging
916/// these together. If target data info is available, it is provided as DL,
917/// otherwise DL is null.
918Constant *SymbolicallyEvaluateBinop(unsigned Opc, Constant *Op0, Constant *Op1,
919 const DataLayout &DL) {
920 // SROA
921
922 // Fold (and 0xffffffff00000000, (shl x, 32)) -> shl.
923 // Fold (lshr (or X, Y), 32) -> (lshr [X/Y], 32) if one doesn't contribute
924 // bits.
925
926 if (Opc == Instruction::And) {
927 KnownBits Known0 = computeKnownBits(Op0, DL);
928 KnownBits Known1 = computeKnownBits(Op1, DL);
929 if ((Known1.One | Known0.Zero).isAllOnes()) {
930 // All the bits of Op0 that the 'and' could be masking are already zero.
931 return Op0;
932 }
933 if ((Known0.One | Known1.Zero).isAllOnes()) {
934 // All the bits of Op1 that the 'and' could be masking are already zero.
935 return Op1;
936 }
937
938 Known0 &= Known1;
939 if (Known0.isConstant())
940 return ConstantInt::get(Op0->getType(), Known0.getConstant());
941 }
942
943 // If the constant expr is something like &A[123] - &A[4].f, fold this into a
944 // constant. This happens frequently when iterating over a global array.
945 if (Opc == Instruction::Sub) {
946 GlobalValue *GV1, *GV2;
947 APInt Offs1, Offs2;
948
949 if (IsConstantOffsetFromGlobal(Op0, GV1, Offs1, DL))
950 if (IsConstantOffsetFromGlobal(Op1, GV2, Offs2, DL) && GV1 == GV2) {
951 unsigned OpSize = DL.getTypeSizeInBits(Op0->getType());
952
953 // (&GV+C1) - (&GV+C2) -> C1-C2, pointer arithmetic cannot overflow.
954 // PtrToInt may change the bitwidth so we have convert to the right size
955 // first.
956 return ConstantInt::get(Op0->getType(), Offs1.zextOrTrunc(OpSize) -
957 Offs2.zextOrTrunc(OpSize));
958 }
959 }
960
961 return nullptr;
962}
963
964/// If array indices are not pointer-sized integers, explicitly cast them so
965/// that they aren't implicitly casted by the getelementptr.
966Constant *CastGEPIndices(Type *SrcElemTy, ArrayRef<Constant *> Ops,
967 Type *ResultTy, GEPNoWrapFlags NW,
968 std::optional<ConstantRange> InRange,
969 const DataLayout &DL, const TargetLibraryInfo *TLI) {
970 Type *IntIdxTy = DL.getIndexType(ResultTy);
971 Type *IntIdxScalarTy = IntIdxTy->getScalarType();
972
973 bool Any = false;
975 for (unsigned i = 1, e = Ops.size(); i != e; ++i) {
976 if ((i == 1 ||
978 SrcElemTy, Ops.slice(1, i - 1)))) &&
979 Ops[i]->getType()->getScalarType() != IntIdxScalarTy) {
980 Any = true;
981 Type *NewType =
982 Ops[i]->getType()->isVectorTy() ? IntIdxTy : IntIdxScalarTy;
984 CastInst::getCastOpcode(Ops[i], true, NewType, true), Ops[i], NewType,
985 DL);
986 if (!NewIdx)
987 return nullptr;
988 NewIdxs.push_back(NewIdx);
989 } else
990 NewIdxs.push_back(Ops[i]);
991 }
992
993 if (!Any)
994 return nullptr;
995
996 Constant *C =
997 ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], NewIdxs, NW, InRange);
998 return ConstantFoldConstant(C, DL, TLI);
999}
1000
1001/// If we can symbolically evaluate the GEP constant expression, do so.
1002Constant *SymbolicallyEvaluateGEP(const GEPOperator *GEP,
1004 const DataLayout &DL,
1005 const TargetLibraryInfo *TLI) {
1006 Type *SrcElemTy = GEP->getSourceElementType();
1007 Type *ResTy = GEP->getType();
1008 if (!SrcElemTy->isSized() || isa<ScalableVectorType>(SrcElemTy))
1009 return nullptr;
1010
1011 if (Constant *C = CastGEPIndices(SrcElemTy, Ops, ResTy, GEP->getNoWrapFlags(),
1012 GEP->getInRange(), DL, TLI))
1013 return C;
1014
1015 Constant *Ptr = Ops[0];
1016 if (!Ptr->getType()->isPointerTy())
1017 return nullptr;
1018
1019 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1020
1021 for (unsigned i = 1, e = Ops.size(); i != e; ++i)
1022 if (!isa<ConstantInt>(Ops[i]) || !Ops[i]->getType()->isIntegerTy())
1023 return nullptr;
1024
1025 unsigned BitWidth = DL.getTypeSizeInBits(IntIdxTy);
1026 APInt Offset = APInt(
1027 BitWidth,
1028 DL.getIndexedOffsetInType(
1029 SrcElemTy, ArrayRef((Value *const *)Ops.data() + 1, Ops.size() - 1)),
1030 /*isSigned=*/true, /*implicitTrunc=*/true);
1031
1032 std::optional<ConstantRange> InRange = GEP->getInRange();
1033 if (InRange)
1034 InRange = InRange->sextOrTrunc(BitWidth);
1035
1036 // If this is a GEP of a GEP, fold it all into a single GEP.
1037 GEPNoWrapFlags NW = GEP->getNoWrapFlags();
1038 bool Overflow = false;
1039 while (auto *GEP = dyn_cast<GEPOperator>(Ptr)) {
1040 NW &= GEP->getNoWrapFlags();
1041
1042 SmallVector<Value *, 4> NestedOps(llvm::drop_begin(GEP->operands()));
1043
1044 // Do not try the incorporate the sub-GEP if some index is not a number.
1045 bool AllConstantInt = true;
1046 for (Value *NestedOp : NestedOps)
1047 if (!isa<ConstantInt>(NestedOp)) {
1048 AllConstantInt = false;
1049 break;
1050 }
1051 if (!AllConstantInt)
1052 break;
1053
1054 // Adjust inrange offset and intersect inrange attributes
1055 if (auto GEPRange = GEP->getInRange()) {
1056 auto AdjustedGEPRange = GEPRange->sextOrTrunc(BitWidth).subtract(Offset);
1057 InRange =
1058 InRange ? InRange->intersectWith(AdjustedGEPRange) : AdjustedGEPRange;
1059 }
1060
1061 Ptr = cast<Constant>(GEP->getOperand(0));
1062 SrcElemTy = GEP->getSourceElementType();
1063 Offset = Offset.sadd_ov(
1064 APInt(BitWidth, DL.getIndexedOffsetInType(SrcElemTy, NestedOps),
1065 /*isSigned=*/true, /*implicitTrunc=*/true),
1066 Overflow);
1067 }
1068
1069 // Preserving nusw (without inbounds) also requires that the offset
1070 // additions did not overflow.
1071 if (NW.hasNoUnsignedSignedWrap() && !NW.isInBounds() && Overflow)
1073
1074 // If the base value for this address is a literal integer value, fold the
1075 // getelementptr to the resulting integer value casted to the pointer type.
1076 APInt BaseIntVal(DL.getPointerTypeSizeInBits(Ptr->getType()), 0);
1077 if (auto *CE = dyn_cast<ConstantExpr>(Ptr)) {
1078 if (CE->getOpcode() == Instruction::IntToPtr) {
1079 if (auto *Base = dyn_cast<ConstantInt>(CE->getOperand(0)))
1080 BaseIntVal = Base->getValue().zextOrTrunc(BaseIntVal.getBitWidth());
1081 }
1082 }
1083
1084 if ((Ptr->isNullValue() || BaseIntVal != 0) &&
1085 !DL.mustNotIntroduceIntToPtr(Ptr->getType())) {
1086
1087 // If the index size is smaller than the pointer size, add to the low
1088 // bits only.
1089 BaseIntVal.insertBits(BaseIntVal.trunc(BitWidth) + Offset, 0);
1090 Constant *C = ConstantInt::get(Ptr->getContext(), BaseIntVal);
1091 return ConstantExpr::getIntToPtr(C, ResTy);
1092 }
1093
1094 // Try to infer inbounds for GEPs of globals.
1095 if (!NW.isInBounds() && Offset.isNonNegative()) {
1096 bool CanBeNull, CanBeFreed;
1097 uint64_t DerefBytes =
1098 Ptr->getPointerDereferenceableBytes(DL, CanBeNull, CanBeFreed);
1099 if (DerefBytes != 0 && !CanBeNull && Offset.sle(DerefBytes))
1101 }
1102
1103 // nusw + nneg -> nuw
1104 if (NW.hasNoUnsignedSignedWrap() && Offset.isNonNegative())
1106
1107 // Otherwise canonicalize this to a single ptradd.
1108 LLVMContext &Ctx = Ptr->getContext();
1109 return ConstantExpr::getPtrAdd(Ptr, ConstantInt::get(Ctx, Offset), NW,
1110 InRange);
1111}
1112
1113/// Attempt to constant fold an instruction with the
1114/// specified opcode and operands. If successful, the constant result is
1115/// returned, if not, null is returned. Note that this function can fail when
1116/// attempting to fold instructions like loads and stores, which have no
1117/// constant expression form.
1118Constant *ConstantFoldInstOperandsImpl(const Value *InstOrCE, unsigned Opcode,
1120 const DataLayout &DL,
1121 const TargetLibraryInfo *TLI,
1122 bool AllowNonDeterministic) {
1123 Type *DestTy = InstOrCE->getType();
1124
1125 if (Instruction::isUnaryOp(Opcode))
1126 return ConstantFoldUnaryOpOperand(Opcode, Ops[0], DL);
1127
1128 if (Instruction::isBinaryOp(Opcode)) {
1129 switch (Opcode) {
1130 default:
1131 break;
1132 case Instruction::FAdd:
1133 case Instruction::FSub:
1134 case Instruction::FMul:
1135 case Instruction::FDiv:
1136 case Instruction::FRem:
1137 // Handle floating point instructions separately to account for denormals
1138 // TODO: If a constant expression is being folded rather than an
1139 // instruction, denormals will not be flushed/treated as zero
1140 if (const auto *I = dyn_cast<Instruction>(InstOrCE)) {
1141 return ConstantFoldFPInstOperands(Opcode, Ops[0], Ops[1], DL, I,
1142 AllowNonDeterministic);
1143 }
1144 }
1145 return ConstantFoldBinaryOpOperands(Opcode, Ops[0], Ops[1], DL);
1146 }
1147
1148 if (Instruction::isCast(Opcode))
1149 return ConstantFoldCastOperand(Opcode, Ops[0], DestTy, DL);
1150
1151 if (auto *GEP = dyn_cast<GEPOperator>(InstOrCE)) {
1152 Type *SrcElemTy = GEP->getSourceElementType();
1154 return nullptr;
1155
1156 if (Constant *C = SymbolicallyEvaluateGEP(GEP, Ops, DL, TLI))
1157 return C;
1158
1159 return ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], Ops.slice(1),
1160 GEP->getNoWrapFlags(),
1161 GEP->getInRange());
1162 }
1163
1164 if (auto *CE = dyn_cast<ConstantExpr>(InstOrCE))
1165 return CE->getWithOperands(Ops);
1166
1167 switch (Opcode) {
1168 default: return nullptr;
1169 case Instruction::ICmp:
1170 case Instruction::FCmp: {
1171 auto *C = cast<CmpInst>(InstOrCE);
1172 return ConstantFoldCompareInstOperands(C->getPredicate(), Ops[0], Ops[1],
1173 DL, TLI, C);
1174 }
1175 case Instruction::Freeze:
1176 return isGuaranteedNotToBeUndefOrPoison(Ops[0]) ? Ops[0] : nullptr;
1177 case Instruction::Call:
1178 if (auto *F = dyn_cast<Function>(Ops.back())) {
1179 const auto *Call = cast<CallBase>(InstOrCE);
1181 return ConstantFoldCall(Call, F, Ops.slice(0, Ops.size() - 1), TLI,
1182 AllowNonDeterministic);
1183 }
1184 return nullptr;
1185 case Instruction::Select:
1186 return ConstantFoldSelectInstruction(Ops[0], Ops[1], Ops[2]);
1187 case Instruction::ExtractElement:
1189 case Instruction::ExtractValue:
1191 Ops[0], cast<ExtractValueInst>(InstOrCE)->getIndices());
1192 case Instruction::InsertElement:
1193 return ConstantExpr::getInsertElement(Ops[0], Ops[1], Ops[2]);
1194 case Instruction::InsertValue:
1196 Ops[0], Ops[1], cast<InsertValueInst>(InstOrCE)->getIndices());
1197 case Instruction::ShuffleVector:
1199 Ops[0], Ops[1], cast<ShuffleVectorInst>(InstOrCE)->getShuffleMask());
1200 case Instruction::Load: {
1201 const auto *LI = dyn_cast<LoadInst>(InstOrCE);
1202 if (LI->isVolatile())
1203 return nullptr;
1204 return ConstantFoldLoadFromConstPtr(Ops[0], LI->getType(), DL);
1205 }
1206 }
1207}
1208
1209} // end anonymous namespace
1210
1211//===----------------------------------------------------------------------===//
1212// Constant Folding public APIs
1213//===----------------------------------------------------------------------===//
1214
1215namespace {
1216
1217Constant *
1218ConstantFoldConstantImpl(const Constant *C, const DataLayout &DL,
1219 const TargetLibraryInfo *TLI,
1222 return const_cast<Constant *>(C);
1223
1225 for (const Use &OldU : C->operands()) {
1226 Constant *OldC = cast<Constant>(&OldU);
1227 Constant *NewC = OldC;
1228 // Recursively fold the ConstantExpr's operands. If we have already folded
1229 // a ConstantExpr, we don't have to process it again.
1230 if (isa<ConstantVector>(OldC) || isa<ConstantExpr>(OldC)) {
1231 auto It = FoldedOps.find(OldC);
1232 if (It == FoldedOps.end()) {
1233 NewC = ConstantFoldConstantImpl(OldC, DL, TLI, FoldedOps);
1234 FoldedOps.insert({OldC, NewC});
1235 } else {
1236 NewC = It->second;
1237 }
1238 }
1239 Ops.push_back(NewC);
1240 }
1241
1242 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1243 if (Constant *Res = ConstantFoldInstOperandsImpl(
1244 CE, CE->getOpcode(), Ops, DL, TLI, /*AllowNonDeterministic=*/true))
1245 return Res;
1246 return const_cast<Constant *>(C);
1247 }
1248
1250 return ConstantVector::get(Ops);
1251}
1252
1253} // end anonymous namespace
1254
1256 const DataLayout &DL,
1257 const TargetLibraryInfo *TLI) {
1258 // Handle PHI nodes quickly here...
1259 if (auto *PN = dyn_cast<PHINode>(I)) {
1260 Constant *CommonValue = nullptr;
1261
1263 for (Value *Incoming : PN->incoming_values()) {
1264 // If the incoming value is undef then skip it. Note that while we could
1265 // skip the value if it is equal to the phi node itself we choose not to
1266 // because that would break the rule that constant folding only applies if
1267 // all operands are constants.
1268 if (isa<UndefValue>(Incoming))
1269 continue;
1270 // If the incoming value is not a constant, then give up.
1271 auto *C = dyn_cast<Constant>(Incoming);
1272 if (!C)
1273 return nullptr;
1274 // Fold the PHI's operands.
1275 C = ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1276 // If the incoming value is a different constant to
1277 // the one we saw previously, then give up.
1278 if (CommonValue && C != CommonValue)
1279 return nullptr;
1280 CommonValue = C;
1281 }
1282
1283 // If we reach here, all incoming values are the same constant or undef.
1284 return CommonValue ? CommonValue : UndefValue::get(PN->getType());
1285 }
1286
1287 // Scan the operand list, checking to see if they are all constants, if so,
1288 // hand off to ConstantFoldInstOperandsImpl.
1289 if (!all_of(I->operands(), [](const Use &U) { return isa<Constant>(U); }))
1290 return nullptr;
1291
1294 for (const Use &OpU : I->operands()) {
1295 auto *Op = cast<Constant>(&OpU);
1296 // Fold the Instruction's operands.
1297 Op = ConstantFoldConstantImpl(Op, DL, TLI, FoldedOps);
1298 Ops.push_back(Op);
1299 }
1300
1301 return ConstantFoldInstOperands(I, Ops, DL, TLI);
1302}
1303
1305 const TargetLibraryInfo *TLI) {
1307 return ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1308}
1309
1312 const DataLayout &DL,
1313 const TargetLibraryInfo *TLI,
1314 bool AllowNonDeterministic) {
1315 return ConstantFoldInstOperandsImpl(I, I->getOpcode(), Ops, DL, TLI,
1316 AllowNonDeterministic);
1317}
1318
1320 unsigned IntPredicate, Constant *Ops0, Constant *Ops1, const DataLayout &DL,
1321 const TargetLibraryInfo *TLI, const Instruction *I) {
1322 CmpInst::Predicate Predicate = (CmpInst::Predicate)IntPredicate;
1323 // fold: icmp (inttoptr x), null -> icmp x, 0
1324 // fold: icmp null, (inttoptr x) -> icmp 0, x
1325 // fold: icmp (ptrtoint x), 0 -> icmp x, null
1326 // fold: icmp 0, (ptrtoint x) -> icmp null, x
1327 // fold: icmp (inttoptr x), (inttoptr y) -> icmp trunc/zext x, trunc/zext y
1328 // fold: icmp (ptrtoint x), (ptrtoint y) -> icmp x, y
1329 //
1330 // FIXME: The following comment is out of data and the DataLayout is here now.
1331 // ConstantExpr::getCompare cannot do this, because it doesn't have DL
1332 // around to know if bit truncation is happening.
1333 if (auto *CE0 = dyn_cast<ConstantExpr>(Ops0)) {
1334 if (Ops1->isNullValue()) {
1335 if (CE0->getOpcode() == Instruction::IntToPtr) {
1336 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1337 // Convert the integer value to the right size to ensure we get the
1338 // proper extension or truncation.
1339 if (Constant *C = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1340 /*IsSigned*/ false, DL)) {
1341 Constant *Null = Constant::getNullValue(C->getType());
1342 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1343 }
1344 }
1345
1346 // icmp only compares the address part of the pointer, so only do this
1347 // transform if the integer size matches the address size.
1348 if (CE0->getOpcode() == Instruction::PtrToInt ||
1349 CE0->getOpcode() == Instruction::PtrToAddr) {
1350 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1351 if (CE0->getType() == AddrTy) {
1352 Constant *C = CE0->getOperand(0);
1353 Constant *Null = Constant::getNullValue(C->getType());
1354 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1355 }
1356 }
1357 }
1358
1359 if (auto *CE1 = dyn_cast<ConstantExpr>(Ops1)) {
1360 if (CE0->getOpcode() == CE1->getOpcode()) {
1361 if (CE0->getOpcode() == Instruction::IntToPtr) {
1362 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1363
1364 // Convert the integer value to the right size to ensure we get the
1365 // proper extension or truncation.
1366 Constant *C0 = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1367 /*IsSigned*/ false, DL);
1368 Constant *C1 = ConstantFoldIntegerCast(CE1->getOperand(0), IntPtrTy,
1369 /*IsSigned*/ false, DL);
1370 if (C0 && C1)
1371 return ConstantFoldCompareInstOperands(Predicate, C0, C1, DL, TLI);
1372 }
1373
1374 // icmp only compares the address part of the pointer, so only do this
1375 // transform if the integer size matches the address size.
1376 if (CE0->getOpcode() == Instruction::PtrToInt ||
1377 CE0->getOpcode() == Instruction::PtrToAddr) {
1378 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1379 if (CE0->getType() == AddrTy &&
1380 CE0->getOperand(0)->getType() == CE1->getOperand(0)->getType()) {
1382 Predicate, CE0->getOperand(0), CE1->getOperand(0), DL, TLI);
1383 }
1384 }
1385 }
1386 }
1387
1388 // Convert pointer comparison (base+offset1) pred (base+offset2) into
1389 // offset1 pred offset2, for the case where the offset is inbounds. This
1390 // only works for equality and unsigned comparison, as inbounds permits
1391 // crossing the sign boundary. However, the offset comparison itself is
1392 // signed.
1393 if (Ops0->getType()->isPointerTy() && !ICmpInst::isSigned(Predicate)) {
1394 unsigned IndexWidth = DL.getIndexTypeSizeInBits(Ops0->getType());
1395 APInt Offset0(IndexWidth, 0);
1396 bool IsEqPred = ICmpInst::isEquality(Predicate);
1397 Value *Stripped0 = Ops0->stripAndAccumulateConstantOffsets(
1398 DL, Offset0, /*AllowNonInbounds=*/IsEqPred,
1399 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1400 /*LookThroughIntToPtr=*/IsEqPred);
1401 APInt Offset1(IndexWidth, 0);
1402 Value *Stripped1 = Ops1->stripAndAccumulateConstantOffsets(
1403 DL, Offset1, /*AllowNonInbounds=*/IsEqPred,
1404 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1405 /*LookThroughIntToPtr=*/IsEqPred);
1406 if (Stripped0 == Stripped1)
1407 return ConstantInt::getBool(
1408 Ops0->getContext(),
1409 ICmpInst::compare(Offset0, Offset1,
1410 ICmpInst::getSignedPredicate(Predicate)));
1411 }
1412 } else if (isa<ConstantExpr>(Ops1)) {
1413 // If RHS is a constant expression, but the left side isn't, swap the
1414 // operands and try again.
1415 Predicate = ICmpInst::getSwappedPredicate(Predicate);
1416 return ConstantFoldCompareInstOperands(Predicate, Ops1, Ops0, DL, TLI);
1417 }
1418
1419 if (CmpInst::isFPPredicate(Predicate)) {
1420 // Flush any denormal constant float input according to denormal handling
1421 // mode.
1422 Ops0 = FlushFPConstant(Ops0, I, /*IsOutput=*/false);
1423 if (!Ops0)
1424 return nullptr;
1425 Ops1 = FlushFPConstant(Ops1, I, /*IsOutput=*/false);
1426 if (!Ops1)
1427 return nullptr;
1428 }
1429
1430 return ConstantFoldCompareInstruction(Predicate, Ops0, Ops1);
1431}
1432
1434 const DataLayout &DL) {
1436
1437 return ConstantFoldUnaryInstruction(Opcode, Op);
1438}
1439
1441 Constant *RHS,
1442 const DataLayout &DL) {
1444 if (isa<ConstantExpr>(LHS) || isa<ConstantExpr>(RHS))
1445 if (Constant *C = SymbolicallyEvaluateBinop(Opcode, LHS, RHS, DL))
1446 return C;
1447
1449 return ConstantExpr::get(Opcode, LHS, RHS);
1450 return ConstantFoldBinaryInstruction(Opcode, LHS, RHS);
1451}
1452
1455 switch (Mode) {
1457 return nullptr;
1458 case DenormalMode::IEEE:
1459 return ConstantFP::get(Ty, APF);
1461 return ConstantFP::get(
1462 Ty, APFloat::getZero(APF.getSemantics(), APF.isNegative()));
1464 return ConstantFP::get(Ty, APFloat::getZero(APF.getSemantics(), false));
1465 default:
1466 break;
1467 }
1468
1469 llvm_unreachable("unknown denormal mode");
1470}
1471
1472/// Return the denormal mode that can be assumed when executing a floating point
1473/// operation at \p CtxI.
1475 if (!CtxI || !CtxI->getParent() || !CtxI->getFunction())
1476 return DenormalMode::getDynamic();
1477 return CtxI->getFunction()->getDenormalMode(
1478 Ty->getScalarType()->getFltSemantics());
1479}
1480
1482 const Instruction *Inst,
1483 bool IsOutput) {
1484 const APFloat &APF = CFP->getValueAPF();
1485 if (!APF.isDenormal())
1486 return CFP;
1487
1489 return flushDenormalConstant(CFP->getType(), APF,
1490 IsOutput ? Mode.Output : Mode.Input);
1491}
1492
1494 bool IsOutput) {
1495 if (ConstantFP *CFP = dyn_cast<ConstantFP>(Operand))
1496 return flushDenormalConstantFP(CFP, Inst, IsOutput);
1497
1499 return Operand;
1500
1501 Type *Ty = Operand->getType();
1502 VectorType *VecTy = dyn_cast<VectorType>(Ty);
1503 if (VecTy) {
1504 if (auto *Splat = dyn_cast_or_null<ConstantFP>(Operand->getSplatValue())) {
1505 Constant *Folded = flushDenormalConstantFP(Splat, Inst, IsOutput);
1506 if (!Folded)
1507 return nullptr;
1508 return ConstantVector::getSplat(VecTy->getElementCount(), Folded);
1509 }
1510
1511 Ty = VecTy->getElementType();
1512 }
1513
1514 if (isa<ConstantExpr>(Operand))
1515 return Operand;
1516
1517 if (const auto *CV = dyn_cast<ConstantVector>(Operand)) {
1519 for (unsigned i = 0, e = CV->getNumOperands(); i != e; ++i) {
1520 Constant *Element = CV->getAggregateElement(i);
1521 if (isa<UndefValue>(Element)) {
1522 NewElts.push_back(Element);
1523 continue;
1524 }
1525
1526 ConstantFP *CFP = dyn_cast<ConstantFP>(Element);
1527 if (!CFP)
1528 return nullptr;
1529
1530 Constant *Folded = flushDenormalConstantFP(CFP, Inst, IsOutput);
1531 if (!Folded)
1532 return nullptr;
1533 NewElts.push_back(Folded);
1534 }
1535
1536 return ConstantVector::get(NewElts);
1537 }
1538
1539 if (const auto *CDV = dyn_cast<ConstantDataVector>(Operand)) {
1541 for (unsigned I = 0, E = CDV->getNumElements(); I < E; ++I) {
1542 const APFloat &Elt = CDV->getElementAsAPFloat(I);
1543 if (!Elt.isDenormal()) {
1544 NewElts.push_back(ConstantFP::get(Ty, Elt));
1545 } else {
1546 DenormalMode Mode = getInstrDenormalMode(Inst, Ty);
1547 Constant *Folded =
1548 flushDenormalConstant(Ty, Elt, IsOutput ? Mode.Output : Mode.Input);
1549 if (!Folded)
1550 return nullptr;
1551 NewElts.push_back(Folded);
1552 }
1553 }
1554
1555 return ConstantVector::get(NewElts);
1556 }
1557
1558 return nullptr;
1559}
1560
1562 Constant *RHS, const DataLayout &DL,
1563 const Instruction *I,
1564 bool AllowNonDeterministic) {
1565 if (Instruction::isBinaryOp(Opcode)) {
1566 // Flush denormal inputs if needed.
1567 Constant *Op0 = FlushFPConstant(LHS, I, /* IsOutput */ false);
1568 if (!Op0)
1569 return nullptr;
1570 Constant *Op1 = FlushFPConstant(RHS, I, /* IsOutput */ false);
1571 if (!Op1)
1572 return nullptr;
1573
1574 // If nsz or an algebraic FMF flag is set, the result of the FP operation
1575 // may change due to future optimization. Don't constant fold them if
1576 // non-deterministic results are not allowed.
1577 if (!AllowNonDeterministic)
1579 if (FP->hasNoSignedZeros() || FP->hasAllowReassoc() ||
1580 FP->hasAllowContract() || FP->hasAllowReciprocal())
1581 return nullptr;
1582
1583 // Calculate constant result.
1584 Constant *C = ConstantFoldBinaryOpOperands(Opcode, Op0, Op1, DL);
1585 if (!C)
1586 return nullptr;
1587
1588 // Flush denormal output if needed.
1589 C = FlushFPConstant(C, I, /* IsOutput */ true);
1590 if (!C)
1591 return nullptr;
1592
1593 // The precise NaN value is non-deterministic.
1594 if (!AllowNonDeterministic && C->isNaN())
1595 return nullptr;
1596
1597 return C;
1598 }
1599 // If instruction lacks a parent/function and the denormal mode cannot be
1600 // determined, use the default (IEEE).
1601 return ConstantFoldBinaryOpOperands(Opcode, LHS, RHS, DL);
1602}
1603
1605 Type *DestTy, const DataLayout &DL) {
1606 assert(Instruction::isCast(Opcode));
1607
1608 if (auto *CE = dyn_cast<ConstantExpr>(C))
1609 if (CE->isCast())
1610 if (unsigned NewOp = CastInst::isEliminableCastPair(
1611 Instruction::CastOps(CE->getOpcode()),
1612 Instruction::CastOps(Opcode), CE->getOperand(0)->getType(),
1613 C->getType(), DestTy, &DL))
1614 return ConstantFoldCastOperand(NewOp, CE->getOperand(0), DestTy, DL);
1615
1616 switch (Opcode) {
1617 default:
1618 llvm_unreachable("Missing case");
1619 case Instruction::PtrToAddr:
1620 case Instruction::PtrToInt:
1621 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1622 Constant *FoldedValue = nullptr;
1623 // If the input is an inttoptr, eliminate the pair. This requires knowing
1624 // the width of a pointer, so it can't be done in ConstantExpr::getCast.
1625 if (CE->getOpcode() == Instruction::IntToPtr) {
1626 // zext/trunc the inttoptr to pointer/address size.
1627 Type *MidTy = Opcode == Instruction::PtrToInt
1628 ? DL.getAddressType(CE->getType())
1629 : DL.getIntPtrType(CE->getType());
1630 FoldedValue = ConstantFoldIntegerCast(CE->getOperand(0), MidTy,
1631 /*IsSigned=*/false, DL);
1632 } else if (auto *GEP = dyn_cast<GEPOperator>(CE)) {
1633 // If we have GEP, we can perform the following folds:
1634 // (ptrtoint/ptrtoaddr (gep null, x)) -> x
1635 // (ptrtoint/ptrtoaddr (gep (gep null, x), y) -> x + y, etc.
1636 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
1637 APInt BaseOffset(BitWidth, 0);
1638 auto *Base = cast<Constant>(GEP->stripAndAccumulateConstantOffsets(
1639 DL, BaseOffset, /*AllowNonInbounds=*/true));
1640 if (Base->isNullValue()) {
1641 FoldedValue = ConstantInt::get(CE->getContext(), BaseOffset);
1642 } else {
1643 // ptrtoint/ptrtoaddr (gep i8, Ptr, (sub 0, V))
1644 // -> sub (ptrtoint/ptrtoaddr Ptr), V
1645 if (GEP->getNumIndices() == 1 &&
1646 GEP->getSourceElementType()->isIntegerTy(8)) {
1647 auto *Ptr = cast<Constant>(GEP->getPointerOperand());
1648 auto *Sub = dyn_cast<ConstantExpr>(GEP->getOperand(1));
1649 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1650 if (Sub && Sub->getType() == IntIdxTy &&
1651 Sub->getOpcode() == Instruction::Sub &&
1652 Sub->getOperand(0)->isNullValue())
1653 FoldedValue = ConstantExpr::getSub(
1654 ConstantExpr::getCast(Opcode, Ptr, IntIdxTy),
1655 Sub->getOperand(1));
1656 }
1657 }
1658 }
1659 if (FoldedValue) {
1660 // Do a zext or trunc to get to the ptrtoint/ptrtoaddr dest size.
1661 return ConstantFoldIntegerCast(FoldedValue, DestTy, /*IsSigned=*/false,
1662 DL);
1663 }
1664 }
1665 break;
1666 case Instruction::IntToPtr:
1667 // If the input is a ptrtoint, turn the pair into a ptr to ptr bitcast if
1668 // the int size is >= the ptr size and the address spaces are the same.
1669 // This requires knowing the width of a pointer, so it can't be done in
1670 // ConstantExpr::getCast.
1671 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1672 if (CE->getOpcode() == Instruction::PtrToInt) {
1673 Constant *SrcPtr = CE->getOperand(0);
1674 unsigned SrcPtrSize = DL.getPointerTypeSizeInBits(SrcPtr->getType());
1675 unsigned MidIntSize = CE->getType()->getScalarSizeInBits();
1676
1677 if (MidIntSize >= SrcPtrSize) {
1678 unsigned SrcAS = SrcPtr->getType()->getPointerAddressSpace();
1679 if (SrcAS == DestTy->getPointerAddressSpace())
1680 return FoldBitCast(CE->getOperand(0), DestTy, DL);
1681 }
1682 }
1683 }
1684 break;
1685 case Instruction::Trunc:
1686 case Instruction::ZExt:
1687 case Instruction::SExt:
1688 case Instruction::FPTrunc:
1689 case Instruction::FPExt:
1690 case Instruction::UIToFP:
1691 case Instruction::SIToFP:
1692 case Instruction::FPToUI:
1693 case Instruction::FPToSI:
1694 case Instruction::AddrSpaceCast:
1695 break;
1696 case Instruction::BitCast:
1697 return FoldBitCast(C, DestTy, DL);
1698 }
1699
1701 return ConstantExpr::getCast(Opcode, C, DestTy);
1702 return ConstantFoldCastInstruction(Opcode, C, DestTy);
1703}
1704
1706 bool IsSigned, const DataLayout &DL) {
1707 Type *SrcTy = C->getType();
1708 if (SrcTy == DestTy)
1709 return C;
1710 if (SrcTy->getScalarSizeInBits() > DestTy->getScalarSizeInBits())
1711 return ConstantFoldCastOperand(Instruction::Trunc, C, DestTy, DL);
1712 if (IsSigned)
1713 return ConstantFoldCastOperand(Instruction::SExt, C, DestTy, DL);
1714 return ConstantFoldCastOperand(Instruction::ZExt, C, DestTy, DL);
1715}
1716
1717//===----------------------------------------------------------------------===//
1718// Constant Folding for Calls
1719//
1720
1722 if (Call->isNoBuiltin())
1723 return false;
1724 if (Call->getFunctionType() != F->getFunctionType())
1725 return false;
1726
1727 // Allow FP calls (both libcalls and intrinsics) to avoid being folded.
1728 // This can be useful for GPU targets or in cross-compilation scenarios
1729 // when the exact target FP behaviour is required, and the host compiler's
1730 // behaviour may be slightly different from the device's run-time behaviour.
1731 if (DisableFPCallFolding && (F->getReturnType()->isFloatingPointTy() ||
1732 any_of(F->args(), [](const Argument &Arg) {
1733 return Arg.getType()->isFloatingPointTy();
1734 })))
1735 return false;
1736
1737 switch (F->getIntrinsicID()) {
1738 // Operations that do not operate floating-point numbers and do not depend on
1739 // FP environment can be folded even in strictfp functions.
1740 case Intrinsic::bswap:
1741 case Intrinsic::ctpop:
1742 case Intrinsic::ctlz:
1743 case Intrinsic::cttz:
1744 case Intrinsic::fshl:
1745 case Intrinsic::fshr:
1746 case Intrinsic::launder_invariant_group:
1747 case Intrinsic::strip_invariant_group:
1748 case Intrinsic::masked_load:
1749 case Intrinsic::get_active_lane_mask:
1750 case Intrinsic::abs:
1751 case Intrinsic::smax:
1752 case Intrinsic::smin:
1753 case Intrinsic::umax:
1754 case Intrinsic::umin:
1755 case Intrinsic::scmp:
1756 case Intrinsic::ucmp:
1757 case Intrinsic::sadd_with_overflow:
1758 case Intrinsic::uadd_with_overflow:
1759 case Intrinsic::ssub_with_overflow:
1760 case Intrinsic::usub_with_overflow:
1761 case Intrinsic::smul_with_overflow:
1762 case Intrinsic::umul_with_overflow:
1763 case Intrinsic::sadd_sat:
1764 case Intrinsic::uadd_sat:
1765 case Intrinsic::ssub_sat:
1766 case Intrinsic::usub_sat:
1767 case Intrinsic::smul_fix:
1768 case Intrinsic::smul_fix_sat:
1769 case Intrinsic::bitreverse:
1770 case Intrinsic::is_constant:
1771 case Intrinsic::vector_reduce_add:
1772 case Intrinsic::vector_reduce_mul:
1773 case Intrinsic::vector_reduce_and:
1774 case Intrinsic::vector_reduce_or:
1775 case Intrinsic::vector_reduce_xor:
1776 case Intrinsic::vector_reduce_smin:
1777 case Intrinsic::vector_reduce_smax:
1778 case Intrinsic::vector_reduce_umin:
1779 case Intrinsic::vector_reduce_umax:
1780 case Intrinsic::vector_extract:
1781 case Intrinsic::vector_insert:
1782 case Intrinsic::vector_interleave2:
1783 case Intrinsic::vector_interleave3:
1784 case Intrinsic::vector_interleave4:
1785 case Intrinsic::vector_interleave5:
1786 case Intrinsic::vector_interleave6:
1787 case Intrinsic::vector_interleave7:
1788 case Intrinsic::vector_interleave8:
1789 case Intrinsic::vector_deinterleave2:
1790 case Intrinsic::vector_deinterleave3:
1791 case Intrinsic::vector_deinterleave4:
1792 case Intrinsic::vector_deinterleave5:
1793 case Intrinsic::vector_deinterleave6:
1794 case Intrinsic::vector_deinterleave7:
1795 case Intrinsic::vector_deinterleave8:
1796 // Target intrinsics
1797 case Intrinsic::amdgcn_perm:
1798 case Intrinsic::amdgcn_wave_reduce_umin:
1799 case Intrinsic::amdgcn_wave_reduce_umax:
1800 case Intrinsic::amdgcn_wave_reduce_max:
1801 case Intrinsic::amdgcn_wave_reduce_min:
1802 case Intrinsic::amdgcn_wave_reduce_and:
1803 case Intrinsic::amdgcn_wave_reduce_or:
1804 case Intrinsic::amdgcn_s_wqm:
1805 case Intrinsic::amdgcn_s_quadmask:
1806 case Intrinsic::amdgcn_s_bitreplicate:
1807 case Intrinsic::arm_mve_vctp8:
1808 case Intrinsic::arm_mve_vctp16:
1809 case Intrinsic::arm_mve_vctp32:
1810 case Intrinsic::arm_mve_vctp64:
1811 case Intrinsic::aarch64_sve_convert_from_svbool:
1812 case Intrinsic::wasm_alltrue:
1813 case Intrinsic::wasm_anytrue:
1814 case Intrinsic::wasm_dot:
1815 // WebAssembly float semantics are always known
1816 case Intrinsic::wasm_trunc_signed:
1817 case Intrinsic::wasm_trunc_unsigned:
1818 return true;
1819
1820 // Floating point operations cannot be folded in strictfp functions in
1821 // general case. They can be folded if FP environment is known to compiler.
1822 case Intrinsic::minnum:
1823 case Intrinsic::maxnum:
1824 case Intrinsic::minimum:
1825 case Intrinsic::maximum:
1826 case Intrinsic::minimumnum:
1827 case Intrinsic::maximumnum:
1828 case Intrinsic::log:
1829 case Intrinsic::log2:
1830 case Intrinsic::log10:
1831 case Intrinsic::exp:
1832 case Intrinsic::exp2:
1833 case Intrinsic::exp10:
1834 case Intrinsic::sqrt:
1835 case Intrinsic::sin:
1836 case Intrinsic::cos:
1837 case Intrinsic::sincos:
1838 case Intrinsic::sinh:
1839 case Intrinsic::cosh:
1840 case Intrinsic::atan:
1841 case Intrinsic::pow:
1842 case Intrinsic::powi:
1843 case Intrinsic::ldexp:
1844 case Intrinsic::fma:
1845 case Intrinsic::fmuladd:
1846 case Intrinsic::frexp:
1847 case Intrinsic::fptoui_sat:
1848 case Intrinsic::fptosi_sat:
1849 case Intrinsic::amdgcn_cos:
1850 case Intrinsic::amdgcn_cubeid:
1851 case Intrinsic::amdgcn_cubema:
1852 case Intrinsic::amdgcn_cubesc:
1853 case Intrinsic::amdgcn_cubetc:
1854 case Intrinsic::amdgcn_fmul_legacy:
1855 case Intrinsic::amdgcn_fma_legacy:
1856 case Intrinsic::amdgcn_fract:
1857 case Intrinsic::amdgcn_sin:
1858 // The intrinsics below depend on rounding mode in MXCSR.
1859 case Intrinsic::x86_sse_cvtss2si:
1860 case Intrinsic::x86_sse_cvtss2si64:
1861 case Intrinsic::x86_sse_cvttss2si:
1862 case Intrinsic::x86_sse_cvttss2si64:
1863 case Intrinsic::x86_sse2_cvtsd2si:
1864 case Intrinsic::x86_sse2_cvtsd2si64:
1865 case Intrinsic::x86_sse2_cvttsd2si:
1866 case Intrinsic::x86_sse2_cvttsd2si64:
1867 case Intrinsic::x86_avx512_vcvtss2si32:
1868 case Intrinsic::x86_avx512_vcvtss2si64:
1869 case Intrinsic::x86_avx512_cvttss2si:
1870 case Intrinsic::x86_avx512_cvttss2si64:
1871 case Intrinsic::x86_avx512_vcvtsd2si32:
1872 case Intrinsic::x86_avx512_vcvtsd2si64:
1873 case Intrinsic::x86_avx512_cvttsd2si:
1874 case Intrinsic::x86_avx512_cvttsd2si64:
1875 case Intrinsic::x86_avx512_vcvtss2usi32:
1876 case Intrinsic::x86_avx512_vcvtss2usi64:
1877 case Intrinsic::x86_avx512_cvttss2usi:
1878 case Intrinsic::x86_avx512_cvttss2usi64:
1879 case Intrinsic::x86_avx512_vcvtsd2usi32:
1880 case Intrinsic::x86_avx512_vcvtsd2usi64:
1881 case Intrinsic::x86_avx512_cvttsd2usi:
1882 case Intrinsic::x86_avx512_cvttsd2usi64:
1883
1884 // NVVM FMax intrinsics
1885 case Intrinsic::nvvm_fmax_d:
1886 case Intrinsic::nvvm_fmax_f:
1887 case Intrinsic::nvvm_fmax_ftz_f:
1888 case Intrinsic::nvvm_fmax_ftz_nan_f:
1889 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
1890 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
1891 case Intrinsic::nvvm_fmax_nan_f:
1892 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
1893 case Intrinsic::nvvm_fmax_xorsign_abs_f:
1894
1895 // NVVM FMin intrinsics
1896 case Intrinsic::nvvm_fmin_d:
1897 case Intrinsic::nvvm_fmin_f:
1898 case Intrinsic::nvvm_fmin_ftz_f:
1899 case Intrinsic::nvvm_fmin_ftz_nan_f:
1900 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
1901 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
1902 case Intrinsic::nvvm_fmin_nan_f:
1903 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
1904 case Intrinsic::nvvm_fmin_xorsign_abs_f:
1905
1906 // NVVM float/double to int32/uint32 conversion intrinsics
1907 case Intrinsic::nvvm_f2i_rm:
1908 case Intrinsic::nvvm_f2i_rn:
1909 case Intrinsic::nvvm_f2i_rp:
1910 case Intrinsic::nvvm_f2i_rz:
1911 case Intrinsic::nvvm_f2i_rm_ftz:
1912 case Intrinsic::nvvm_f2i_rn_ftz:
1913 case Intrinsic::nvvm_f2i_rp_ftz:
1914 case Intrinsic::nvvm_f2i_rz_ftz:
1915 case Intrinsic::nvvm_f2ui_rm:
1916 case Intrinsic::nvvm_f2ui_rn:
1917 case Intrinsic::nvvm_f2ui_rp:
1918 case Intrinsic::nvvm_f2ui_rz:
1919 case Intrinsic::nvvm_f2ui_rm_ftz:
1920 case Intrinsic::nvvm_f2ui_rn_ftz:
1921 case Intrinsic::nvvm_f2ui_rp_ftz:
1922 case Intrinsic::nvvm_f2ui_rz_ftz:
1923 case Intrinsic::nvvm_d2i_rm:
1924 case Intrinsic::nvvm_d2i_rn:
1925 case Intrinsic::nvvm_d2i_rp:
1926 case Intrinsic::nvvm_d2i_rz:
1927 case Intrinsic::nvvm_d2ui_rm:
1928 case Intrinsic::nvvm_d2ui_rn:
1929 case Intrinsic::nvvm_d2ui_rp:
1930 case Intrinsic::nvvm_d2ui_rz:
1931
1932 // NVVM float/double to int64/uint64 conversion intrinsics
1933 case Intrinsic::nvvm_f2ll_rm:
1934 case Intrinsic::nvvm_f2ll_rn:
1935 case Intrinsic::nvvm_f2ll_rp:
1936 case Intrinsic::nvvm_f2ll_rz:
1937 case Intrinsic::nvvm_f2ll_rm_ftz:
1938 case Intrinsic::nvvm_f2ll_rn_ftz:
1939 case Intrinsic::nvvm_f2ll_rp_ftz:
1940 case Intrinsic::nvvm_f2ll_rz_ftz:
1941 case Intrinsic::nvvm_f2ull_rm:
1942 case Intrinsic::nvvm_f2ull_rn:
1943 case Intrinsic::nvvm_f2ull_rp:
1944 case Intrinsic::nvvm_f2ull_rz:
1945 case Intrinsic::nvvm_f2ull_rm_ftz:
1946 case Intrinsic::nvvm_f2ull_rn_ftz:
1947 case Intrinsic::nvvm_f2ull_rp_ftz:
1948 case Intrinsic::nvvm_f2ull_rz_ftz:
1949 case Intrinsic::nvvm_d2ll_rm:
1950 case Intrinsic::nvvm_d2ll_rn:
1951 case Intrinsic::nvvm_d2ll_rp:
1952 case Intrinsic::nvvm_d2ll_rz:
1953 case Intrinsic::nvvm_d2ull_rm:
1954 case Intrinsic::nvvm_d2ull_rn:
1955 case Intrinsic::nvvm_d2ull_rp:
1956 case Intrinsic::nvvm_d2ull_rz:
1957
1958 // NVVM math intrinsics:
1959 case Intrinsic::nvvm_ceil_d:
1960 case Intrinsic::nvvm_ceil_f:
1961 case Intrinsic::nvvm_ceil_ftz_f:
1962
1963 case Intrinsic::nvvm_fabs:
1964 case Intrinsic::nvvm_fabs_ftz:
1965
1966 case Intrinsic::nvvm_floor_d:
1967 case Intrinsic::nvvm_floor_f:
1968 case Intrinsic::nvvm_floor_ftz_f:
1969
1970 case Intrinsic::nvvm_rcp_rm_d:
1971 case Intrinsic::nvvm_rcp_rm_f:
1972 case Intrinsic::nvvm_rcp_rm_ftz_f:
1973 case Intrinsic::nvvm_rcp_rn_d:
1974 case Intrinsic::nvvm_rcp_rn_f:
1975 case Intrinsic::nvvm_rcp_rn_ftz_f:
1976 case Intrinsic::nvvm_rcp_rp_d:
1977 case Intrinsic::nvvm_rcp_rp_f:
1978 case Intrinsic::nvvm_rcp_rp_ftz_f:
1979 case Intrinsic::nvvm_rcp_rz_d:
1980 case Intrinsic::nvvm_rcp_rz_f:
1981 case Intrinsic::nvvm_rcp_rz_ftz_f:
1982
1983 case Intrinsic::nvvm_round_d:
1984 case Intrinsic::nvvm_round_f:
1985 case Intrinsic::nvvm_round_ftz_f:
1986
1987 case Intrinsic::nvvm_saturate_d:
1988 case Intrinsic::nvvm_saturate_f:
1989 case Intrinsic::nvvm_saturate_ftz_f:
1990
1991 case Intrinsic::nvvm_sqrt_f:
1992 case Intrinsic::nvvm_sqrt_rn_d:
1993 case Intrinsic::nvvm_sqrt_rn_f:
1994 case Intrinsic::nvvm_sqrt_rn_ftz_f:
1995 return !Call->isStrictFP();
1996
1997 // NVVM add intrinsics with explicit rounding modes
1998 case Intrinsic::nvvm_add_rm_d:
1999 case Intrinsic::nvvm_add_rn_d:
2000 case Intrinsic::nvvm_add_rp_d:
2001 case Intrinsic::nvvm_add_rz_d:
2002 case Intrinsic::nvvm_add_rm_f:
2003 case Intrinsic::nvvm_add_rn_f:
2004 case Intrinsic::nvvm_add_rp_f:
2005 case Intrinsic::nvvm_add_rz_f:
2006 case Intrinsic::nvvm_add_rm_ftz_f:
2007 case Intrinsic::nvvm_add_rn_ftz_f:
2008 case Intrinsic::nvvm_add_rp_ftz_f:
2009 case Intrinsic::nvvm_add_rz_ftz_f:
2010
2011 // NVVM div intrinsics with explicit rounding modes
2012 case Intrinsic::nvvm_div_rm_d:
2013 case Intrinsic::nvvm_div_rn_d:
2014 case Intrinsic::nvvm_div_rp_d:
2015 case Intrinsic::nvvm_div_rz_d:
2016 case Intrinsic::nvvm_div_rm_f:
2017 case Intrinsic::nvvm_div_rn_f:
2018 case Intrinsic::nvvm_div_rp_f:
2019 case Intrinsic::nvvm_div_rz_f:
2020 case Intrinsic::nvvm_div_rm_ftz_f:
2021 case Intrinsic::nvvm_div_rn_ftz_f:
2022 case Intrinsic::nvvm_div_rp_ftz_f:
2023 case Intrinsic::nvvm_div_rz_ftz_f:
2024
2025 // NVVM mul intrinsics with explicit rounding modes
2026 case Intrinsic::nvvm_mul_rm_d:
2027 case Intrinsic::nvvm_mul_rn_d:
2028 case Intrinsic::nvvm_mul_rp_d:
2029 case Intrinsic::nvvm_mul_rz_d:
2030 case Intrinsic::nvvm_mul_rm_f:
2031 case Intrinsic::nvvm_mul_rn_f:
2032 case Intrinsic::nvvm_mul_rp_f:
2033 case Intrinsic::nvvm_mul_rz_f:
2034 case Intrinsic::nvvm_mul_rm_ftz_f:
2035 case Intrinsic::nvvm_mul_rn_ftz_f:
2036 case Intrinsic::nvvm_mul_rp_ftz_f:
2037 case Intrinsic::nvvm_mul_rz_ftz_f:
2038
2039 // NVVM fma intrinsics with explicit rounding modes
2040 case Intrinsic::nvvm_fma_rm_d:
2041 case Intrinsic::nvvm_fma_rn_d:
2042 case Intrinsic::nvvm_fma_rp_d:
2043 case Intrinsic::nvvm_fma_rz_d:
2044 case Intrinsic::nvvm_fma_rm_f:
2045 case Intrinsic::nvvm_fma_rn_f:
2046 case Intrinsic::nvvm_fma_rp_f:
2047 case Intrinsic::nvvm_fma_rz_f:
2048 case Intrinsic::nvvm_fma_rm_ftz_f:
2049 case Intrinsic::nvvm_fma_rn_ftz_f:
2050 case Intrinsic::nvvm_fma_rp_ftz_f:
2051 case Intrinsic::nvvm_fma_rz_ftz_f:
2052
2053 // Sign operations are actually bitwise operations, they do not raise
2054 // exceptions even for SNANs.
2055 case Intrinsic::fabs:
2056 case Intrinsic::copysign:
2057 case Intrinsic::is_fpclass:
2058 // Non-constrained variants of rounding operations means default FP
2059 // environment, they can be folded in any case.
2060 case Intrinsic::ceil:
2061 case Intrinsic::floor:
2062 case Intrinsic::round:
2063 case Intrinsic::roundeven:
2064 case Intrinsic::trunc:
2065 case Intrinsic::nearbyint:
2066 case Intrinsic::rint:
2067 case Intrinsic::canonicalize:
2068
2069 // Constrained intrinsics can be folded if FP environment is known
2070 // to compiler.
2071 case Intrinsic::experimental_constrained_fma:
2072 case Intrinsic::experimental_constrained_fmuladd:
2073 case Intrinsic::experimental_constrained_fadd:
2074 case Intrinsic::experimental_constrained_fsub:
2075 case Intrinsic::experimental_constrained_fmul:
2076 case Intrinsic::experimental_constrained_fdiv:
2077 case Intrinsic::experimental_constrained_frem:
2078 case Intrinsic::experimental_constrained_ceil:
2079 case Intrinsic::experimental_constrained_floor:
2080 case Intrinsic::experimental_constrained_round:
2081 case Intrinsic::experimental_constrained_roundeven:
2082 case Intrinsic::experimental_constrained_trunc:
2083 case Intrinsic::experimental_constrained_nearbyint:
2084 case Intrinsic::experimental_constrained_rint:
2085 case Intrinsic::experimental_constrained_fcmp:
2086 case Intrinsic::experimental_constrained_fcmps:
2087
2088 case Intrinsic::experimental_cttz_elts:
2089 return true;
2090 default:
2091 return false;
2092 case Intrinsic::not_intrinsic: break;
2093 }
2094
2095 if (!F->hasName() || Call->isStrictFP())
2096 return false;
2097
2098 // In these cases, the check of the length is required. We don't want to
2099 // return true for a name like "cos\0blah" which strcmp would return equal to
2100 // "cos", but has length 8.
2101 StringRef Name = F->getName();
2102 switch (Name[0]) {
2103 default:
2104 return false;
2105 // clang-format off
2106 case 'a':
2107 return Name == "acos" || Name == "acosf" ||
2108 Name == "asin" || Name == "asinf" ||
2109 Name == "atan" || Name == "atanf" ||
2110 Name == "atan2" || Name == "atan2f";
2111 case 'c':
2112 return Name == "ceil" || Name == "ceilf" ||
2113 Name == "cos" || Name == "cosf" ||
2114 Name == "cosh" || Name == "coshf";
2115 case 'e':
2116 return Name == "exp" || Name == "expf" || Name == "exp2" ||
2117 Name == "exp2f" || Name == "erf" || Name == "erff";
2118 case 'f':
2119 return Name == "fabs" || Name == "fabsf" ||
2120 Name == "floor" || Name == "floorf" ||
2121 Name == "fmod" || Name == "fmodf";
2122 case 'i':
2123 return Name == "ilogb" || Name == "ilogbf";
2124 case 'l':
2125 return Name == "log" || Name == "logf" || Name == "logl" ||
2126 Name == "log2" || Name == "log2f" || Name == "log10" ||
2127 Name == "log10f" || Name == "logb" || Name == "logbf" ||
2128 Name == "log1p" || Name == "log1pf";
2129 case 'n':
2130 return Name == "nearbyint" || Name == "nearbyintf" || Name == "nextafter" ||
2131 Name == "nextafterf" || Name == "nexttoward" ||
2132 Name == "nexttowardf";
2133 case 'p':
2134 return Name == "pow" || Name == "powf";
2135 case 'r':
2136 return Name == "remainder" || Name == "remainderf" ||
2137 Name == "rint" || Name == "rintf" ||
2138 Name == "round" || Name == "roundf" ||
2139 Name == "roundeven" || Name == "roundevenf";
2140 case 's':
2141 return Name == "sin" || Name == "sinf" ||
2142 Name == "sinh" || Name == "sinhf" ||
2143 Name == "sqrt" || Name == "sqrtf";
2144 case 't':
2145 return Name == "tan" || Name == "tanf" ||
2146 Name == "tanh" || Name == "tanhf" ||
2147 Name == "trunc" || Name == "truncf";
2148 case '_':
2149 // Check for various function names that get used for the math functions
2150 // when the header files are preprocessed with the macro
2151 // __FINITE_MATH_ONLY__ enabled.
2152 // The '12' here is the length of the shortest name that can match.
2153 // We need to check the size before looking at Name[1] and Name[2]
2154 // so we may as well check a limit that will eliminate mismatches.
2155 if (Name.size() < 12 || Name[1] != '_')
2156 return false;
2157 switch (Name[2]) {
2158 default:
2159 return false;
2160 case 'a':
2161 return Name == "__acos_finite" || Name == "__acosf_finite" ||
2162 Name == "__asin_finite" || Name == "__asinf_finite" ||
2163 Name == "__atan2_finite" || Name == "__atan2f_finite";
2164 case 'c':
2165 return Name == "__cosh_finite" || Name == "__coshf_finite";
2166 case 'e':
2167 return Name == "__exp_finite" || Name == "__expf_finite" ||
2168 Name == "__exp2_finite" || Name == "__exp2f_finite";
2169 case 'l':
2170 return Name == "__log_finite" || Name == "__logf_finite" ||
2171 Name == "__log10_finite" || Name == "__log10f_finite";
2172 case 'p':
2173 return Name == "__pow_finite" || Name == "__powf_finite";
2174 case 's':
2175 return Name == "__sinh_finite" || Name == "__sinhf_finite";
2176 }
2177 // clang-format on
2178 }
2179}
2180
2181namespace {
2182
2183Constant *GetConstantFoldFPValue(double V, Type *Ty) {
2184 if (Ty->isHalfTy() || Ty->isFloatTy()) {
2185 APFloat APF(V);
2186 bool unused;
2187 APF.convert(Ty->getFltSemantics(), APFloat::rmNearestTiesToEven, &unused);
2188 return ConstantFP::get(Ty->getContext(), APF);
2189 }
2190 if (Ty->isDoubleTy())
2191 return ConstantFP::get(Ty->getContext(), APFloat(V));
2192 llvm_unreachable("Can only constant fold half/float/double");
2193}
2194
2195#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2196Constant *GetConstantFoldFPValue128(float128 V, Type *Ty) {
2197 if (Ty->isFP128Ty())
2198 return ConstantFP::get(Ty, V);
2199 llvm_unreachable("Can only constant fold fp128");
2200}
2201#endif
2202
2203/// Clear the floating-point exception state.
2204inline void llvm_fenv_clearexcept() {
2205#if HAVE_DECL_FE_ALL_EXCEPT
2206 feclearexcept(FE_ALL_EXCEPT);
2207#endif
2208 errno = 0;
2209}
2210
2211/// Test if a floating-point exception was raised.
2212inline bool llvm_fenv_testexcept() {
2213 int errno_val = errno;
2214 if (errno_val == ERANGE || errno_val == EDOM)
2215 return true;
2216#if HAVE_DECL_FE_ALL_EXCEPT && HAVE_DECL_FE_INEXACT
2217 if (fetestexcept(FE_ALL_EXCEPT & ~FE_INEXACT))
2218 return true;
2219#endif
2220 return false;
2221}
2222
2223static APFloat FTZPreserveSign(const APFloat &V) {
2224 if (V.isDenormal())
2225 return APFloat::getZero(V.getSemantics(), V.isNegative());
2226 return V;
2227}
2228
2229static APFloat FlushToPositiveZero(const APFloat &V) {
2230 if (V.isDenormal())
2231 return APFloat::getZero(V.getSemantics(), false);
2232 return V;
2233}
2234
2235static APFloat FlushWithDenormKind(const APFloat &V,
2236 DenormalMode::DenormalModeKind DenormKind) {
2239 switch (DenormKind) {
2241 return V;
2243 return FTZPreserveSign(V);
2245 return FlushToPositiveZero(V);
2246 default:
2247 llvm_unreachable("Invalid denormal mode!");
2248 }
2249}
2250
2251Constant *ConstantFoldFP(double (*NativeFP)(double), const APFloat &V, Type *Ty,
2252 DenormalMode DenormMode = DenormalMode::getIEEE()) {
2253 if (!DenormMode.isValid() ||
2254 DenormMode.Input == DenormalMode::DenormalModeKind::Dynamic ||
2255 DenormMode.Output == DenormalMode::DenormalModeKind::Dynamic)
2256 return nullptr;
2257
2258 llvm_fenv_clearexcept();
2259 auto Input = FlushWithDenormKind(V, DenormMode.Input);
2260 double Result = NativeFP(Input.convertToDouble());
2261 if (llvm_fenv_testexcept()) {
2262 llvm_fenv_clearexcept();
2263 return nullptr;
2264 }
2265
2266 Constant *Output = GetConstantFoldFPValue(Result, Ty);
2267 if (DenormMode.Output == DenormalMode::DenormalModeKind::IEEE)
2268 return Output;
2269 const auto *CFP = static_cast<ConstantFP *>(Output);
2270 const auto Res = FlushWithDenormKind(CFP->getValueAPF(), DenormMode.Output);
2271 return ConstantFP::get(Ty->getContext(), Res);
2272}
2273
2274#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2275Constant *ConstantFoldFP128(float128 (*NativeFP)(float128), const APFloat &V,
2276 Type *Ty) {
2277 llvm_fenv_clearexcept();
2278 float128 Result = NativeFP(V.convertToQuad());
2279 if (llvm_fenv_testexcept()) {
2280 llvm_fenv_clearexcept();
2281 return nullptr;
2282 }
2283
2284 return GetConstantFoldFPValue128(Result, Ty);
2285}
2286#endif
2287
2288Constant *ConstantFoldBinaryFP(double (*NativeFP)(double, double),
2289 const APFloat &V, const APFloat &W, Type *Ty) {
2290 llvm_fenv_clearexcept();
2291 double Result = NativeFP(V.convertToDouble(), W.convertToDouble());
2292 if (llvm_fenv_testexcept()) {
2293 llvm_fenv_clearexcept();
2294 return nullptr;
2295 }
2296
2297 return GetConstantFoldFPValue(Result, Ty);
2298}
2299
2300Constant *constantFoldVectorReduce(Intrinsic::ID IID, Constant *Op) {
2301 auto *OpVT = cast<VectorType>(Op->getType());
2302
2303 // This is the same as the underlying binops - poison propagates.
2304 if (Op->containsPoisonElement())
2305 return PoisonValue::get(OpVT->getElementType());
2306
2307 // Shortcut non-accumulating reductions.
2308 if (Constant *SplatVal = Op->getSplatValue()) {
2309 switch (IID) {
2310 case Intrinsic::vector_reduce_and:
2311 case Intrinsic::vector_reduce_or:
2312 case Intrinsic::vector_reduce_smin:
2313 case Intrinsic::vector_reduce_smax:
2314 case Intrinsic::vector_reduce_umin:
2315 case Intrinsic::vector_reduce_umax:
2316 return SplatVal;
2317 case Intrinsic::vector_reduce_add:
2318 if (SplatVal->isNullValue())
2319 return SplatVal;
2320 break;
2321 case Intrinsic::vector_reduce_mul:
2322 if (SplatVal->isNullValue() || SplatVal->isOneValue())
2323 return SplatVal;
2324 break;
2325 case Intrinsic::vector_reduce_xor:
2326 if (SplatVal->isNullValue())
2327 return SplatVal;
2328 if (OpVT->getElementCount().isKnownMultipleOf(2))
2329 return Constant::getNullValue(OpVT->getElementType());
2330 break;
2331 }
2332 }
2333
2335 if (!VT)
2336 return nullptr;
2337
2338 // TODO: Handle undef.
2339 auto *EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(0U));
2340 if (!EltC)
2341 return nullptr;
2342
2343 APInt Acc = EltC->getValue();
2344 for (unsigned I = 1, E = VT->getNumElements(); I != E; I++) {
2345 if (!(EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(I))))
2346 return nullptr;
2347 const APInt &X = EltC->getValue();
2348 switch (IID) {
2349 case Intrinsic::vector_reduce_add:
2350 Acc = Acc + X;
2351 break;
2352 case Intrinsic::vector_reduce_mul:
2353 Acc = Acc * X;
2354 break;
2355 case Intrinsic::vector_reduce_and:
2356 Acc = Acc & X;
2357 break;
2358 case Intrinsic::vector_reduce_or:
2359 Acc = Acc | X;
2360 break;
2361 case Intrinsic::vector_reduce_xor:
2362 Acc = Acc ^ X;
2363 break;
2364 case Intrinsic::vector_reduce_smin:
2365 Acc = APIntOps::smin(Acc, X);
2366 break;
2367 case Intrinsic::vector_reduce_smax:
2368 Acc = APIntOps::smax(Acc, X);
2369 break;
2370 case Intrinsic::vector_reduce_umin:
2371 Acc = APIntOps::umin(Acc, X);
2372 break;
2373 case Intrinsic::vector_reduce_umax:
2374 Acc = APIntOps::umax(Acc, X);
2375 break;
2376 }
2377 }
2378
2379 return ConstantInt::get(Op->getContext(), Acc);
2380}
2381
2382/// Attempt to fold an SSE floating point to integer conversion of a constant
2383/// floating point. If roundTowardZero is false, the default IEEE rounding is
2384/// used (toward nearest, ties to even). This matches the behavior of the
2385/// non-truncating SSE instructions in the default rounding mode. The desired
2386/// integer type Ty is used to select how many bits are available for the
2387/// result. Returns null if the conversion cannot be performed, otherwise
2388/// returns the Constant value resulting from the conversion.
2389Constant *ConstantFoldSSEConvertToInt(const APFloat &Val, bool roundTowardZero,
2390 Type *Ty, bool IsSigned) {
2391 // All of these conversion intrinsics form an integer of at most 64bits.
2392 unsigned ResultWidth = Ty->getIntegerBitWidth();
2393 assert(ResultWidth <= 64 &&
2394 "Can only constant fold conversions to 64 and 32 bit ints");
2395
2396 uint64_t UIntVal;
2397 bool isExact = false;
2401 Val.convertToInteger(MutableArrayRef(UIntVal), ResultWidth,
2402 IsSigned, mode, &isExact);
2403 if (status != APFloat::opOK &&
2404 (!roundTowardZero || status != APFloat::opInexact))
2405 return nullptr;
2406 return ConstantInt::get(Ty, UIntVal, IsSigned);
2407}
2408
2409double getValueAsDouble(ConstantFP *Op) {
2410 Type *Ty = Op->getType();
2411
2412 if (Ty->isBFloatTy() || Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())
2413 return Op->getValueAPF().convertToDouble();
2414
2415 bool unused;
2416 APFloat APF = Op->getValueAPF();
2418 return APF.convertToDouble();
2419}
2420
2421static bool getConstIntOrUndef(Value *Op, const APInt *&C) {
2422 if (auto *CI = dyn_cast<ConstantInt>(Op)) {
2423 C = &CI->getValue();
2424 return true;
2425 }
2426 if (isa<UndefValue>(Op)) {
2427 C = nullptr;
2428 return true;
2429 }
2430 return false;
2431}
2432
2433/// Checks if the given intrinsic call, which evaluates to constant, is allowed
2434/// to be folded.
2435///
2436/// \param CI Constrained intrinsic call.
2437/// \param St Exception flags raised during constant evaluation.
2438static bool mayFoldConstrained(ConstrainedFPIntrinsic *CI,
2439 APFloat::opStatus St) {
2440 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2441 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2442
2443 // If the operation does not change exception status flags, it is safe
2444 // to fold.
2445 if (St == APFloat::opStatus::opOK)
2446 return true;
2447
2448 // If evaluation raised FP exception, the result can depend on rounding
2449 // mode. If the latter is unknown, folding is not possible.
2450 if (ORM == RoundingMode::Dynamic)
2451 return false;
2452
2453 // If FP exceptions are ignored, fold the call, even if such exception is
2454 // raised.
2455 if (EB && *EB != fp::ExceptionBehavior::ebStrict)
2456 return true;
2457
2458 // Leave the calculation for runtime so that exception flags be correctly set
2459 // in hardware.
2460 return false;
2461}
2462
2463/// Returns the rounding mode that should be used for constant evaluation.
2464static RoundingMode
2465getEvaluationRoundingMode(const ConstrainedFPIntrinsic *CI) {
2466 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2467 if (!ORM || *ORM == RoundingMode::Dynamic)
2468 // Even if the rounding mode is unknown, try evaluating the operation.
2469 // If it does not raise inexact exception, rounding was not applied,
2470 // so the result is exact and does not depend on rounding mode. Whether
2471 // other FP exceptions are raised, it does not depend on rounding mode.
2473 return *ORM;
2474}
2475
2476/// Try to constant fold llvm.canonicalize for the given caller and value.
2477static Constant *constantFoldCanonicalize(const Type *Ty, const CallBase *CI,
2478 const APFloat &Src) {
2479 // Zero, positive and negative, is always OK to fold.
2480 if (Src.isZero()) {
2481 // Get a fresh 0, since ppc_fp128 does have non-canonical zeros.
2482 return ConstantFP::get(
2483 CI->getContext(),
2484 APFloat::getZero(Src.getSemantics(), Src.isNegative()));
2485 }
2486
2487 if (!Ty->isIEEELikeFPTy())
2488 return nullptr;
2489
2490 // Zero is always canonical and the sign must be preserved.
2491 //
2492 // Denorms and nans may have special encodings, but it should be OK to fold a
2493 // totally average number.
2494 if (Src.isNormal() || Src.isInfinity())
2495 return ConstantFP::get(CI->getContext(), Src);
2496
2497 if (Src.isDenormal() && CI->getParent() && CI->getFunction()) {
2498 DenormalMode DenormMode =
2499 CI->getFunction()->getDenormalMode(Src.getSemantics());
2500
2501 if (DenormMode == DenormalMode::getIEEE())
2502 return ConstantFP::get(CI->getContext(), Src);
2503
2504 if (DenormMode.Input == DenormalMode::Dynamic)
2505 return nullptr;
2506
2507 // If we know if either input or output is flushed, we can fold.
2508 if ((DenormMode.Input == DenormalMode::Dynamic &&
2509 DenormMode.Output == DenormalMode::IEEE) ||
2510 (DenormMode.Input == DenormalMode::IEEE &&
2511 DenormMode.Output == DenormalMode::Dynamic))
2512 return nullptr;
2513
2514 bool IsPositive =
2515 (!Src.isNegative() || DenormMode.Input == DenormalMode::PositiveZero ||
2516 (DenormMode.Output == DenormalMode::PositiveZero &&
2517 DenormMode.Input == DenormalMode::IEEE));
2518
2519 return ConstantFP::get(CI->getContext(),
2520 APFloat::getZero(Src.getSemantics(), !IsPositive));
2521 }
2522
2523 return nullptr;
2524}
2525
2526static Constant *ConstantFoldScalarCall1(StringRef Name,
2527 Intrinsic::ID IntrinsicID,
2528 Type *Ty,
2529 ArrayRef<Constant *> Operands,
2530 const TargetLibraryInfo *TLI,
2531 const CallBase *Call) {
2532 assert(Operands.size() == 1 && "Wrong number of operands.");
2533
2534 if (IntrinsicID == Intrinsic::is_constant) {
2535 // We know we have a "Constant" argument. But we want to only
2536 // return true for manifest constants, not those that depend on
2537 // constants with unknowable values, e.g. GlobalValue or BlockAddress.
2538 if (Operands[0]->isManifestConstant())
2539 return ConstantInt::getTrue(Ty->getContext());
2540 return nullptr;
2541 }
2542
2543 if (isa<UndefValue>(Operands[0])) {
2544 // cosine(arg) is between -1 and 1. cosine(invalid arg) is NaN.
2545 // ctpop() is between 0 and bitwidth, pick 0 for undef.
2546 // fptoui.sat and fptosi.sat can always fold to zero (for a zero input).
2547 if (IntrinsicID == Intrinsic::cos ||
2548 IntrinsicID == Intrinsic::ctpop ||
2549 IntrinsicID == Intrinsic::fptoui_sat ||
2550 IntrinsicID == Intrinsic::fptosi_sat ||
2551 IntrinsicID == Intrinsic::canonicalize)
2552 return Constant::getNullValue(Ty);
2553 if (IntrinsicID == Intrinsic::bswap ||
2554 IntrinsicID == Intrinsic::bitreverse ||
2555 IntrinsicID == Intrinsic::launder_invariant_group ||
2556 IntrinsicID == Intrinsic::strip_invariant_group)
2557 return Operands[0];
2558 }
2559
2560 if (isa<ConstantPointerNull>(Operands[0])) {
2561 // launder(null) == null == strip(null) iff in addrspace 0
2562 if (IntrinsicID == Intrinsic::launder_invariant_group ||
2563 IntrinsicID == Intrinsic::strip_invariant_group) {
2564 // If instruction is not yet put in a basic block (e.g. when cloning
2565 // a function during inlining), Call's caller may not be available.
2566 // So check Call's BB first before querying Call->getCaller.
2567 const Function *Caller =
2568 Call->getParent() ? Call->getCaller() : nullptr;
2569 if (Caller &&
2571 Caller, Operands[0]->getType()->getPointerAddressSpace())) {
2572 return Operands[0];
2573 }
2574 return nullptr;
2575 }
2576 }
2577
2578 if (auto *Op = dyn_cast<ConstantFP>(Operands[0])) {
2579 APFloat U = Op->getValueAPF();
2580
2581 if (IntrinsicID == Intrinsic::wasm_trunc_signed ||
2582 IntrinsicID == Intrinsic::wasm_trunc_unsigned) {
2583 bool Signed = IntrinsicID == Intrinsic::wasm_trunc_signed;
2584
2585 if (U.isNaN())
2586 return nullptr;
2587
2588 unsigned Width = Ty->getIntegerBitWidth();
2589 APSInt Int(Width, !Signed);
2590 bool IsExact = false;
2592 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2593
2595 return ConstantInt::get(Ty, Int);
2596
2597 return nullptr;
2598 }
2599
2600 if (IntrinsicID == Intrinsic::fptoui_sat ||
2601 IntrinsicID == Intrinsic::fptosi_sat) {
2602 // convertToInteger() already has the desired saturation semantics.
2603 APSInt Int(Ty->getIntegerBitWidth(),
2604 IntrinsicID == Intrinsic::fptoui_sat);
2605 bool IsExact;
2606 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2607 return ConstantInt::get(Ty, Int);
2608 }
2609
2610 if (IntrinsicID == Intrinsic::canonicalize)
2611 return constantFoldCanonicalize(Ty, Call, U);
2612
2613#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2614 if (Ty->isFP128Ty()) {
2615 if (IntrinsicID == Intrinsic::log) {
2616 float128 Result = logf128(Op->getValueAPF().convertToQuad());
2617 return GetConstantFoldFPValue128(Result, Ty);
2618 }
2619
2620 LibFunc Fp128Func = NotLibFunc;
2621 if (TLI && TLI->getLibFunc(Name, Fp128Func) && TLI->has(Fp128Func) &&
2622 Fp128Func == LibFunc_logl)
2623 return ConstantFoldFP128(logf128, Op->getValueAPF(), Ty);
2624 }
2625#endif
2626
2627 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy() &&
2628 !Ty->isIntegerTy())
2629 return nullptr;
2630
2631 // Use internal versions of these intrinsics.
2632
2633 if (IntrinsicID == Intrinsic::nearbyint || IntrinsicID == Intrinsic::rint ||
2634 IntrinsicID == Intrinsic::roundeven) {
2635 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2636 return ConstantFP::get(Ty, U);
2637 }
2638
2639 if (IntrinsicID == Intrinsic::round) {
2640 U.roundToIntegral(APFloat::rmNearestTiesToAway);
2641 return ConstantFP::get(Ty, U);
2642 }
2643
2644 if (IntrinsicID == Intrinsic::roundeven) {
2645 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2646 return ConstantFP::get(Ty, U);
2647 }
2648
2649 if (IntrinsicID == Intrinsic::ceil) {
2650 U.roundToIntegral(APFloat::rmTowardPositive);
2651 return ConstantFP::get(Ty, U);
2652 }
2653
2654 if (IntrinsicID == Intrinsic::floor) {
2655 U.roundToIntegral(APFloat::rmTowardNegative);
2656 return ConstantFP::get(Ty, U);
2657 }
2658
2659 if (IntrinsicID == Intrinsic::trunc) {
2660 U.roundToIntegral(APFloat::rmTowardZero);
2661 return ConstantFP::get(Ty, U);
2662 }
2663
2664 if (IntrinsicID == Intrinsic::fabs) {
2665 U.clearSign();
2666 return ConstantFP::get(Ty, U);
2667 }
2668
2669 if (IntrinsicID == Intrinsic::amdgcn_fract) {
2670 // The v_fract instruction behaves like the OpenCL spec, which defines
2671 // fract(x) as fmin(x - floor(x), 0x1.fffffep-1f): "The min() operator is
2672 // there to prevent fract(-small) from returning 1.0. It returns the
2673 // largest positive floating-point number less than 1.0."
2674 APFloat FloorU(U);
2675 FloorU.roundToIntegral(APFloat::rmTowardNegative);
2676 APFloat FractU(U - FloorU);
2677 APFloat AlmostOne(U.getSemantics(), 1);
2678 AlmostOne.next(/*nextDown*/ true);
2679 return ConstantFP::get(Ty, minimum(FractU, AlmostOne));
2680 }
2681
2682 // Rounding operations (floor, trunc, ceil, round and nearbyint) do not
2683 // raise FP exceptions, unless the argument is signaling NaN.
2684
2685 std::optional<APFloat::roundingMode> RM;
2686 switch (IntrinsicID) {
2687 default:
2688 break;
2689 case Intrinsic::experimental_constrained_nearbyint:
2690 case Intrinsic::experimental_constrained_rint: {
2692 RM = CI->getRoundingMode();
2693 if (!RM || *RM == RoundingMode::Dynamic)
2694 return nullptr;
2695 break;
2696 }
2697 case Intrinsic::experimental_constrained_round:
2699 break;
2700 case Intrinsic::experimental_constrained_ceil:
2702 break;
2703 case Intrinsic::experimental_constrained_floor:
2705 break;
2706 case Intrinsic::experimental_constrained_trunc:
2708 break;
2709 }
2710 if (RM) {
2712 if (U.isFinite()) {
2713 APFloat::opStatus St = U.roundToIntegral(*RM);
2714 if (IntrinsicID == Intrinsic::experimental_constrained_rint &&
2715 St == APFloat::opInexact) {
2716 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2717 if (EB == fp::ebStrict)
2718 return nullptr;
2719 }
2720 } else if (U.isSignaling()) {
2721 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2722 if (EB && *EB != fp::ebIgnore)
2723 return nullptr;
2724 U = APFloat::getQNaN(U.getSemantics());
2725 }
2726 return ConstantFP::get(Ty, U);
2727 }
2728
2729 // NVVM float/double to signed/unsigned int32/int64 conversions:
2730 switch (IntrinsicID) {
2731 // f2i
2732 case Intrinsic::nvvm_f2i_rm:
2733 case Intrinsic::nvvm_f2i_rn:
2734 case Intrinsic::nvvm_f2i_rp:
2735 case Intrinsic::nvvm_f2i_rz:
2736 case Intrinsic::nvvm_f2i_rm_ftz:
2737 case Intrinsic::nvvm_f2i_rn_ftz:
2738 case Intrinsic::nvvm_f2i_rp_ftz:
2739 case Intrinsic::nvvm_f2i_rz_ftz:
2740 // f2ui
2741 case Intrinsic::nvvm_f2ui_rm:
2742 case Intrinsic::nvvm_f2ui_rn:
2743 case Intrinsic::nvvm_f2ui_rp:
2744 case Intrinsic::nvvm_f2ui_rz:
2745 case Intrinsic::nvvm_f2ui_rm_ftz:
2746 case Intrinsic::nvvm_f2ui_rn_ftz:
2747 case Intrinsic::nvvm_f2ui_rp_ftz:
2748 case Intrinsic::nvvm_f2ui_rz_ftz:
2749 // d2i
2750 case Intrinsic::nvvm_d2i_rm:
2751 case Intrinsic::nvvm_d2i_rn:
2752 case Intrinsic::nvvm_d2i_rp:
2753 case Intrinsic::nvvm_d2i_rz:
2754 // d2ui
2755 case Intrinsic::nvvm_d2ui_rm:
2756 case Intrinsic::nvvm_d2ui_rn:
2757 case Intrinsic::nvvm_d2ui_rp:
2758 case Intrinsic::nvvm_d2ui_rz:
2759 // f2ll
2760 case Intrinsic::nvvm_f2ll_rm:
2761 case Intrinsic::nvvm_f2ll_rn:
2762 case Intrinsic::nvvm_f2ll_rp:
2763 case Intrinsic::nvvm_f2ll_rz:
2764 case Intrinsic::nvvm_f2ll_rm_ftz:
2765 case Intrinsic::nvvm_f2ll_rn_ftz:
2766 case Intrinsic::nvvm_f2ll_rp_ftz:
2767 case Intrinsic::nvvm_f2ll_rz_ftz:
2768 // f2ull
2769 case Intrinsic::nvvm_f2ull_rm:
2770 case Intrinsic::nvvm_f2ull_rn:
2771 case Intrinsic::nvvm_f2ull_rp:
2772 case Intrinsic::nvvm_f2ull_rz:
2773 case Intrinsic::nvvm_f2ull_rm_ftz:
2774 case Intrinsic::nvvm_f2ull_rn_ftz:
2775 case Intrinsic::nvvm_f2ull_rp_ftz:
2776 case Intrinsic::nvvm_f2ull_rz_ftz:
2777 // d2ll
2778 case Intrinsic::nvvm_d2ll_rm:
2779 case Intrinsic::nvvm_d2ll_rn:
2780 case Intrinsic::nvvm_d2ll_rp:
2781 case Intrinsic::nvvm_d2ll_rz:
2782 // d2ull
2783 case Intrinsic::nvvm_d2ull_rm:
2784 case Intrinsic::nvvm_d2ull_rn:
2785 case Intrinsic::nvvm_d2ull_rp:
2786 case Intrinsic::nvvm_d2ull_rz: {
2787 // In float-to-integer conversion, NaN inputs are converted to 0.
2788 if (U.isNaN()) {
2789 // In float-to-integer conversion, NaN inputs are converted to 0
2790 // when the source and destination bitwidths are both less than 64.
2791 if (nvvm::FPToIntegerIntrinsicNaNZero(IntrinsicID))
2792 return ConstantInt::get(Ty, 0);
2793
2794 // Otherwise, the most significant bit is set.
2795 unsigned BitWidth = Ty->getIntegerBitWidth();
2796 uint64_t Val = 1ULL << (BitWidth - 1);
2797 return ConstantInt::get(Ty, APInt(BitWidth, Val, /*IsSigned=*/false));
2798 }
2799
2800 APFloat::roundingMode RMode =
2802 bool IsFTZ = nvvm::FPToIntegerIntrinsicShouldFTZ(IntrinsicID);
2803 bool IsSigned = nvvm::FPToIntegerIntrinsicResultIsSigned(IntrinsicID);
2804
2805 APSInt ResInt(Ty->getIntegerBitWidth(), !IsSigned);
2806 auto FloatToRound = IsFTZ ? FTZPreserveSign(U) : U;
2807
2808 // Return max/min value for integers if the result is +/-inf or
2809 // is too large to fit in the result's integer bitwidth.
2810 bool IsExact = false;
2811 FloatToRound.convertToInteger(ResInt, RMode, &IsExact);
2812 return ConstantInt::get(Ty, ResInt);
2813 }
2814 }
2815
2816 /// We only fold functions with finite arguments. Folding NaN and inf is
2817 /// likely to be aborted with an exception anyway, and some host libms
2818 /// have known errors raising exceptions.
2819 if (!U.isFinite())
2820 return nullptr;
2821
2822 /// Currently APFloat versions of these functions do not exist, so we use
2823 /// the host native double versions. Float versions are not called
2824 /// directly but for all these it is true (float)(f((double)arg)) ==
2825 /// f(arg). Long double not supported yet.
2826 const APFloat &APF = Op->getValueAPF();
2827
2828 switch (IntrinsicID) {
2829 default: break;
2830 case Intrinsic::log:
2831 if (U.isZero())
2832 return ConstantFP::getInfinity(Ty, true);
2833 if (U.isNegative())
2834 return ConstantFP::getNaN(Ty);
2835 if (U.isExactlyValue(1.0))
2836 return ConstantFP::getZero(Ty);
2837 return ConstantFoldFP(log, APF, Ty);
2838 case Intrinsic::log2:
2839 if (U.isZero())
2840 return ConstantFP::getInfinity(Ty, true);
2841 if (U.isNegative())
2842 return ConstantFP::getNaN(Ty);
2843 if (U.isExactlyValue(1.0))
2844 return ConstantFP::getZero(Ty);
2845 // TODO: What about hosts that lack a C99 library?
2846 return ConstantFoldFP(log2, APF, Ty);
2847 case Intrinsic::log10:
2848 if (U.isZero())
2849 return ConstantFP::getInfinity(Ty, true);
2850 if (U.isNegative())
2851 return ConstantFP::getNaN(Ty);
2852 if (U.isExactlyValue(1.0))
2853 return ConstantFP::getZero(Ty);
2854 // TODO: What about hosts that lack a C99 library?
2855 return ConstantFoldFP(log10, APF, Ty);
2856 case Intrinsic::exp:
2857 return ConstantFoldFP(exp, APF, Ty);
2858 case Intrinsic::exp2:
2859 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2860 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2861 case Intrinsic::exp10:
2862 // Fold exp10(x) as pow(10, x), in case the host lacks a C99 library.
2863 return ConstantFoldBinaryFP(pow, APFloat(10.0), APF, Ty);
2864 case Intrinsic::sin:
2865 return ConstantFoldFP(sin, APF, Ty);
2866 case Intrinsic::cos:
2867 return ConstantFoldFP(cos, APF, Ty);
2868 case Intrinsic::sinh:
2869 return ConstantFoldFP(sinh, APF, Ty);
2870 case Intrinsic::cosh:
2871 return ConstantFoldFP(cosh, APF, Ty);
2872 case Intrinsic::atan:
2873 // Implement optional behavior from C's Annex F for +/-0.0.
2874 if (U.isZero())
2875 return ConstantFP::get(Ty, U);
2876 return ConstantFoldFP(atan, APF, Ty);
2877 case Intrinsic::sqrt:
2878 return ConstantFoldFP(sqrt, APF, Ty);
2879
2880 // NVVM Intrinsics:
2881 case Intrinsic::nvvm_ceil_ftz_f:
2882 case Intrinsic::nvvm_ceil_f:
2883 case Intrinsic::nvvm_ceil_d:
2884 return ConstantFoldFP(
2885 ceil, APF, Ty,
2887 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2888
2889 case Intrinsic::nvvm_fabs_ftz:
2890 case Intrinsic::nvvm_fabs:
2891 return ConstantFoldFP(
2892 fabs, APF, Ty,
2894 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2895
2896 case Intrinsic::nvvm_floor_ftz_f:
2897 case Intrinsic::nvvm_floor_f:
2898 case Intrinsic::nvvm_floor_d:
2899 return ConstantFoldFP(
2900 floor, APF, Ty,
2902 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2903
2904 case Intrinsic::nvvm_rcp_rm_ftz_f:
2905 case Intrinsic::nvvm_rcp_rn_ftz_f:
2906 case Intrinsic::nvvm_rcp_rp_ftz_f:
2907 case Intrinsic::nvvm_rcp_rz_ftz_f:
2908 case Intrinsic::nvvm_rcp_rm_d:
2909 case Intrinsic::nvvm_rcp_rm_f:
2910 case Intrinsic::nvvm_rcp_rn_d:
2911 case Intrinsic::nvvm_rcp_rn_f:
2912 case Intrinsic::nvvm_rcp_rp_d:
2913 case Intrinsic::nvvm_rcp_rp_f:
2914 case Intrinsic::nvvm_rcp_rz_d:
2915 case Intrinsic::nvvm_rcp_rz_f: {
2916 APFloat::roundingMode RoundMode = nvvm::GetRCPRoundingMode(IntrinsicID);
2917 bool IsFTZ = nvvm::RCPShouldFTZ(IntrinsicID);
2918
2919 auto Denominator = IsFTZ ? FTZPreserveSign(APF) : APF;
2921 APFloat::opStatus Status = Res.divide(Denominator, RoundMode);
2922
2924 if (IsFTZ)
2925 Res = FTZPreserveSign(Res);
2926 return ConstantFP::get(Ty, Res);
2927 }
2928 return nullptr;
2929 }
2930
2931 case Intrinsic::nvvm_round_ftz_f:
2932 case Intrinsic::nvvm_round_f:
2933 case Intrinsic::nvvm_round_d: {
2934 // nvvm_round is lowered to PTX cvt.rni, which will round to nearest
2935 // integer, choosing even integer if source is equidistant between two
2936 // integers, so the semantics are closer to "rint" rather than "round".
2937 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2938 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2940 return ConstantFP::get(Ty, V);
2941 }
2942
2943 case Intrinsic::nvvm_saturate_ftz_f:
2944 case Intrinsic::nvvm_saturate_d:
2945 case Intrinsic::nvvm_saturate_f: {
2946 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2947 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2948 if (V.isNegative() || V.isZero() || V.isNaN())
2949 return ConstantFP::getZero(Ty);
2951 if (V > One)
2952 return ConstantFP::get(Ty, One);
2953 return ConstantFP::get(Ty, APF);
2954 }
2955
2956 case Intrinsic::nvvm_sqrt_rn_ftz_f:
2957 case Intrinsic::nvvm_sqrt_f:
2958 case Intrinsic::nvvm_sqrt_rn_d:
2959 case Intrinsic::nvvm_sqrt_rn_f:
2960 if (APF.isNegative())
2961 return nullptr;
2962 return ConstantFoldFP(
2963 sqrt, APF, Ty,
2965 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2966
2967 // AMDGCN Intrinsics:
2968 case Intrinsic::amdgcn_cos:
2969 case Intrinsic::amdgcn_sin: {
2970 double V = getValueAsDouble(Op);
2971 if (V < -256.0 || V > 256.0)
2972 // The gfx8 and gfx9 architectures handle arguments outside the range
2973 // [-256, 256] differently. This should be a rare case so bail out
2974 // rather than trying to handle the difference.
2975 return nullptr;
2976 bool IsCos = IntrinsicID == Intrinsic::amdgcn_cos;
2977 double V4 = V * 4.0;
2978 if (V4 == floor(V4)) {
2979 // Force exact results for quarter-integer inputs.
2980 const double SinVals[4] = { 0.0, 1.0, 0.0, -1.0 };
2981 V = SinVals[((int)V4 + (IsCos ? 1 : 0)) & 3];
2982 } else {
2983 if (IsCos)
2984 V = cos(V * 2.0 * numbers::pi);
2985 else
2986 V = sin(V * 2.0 * numbers::pi);
2987 }
2988 return GetConstantFoldFPValue(V, Ty);
2989 }
2990 }
2991
2992 if (!TLI)
2993 return nullptr;
2994
2995 LibFunc Func = NotLibFunc;
2996 if (!TLI->getLibFunc(Name, Func))
2997 return nullptr;
2998
2999 switch (Func) {
3000 default:
3001 break;
3002 case LibFunc_acos:
3003 case LibFunc_acosf:
3004 case LibFunc_acos_finite:
3005 case LibFunc_acosf_finite:
3006 if (TLI->has(Func))
3007 return ConstantFoldFP(acos, APF, Ty);
3008 break;
3009 case LibFunc_asin:
3010 case LibFunc_asinf:
3011 case LibFunc_asin_finite:
3012 case LibFunc_asinf_finite:
3013 if (TLI->has(Func))
3014 return ConstantFoldFP(asin, APF, Ty);
3015 break;
3016 case LibFunc_atan:
3017 case LibFunc_atanf:
3018 // Implement optional behavior from C's Annex F for +/-0.0.
3019 if (U.isZero())
3020 return ConstantFP::get(Ty, U);
3021 if (TLI->has(Func))
3022 return ConstantFoldFP(atan, APF, Ty);
3023 break;
3024 case LibFunc_ceil:
3025 case LibFunc_ceilf:
3026 if (TLI->has(Func)) {
3027 U.roundToIntegral(APFloat::rmTowardPositive);
3028 return ConstantFP::get(Ty, U);
3029 }
3030 break;
3031 case LibFunc_cos:
3032 case LibFunc_cosf:
3033 if (TLI->has(Func))
3034 return ConstantFoldFP(cos, APF, Ty);
3035 break;
3036 case LibFunc_cosh:
3037 case LibFunc_coshf:
3038 case LibFunc_cosh_finite:
3039 case LibFunc_coshf_finite:
3040 if (TLI->has(Func))
3041 return ConstantFoldFP(cosh, APF, Ty);
3042 break;
3043 case LibFunc_exp:
3044 case LibFunc_expf:
3045 case LibFunc_exp_finite:
3046 case LibFunc_expf_finite:
3047 if (TLI->has(Func))
3048 return ConstantFoldFP(exp, APF, Ty);
3049 break;
3050 case LibFunc_exp2:
3051 case LibFunc_exp2f:
3052 case LibFunc_exp2_finite:
3053 case LibFunc_exp2f_finite:
3054 if (TLI->has(Func))
3055 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
3056 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
3057 break;
3058 case LibFunc_fabs:
3059 case LibFunc_fabsf:
3060 if (TLI->has(Func)) {
3061 U.clearSign();
3062 return ConstantFP::get(Ty, U);
3063 }
3064 break;
3065 case LibFunc_floor:
3066 case LibFunc_floorf:
3067 if (TLI->has(Func)) {
3068 U.roundToIntegral(APFloat::rmTowardNegative);
3069 return ConstantFP::get(Ty, U);
3070 }
3071 break;
3072 case LibFunc_log:
3073 case LibFunc_logf:
3074 case LibFunc_log_finite:
3075 case LibFunc_logf_finite:
3076 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3077 return ConstantFoldFP(log, APF, Ty);
3078 break;
3079 case LibFunc_log2:
3080 case LibFunc_log2f:
3081 case LibFunc_log2_finite:
3082 case LibFunc_log2f_finite:
3083 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3084 // TODO: What about hosts that lack a C99 library?
3085 return ConstantFoldFP(log2, APF, Ty);
3086 break;
3087 case LibFunc_log10:
3088 case LibFunc_log10f:
3089 case LibFunc_log10_finite:
3090 case LibFunc_log10f_finite:
3091 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3092 // TODO: What about hosts that lack a C99 library?
3093 return ConstantFoldFP(log10, APF, Ty);
3094 break;
3095 case LibFunc_ilogb:
3096 case LibFunc_ilogbf:
3097 if (!APF.isZero() && TLI->has(Func))
3098 return ConstantInt::get(Ty, ilogb(APF), true);
3099 break;
3100 case LibFunc_logb:
3101 case LibFunc_logbf:
3102 if (!APF.isZero() && TLI->has(Func))
3103 return ConstantFoldFP(logb, APF, Ty);
3104 break;
3105 case LibFunc_log1p:
3106 case LibFunc_log1pf:
3107 // Implement optional behavior from C's Annex F for +/-0.0.
3108 if (U.isZero())
3109 return ConstantFP::get(Ty, U);
3110 if (APF > APFloat::getOne(APF.getSemantics(), true) && TLI->has(Func))
3111 return ConstantFoldFP(log1p, APF, Ty);
3112 break;
3113 case LibFunc_logl:
3114 return nullptr;
3115 case LibFunc_erf:
3116 case LibFunc_erff:
3117 if (TLI->has(Func))
3118 return ConstantFoldFP(erf, APF, Ty);
3119 break;
3120 case LibFunc_nearbyint:
3121 case LibFunc_nearbyintf:
3122 case LibFunc_rint:
3123 case LibFunc_rintf:
3124 case LibFunc_roundeven:
3125 case LibFunc_roundevenf:
3126 if (TLI->has(Func)) {
3127 U.roundToIntegral(APFloat::rmNearestTiesToEven);
3128 return ConstantFP::get(Ty, U);
3129 }
3130 break;
3131 case LibFunc_round:
3132 case LibFunc_roundf:
3133 if (TLI->has(Func)) {
3134 U.roundToIntegral(APFloat::rmNearestTiesToAway);
3135 return ConstantFP::get(Ty, U);
3136 }
3137 break;
3138 case LibFunc_sin:
3139 case LibFunc_sinf:
3140 if (TLI->has(Func))
3141 return ConstantFoldFP(sin, APF, Ty);
3142 break;
3143 case LibFunc_sinh:
3144 case LibFunc_sinhf:
3145 case LibFunc_sinh_finite:
3146 case LibFunc_sinhf_finite:
3147 if (TLI->has(Func))
3148 return ConstantFoldFP(sinh, APF, Ty);
3149 break;
3150 case LibFunc_sqrt:
3151 case LibFunc_sqrtf:
3152 if (!APF.isNegative() && TLI->has(Func))
3153 return ConstantFoldFP(sqrt, APF, Ty);
3154 break;
3155 case LibFunc_tan:
3156 case LibFunc_tanf:
3157 if (TLI->has(Func))
3158 return ConstantFoldFP(tan, APF, Ty);
3159 break;
3160 case LibFunc_tanh:
3161 case LibFunc_tanhf:
3162 if (TLI->has(Func))
3163 return ConstantFoldFP(tanh, APF, Ty);
3164 break;
3165 case LibFunc_trunc:
3166 case LibFunc_truncf:
3167 if (TLI->has(Func)) {
3168 U.roundToIntegral(APFloat::rmTowardZero);
3169 return ConstantFP::get(Ty, U);
3170 }
3171 break;
3172 }
3173 return nullptr;
3174 }
3175
3176 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
3177 switch (IntrinsicID) {
3178 case Intrinsic::bswap:
3179 return ConstantInt::get(Ty->getContext(), Op->getValue().byteSwap());
3180 case Intrinsic::ctpop:
3181 return ConstantInt::get(Ty, Op->getValue().popcount());
3182 case Intrinsic::bitreverse:
3183 return ConstantInt::get(Ty->getContext(), Op->getValue().reverseBits());
3184 case Intrinsic::amdgcn_s_wqm: {
3185 uint64_t Val = Op->getZExtValue();
3186 Val |= (Val & 0x5555555555555555ULL) << 1 |
3187 ((Val >> 1) & 0x5555555555555555ULL);
3188 Val |= (Val & 0x3333333333333333ULL) << 2 |
3189 ((Val >> 2) & 0x3333333333333333ULL);
3190 return ConstantInt::get(Ty, Val);
3191 }
3192
3193 case Intrinsic::amdgcn_s_quadmask: {
3194 uint64_t Val = Op->getZExtValue();
3195 uint64_t QuadMask = 0;
3196 for (unsigned I = 0; I < Op->getBitWidth() / 4; ++I, Val >>= 4) {
3197 if (!(Val & 0xF))
3198 continue;
3199
3200 QuadMask |= (1ULL << I);
3201 }
3202 return ConstantInt::get(Ty, QuadMask);
3203 }
3204
3205 case Intrinsic::amdgcn_s_bitreplicate: {
3206 uint64_t Val = Op->getZExtValue();
3207 Val = (Val & 0x000000000000FFFFULL) | (Val & 0x00000000FFFF0000ULL) << 16;
3208 Val = (Val & 0x000000FF000000FFULL) | (Val & 0x0000FF000000FF00ULL) << 8;
3209 Val = (Val & 0x000F000F000F000FULL) | (Val & 0x00F000F000F000F0ULL) << 4;
3210 Val = (Val & 0x0303030303030303ULL) | (Val & 0x0C0C0C0C0C0C0C0CULL) << 2;
3211 Val = (Val & 0x1111111111111111ULL) | (Val & 0x2222222222222222ULL) << 1;
3212 Val = Val | Val << 1;
3213 return ConstantInt::get(Ty, Val);
3214 }
3215 }
3216 }
3217
3218 if (Operands[0]->getType()->isVectorTy()) {
3219 auto *Op = cast<Constant>(Operands[0]);
3220 switch (IntrinsicID) {
3221 default: break;
3222 case Intrinsic::vector_reduce_add:
3223 case Intrinsic::vector_reduce_mul:
3224 case Intrinsic::vector_reduce_and:
3225 case Intrinsic::vector_reduce_or:
3226 case Intrinsic::vector_reduce_xor:
3227 case Intrinsic::vector_reduce_smin:
3228 case Intrinsic::vector_reduce_smax:
3229 case Intrinsic::vector_reduce_umin:
3230 case Intrinsic::vector_reduce_umax:
3231 if (Constant *C = constantFoldVectorReduce(IntrinsicID, Operands[0]))
3232 return C;
3233 break;
3234 case Intrinsic::x86_sse_cvtss2si:
3235 case Intrinsic::x86_sse_cvtss2si64:
3236 case Intrinsic::x86_sse2_cvtsd2si:
3237 case Intrinsic::x86_sse2_cvtsd2si64:
3238 if (ConstantFP *FPOp =
3239 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3240 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3241 /*roundTowardZero=*/false, Ty,
3242 /*IsSigned*/true);
3243 break;
3244 case Intrinsic::x86_sse_cvttss2si:
3245 case Intrinsic::x86_sse_cvttss2si64:
3246 case Intrinsic::x86_sse2_cvttsd2si:
3247 case Intrinsic::x86_sse2_cvttsd2si64:
3248 if (ConstantFP *FPOp =
3249 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3250 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3251 /*roundTowardZero=*/true, Ty,
3252 /*IsSigned*/true);
3253 break;
3254
3255 case Intrinsic::wasm_anytrue:
3256 return Op->isNullValue() ? ConstantInt::get(Ty, 0)
3257 : ConstantInt::get(Ty, 1);
3258
3259 case Intrinsic::wasm_alltrue:
3260 // Check each element individually
3261 unsigned E = cast<FixedVectorType>(Op->getType())->getNumElements();
3262 for (unsigned I = 0; I != E; ++I) {
3263 Constant *Elt = Op->getAggregateElement(I);
3264 // Return false as soon as we find a non-true element.
3265 if (Elt && Elt->isNullValue())
3266 return ConstantInt::get(Ty, 0);
3267 // Bail as soon as we find an element we cannot prove to be true.
3268 if (!Elt || !isa<ConstantInt>(Elt))
3269 return nullptr;
3270 }
3271
3272 return ConstantInt::get(Ty, 1);
3273 }
3274 }
3275
3276 return nullptr;
3277}
3278
3279static Constant *evaluateCompare(const APFloat &Op1, const APFloat &Op2,
3283 FCmpInst::Predicate Cond = FCmp->getPredicate();
3284 if (FCmp->isSignaling()) {
3285 if (Op1.isNaN() || Op2.isNaN())
3287 } else {
3288 if (Op1.isSignaling() || Op2.isSignaling())
3290 }
3291 bool Result = FCmpInst::compare(Op1, Op2, Cond);
3292 if (mayFoldConstrained(const_cast<ConstrainedFPCmpIntrinsic *>(FCmp), St))
3293 return ConstantInt::get(Call->getType()->getScalarType(), Result);
3294 return nullptr;
3295}
3296
3297static Constant *ConstantFoldNextToward(const APFloat &Op0, const APFloat &Op1,
3298 const Type *RetTy) {
3299 assert(RetTy != nullptr);
3300 bool LosesInfo;
3301
3302 if (Op1.isSignaling())
3303 return nullptr;
3304 if (Op1.isNaN()) {
3305 APFloat Ret(Op1);
3306 Ret.convert(RetTy->getFltSemantics(), detail::rmNearestTiesToEven,
3307 &LosesInfo);
3308 return ConstantFP::get(RetTy->getContext(), Ret);
3309 }
3310
3311 // Recall that the second argument of nexttoward is always a long double,
3312 // so we may need to promote the first argument for comparisons to be valid.
3313 APFloat PromotedOp0(Op0);
3314 PromotedOp0.convert(Op1.getSemantics(), detail::rmNearestTiesToEven,
3315 &LosesInfo);
3316 assert(!LosesInfo && "Unexpected lossy promotion");
3317 const APFloat::cmpResult Result = PromotedOp0.compare(Op1);
3318
3319 // When equal, the standard says we must return the second argument.
3320 // This allows nice behavior such as nexttoward(0.0, -0.0) = -0.0 and
3321 // nexttoward(-0.0, 0.0) = 0.0
3322 if (Result == detail::cmpEqual) {
3323 APFloat Ret(Op1);
3324 Ret.convert(RetTy->getFltSemantics(), detail::rmNearestTiesToEven,
3325 &LosesInfo);
3326 return ConstantFP::get(RetTy->getContext(), Ret);
3327 }
3328
3329 APFloat Next(Op0);
3330 Next.next(/*nextDown=*/Result == APFloat::cmpGreaterThan);
3331 if (Next.isZero() || Next.isDenormal() || Next.isSignaling())
3332 return nullptr;
3333 return ConstantFP::get(RetTy->getContext(), Next);
3334}
3335
3336static Constant *ConstantFoldLibCall2(StringRef Name, Type *Ty,
3337 ArrayRef<Constant *> Operands,
3338 const TargetLibraryInfo *TLI) {
3339 if (!TLI)
3340 return nullptr;
3341
3342 LibFunc Func = NotLibFunc;
3343 if (!TLI->getLibFunc(Name, Func))
3344 return nullptr;
3345
3346 const auto *Op1 = dyn_cast<ConstantFP>(Operands[0]);
3347 if (!Op1)
3348 return nullptr;
3349
3350 const auto *Op2 = dyn_cast<ConstantFP>(Operands[1]);
3351 if (!Op2)
3352 return nullptr;
3353
3354 const APFloat &Op1V = Op1->getValueAPF();
3355 const APFloat &Op2V = Op2->getValueAPF();
3356
3357 switch (Func) {
3358 default:
3359 break;
3360 case LibFunc_pow:
3361 case LibFunc_powf:
3362 case LibFunc_pow_finite:
3363 case LibFunc_powf_finite:
3364 if (TLI->has(Func))
3365 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3366 break;
3367 case LibFunc_fmod:
3368 case LibFunc_fmodf:
3369 if (TLI->has(Func)) {
3370 APFloat V = Op1->getValueAPF();
3371 if (APFloat::opStatus::opOK == V.mod(Op2->getValueAPF()))
3372 return ConstantFP::get(Ty, V);
3373 }
3374 break;
3375 case LibFunc_remainder:
3376 case LibFunc_remainderf:
3377 if (TLI->has(Func)) {
3378 APFloat V = Op1->getValueAPF();
3379 if (APFloat::opStatus::opOK == V.remainder(Op2->getValueAPF()))
3380 return ConstantFP::get(Ty, V);
3381 }
3382 break;
3383 case LibFunc_atan2:
3384 case LibFunc_atan2f:
3385 // atan2(+/-0.0, +/-0.0) is known to raise an exception on some libm
3386 // (Solaris), so we do not assume a known result for that.
3387 if (Op1V.isZero() && Op2V.isZero())
3388 return nullptr;
3389 [[fallthrough]];
3390 case LibFunc_atan2_finite:
3391 case LibFunc_atan2f_finite:
3392 if (TLI->has(Func))
3393 return ConstantFoldBinaryFP(atan2, Op1V, Op2V, Ty);
3394 break;
3395 case LibFunc_nextafter:
3396 case LibFunc_nextafterf:
3397 case LibFunc_nexttoward:
3398 case LibFunc_nexttowardf:
3399 if (TLI->has(Func))
3400 return ConstantFoldNextToward(Op1V, Op2V, Ty);
3401 break;
3402 }
3403
3404 return nullptr;
3405}
3406
3407static Constant *ConstantFoldIntrinsicCall2(Intrinsic::ID IntrinsicID, Type *Ty,
3408 ArrayRef<Constant *> Operands,
3409 const CallBase *Call) {
3410 assert(Operands.size() == 2 && "Wrong number of operands.");
3411
3412 if (Ty->isFloatingPointTy()) {
3413 // TODO: We should have undef handling for all of the FP intrinsics that
3414 // are attempted to be folded in this function.
3415 bool IsOp0Undef = isa<UndefValue>(Operands[0]);
3416 bool IsOp1Undef = isa<UndefValue>(Operands[1]);
3417 switch (IntrinsicID) {
3418 case Intrinsic::maxnum:
3419 case Intrinsic::minnum:
3420 case Intrinsic::maximum:
3421 case Intrinsic::minimum:
3422 case Intrinsic::maximumnum:
3423 case Intrinsic::minimumnum:
3424 case Intrinsic::nvvm_fmax_d:
3425 case Intrinsic::nvvm_fmin_d:
3426 // If one argument is undef, return the other argument.
3427 if (IsOp0Undef)
3428 return Operands[1];
3429 if (IsOp1Undef)
3430 return Operands[0];
3431 break;
3432
3433 case Intrinsic::nvvm_fmax_f:
3434 case Intrinsic::nvvm_fmax_ftz_f:
3435 case Intrinsic::nvvm_fmax_ftz_nan_f:
3436 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3437 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3438 case Intrinsic::nvvm_fmax_nan_f:
3439 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3440 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3441
3442 case Intrinsic::nvvm_fmin_f:
3443 case Intrinsic::nvvm_fmin_ftz_f:
3444 case Intrinsic::nvvm_fmin_ftz_nan_f:
3445 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3446 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3447 case Intrinsic::nvvm_fmin_nan_f:
3448 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3449 case Intrinsic::nvvm_fmin_xorsign_abs_f:
3450 // If one arg is undef, the other arg can be returned only if it is
3451 // constant, as we may need to flush it to sign-preserving zero or
3452 // canonicalize the NaN.
3453 if (!IsOp0Undef && !IsOp1Undef)
3454 break;
3455 if (auto *Op = dyn_cast<ConstantFP>(Operands[IsOp0Undef ? 1 : 0])) {
3456 if (Op->isNaN()) {
3457 APInt NVCanonicalNaN(32, 0x7fffffff);
3458 return ConstantFP::get(
3459 Ty, APFloat(Ty->getFltSemantics(), NVCanonicalNaN));
3460 }
3461 if (nvvm::FMinFMaxShouldFTZ(IntrinsicID))
3462 return ConstantFP::get(Ty, FTZPreserveSign(Op->getValueAPF()));
3463 else
3464 return Op;
3465 }
3466 break;
3467 }
3468 }
3469
3470 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3471 const APFloat &Op1V = Op1->getValueAPF();
3472
3473 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3474 if (Op2->getType() != Op1->getType())
3475 return nullptr;
3476 const APFloat &Op2V = Op2->getValueAPF();
3477
3478 if (const auto *ConstrIntr =
3480 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3481 APFloat Res = Op1V;
3483 switch (IntrinsicID) {
3484 default:
3485 return nullptr;
3486 case Intrinsic::experimental_constrained_fadd:
3487 St = Res.add(Op2V, RM);
3488 break;
3489 case Intrinsic::experimental_constrained_fsub:
3490 St = Res.subtract(Op2V, RM);
3491 break;
3492 case Intrinsic::experimental_constrained_fmul:
3493 St = Res.multiply(Op2V, RM);
3494 break;
3495 case Intrinsic::experimental_constrained_fdiv:
3496 St = Res.divide(Op2V, RM);
3497 break;
3498 case Intrinsic::experimental_constrained_frem:
3499 St = Res.mod(Op2V);
3500 break;
3501 case Intrinsic::experimental_constrained_fcmp:
3502 case Intrinsic::experimental_constrained_fcmps:
3503 return evaluateCompare(Op1V, Op2V, ConstrIntr);
3504 }
3505 if (mayFoldConstrained(const_cast<ConstrainedFPIntrinsic *>(ConstrIntr),
3506 St))
3507 return ConstantFP::get(Ty, Res);
3508 return nullptr;
3509 }
3510
3511 switch (IntrinsicID) {
3512 default:
3513 break;
3514 case Intrinsic::copysign:
3515 return ConstantFP::get(Ty, APFloat::copySign(Op1V, Op2V));
3516 case Intrinsic::minnum:
3517 return ConstantFP::get(Ty, minnum(Op1V, Op2V));
3518 case Intrinsic::maxnum:
3519 return ConstantFP::get(Ty, maxnum(Op1V, Op2V));
3520 case Intrinsic::minimum:
3521 return ConstantFP::get(Ty, minimum(Op1V, Op2V));
3522 case Intrinsic::maximum:
3523 return ConstantFP::get(Ty, maximum(Op1V, Op2V));
3524 case Intrinsic::minimumnum:
3525 return ConstantFP::get(Ty, minimumnum(Op1V, Op2V));
3526 case Intrinsic::maximumnum:
3527 return ConstantFP::get(Ty, maximumnum(Op1V, Op2V));
3528
3529 case Intrinsic::nvvm_fmax_d:
3530 case Intrinsic::nvvm_fmax_f:
3531 case Intrinsic::nvvm_fmax_ftz_f:
3532 case Intrinsic::nvvm_fmax_ftz_nan_f:
3533 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3534 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3535 case Intrinsic::nvvm_fmax_nan_f:
3536 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3537 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3538
3539 case Intrinsic::nvvm_fmin_d:
3540 case Intrinsic::nvvm_fmin_f:
3541 case Intrinsic::nvvm_fmin_ftz_f:
3542 case Intrinsic::nvvm_fmin_ftz_nan_f:
3543 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3544 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3545 case Intrinsic::nvvm_fmin_nan_f:
3546 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3547 case Intrinsic::nvvm_fmin_xorsign_abs_f: {
3548
3549 bool ShouldCanonicalizeNaNs = !(IntrinsicID == Intrinsic::nvvm_fmax_d ||
3550 IntrinsicID == Intrinsic::nvvm_fmin_d);
3551 bool IsFTZ = nvvm::FMinFMaxShouldFTZ(IntrinsicID);
3552 bool IsNaNPropagating = nvvm::FMinFMaxPropagatesNaNs(IntrinsicID);
3553 bool IsXorSignAbs = nvvm::FMinFMaxIsXorSignAbs(IntrinsicID);
3554
3555 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3556 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3557
3558 bool XorSign = false;
3559 if (IsXorSignAbs) {
3560 XorSign = A.isNegative() ^ B.isNegative();
3561 A = abs(A);
3562 B = abs(B);
3563 }
3564
3565 bool IsFMax = false;
3566 switch (IntrinsicID) {
3567 case Intrinsic::nvvm_fmax_d:
3568 case Intrinsic::nvvm_fmax_f:
3569 case Intrinsic::nvvm_fmax_ftz_f:
3570 case Intrinsic::nvvm_fmax_ftz_nan_f:
3571 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3572 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3573 case Intrinsic::nvvm_fmax_nan_f:
3574 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3575 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3576 IsFMax = true;
3577 break;
3578 }
3579 APFloat Res =
3580 IsFMax ? (IsNaNPropagating ? maximum(A, B) : maximumnum(A, B))
3581 : (IsNaNPropagating ? minimum(A, B) : minimumnum(A, B));
3582
3583 if (ShouldCanonicalizeNaNs && Res.isNaN()) {
3584 APFloat NVCanonicalNaN(Res.getSemantics(), APInt(32, 0x7fffffff));
3585 return ConstantFP::get(Ty, NVCanonicalNaN);
3586 }
3587
3588 if (IsXorSignAbs && XorSign != Res.isNegative())
3589 Res.changeSign();
3590
3591 return ConstantFP::get(Ty, Res);
3592 }
3593
3594 case Intrinsic::nvvm_add_rm_f:
3595 case Intrinsic::nvvm_add_rn_f:
3596 case Intrinsic::nvvm_add_rp_f:
3597 case Intrinsic::nvvm_add_rz_f:
3598 case Intrinsic::nvvm_add_rm_d:
3599 case Intrinsic::nvvm_add_rn_d:
3600 case Intrinsic::nvvm_add_rp_d:
3601 case Intrinsic::nvvm_add_rz_d:
3602 case Intrinsic::nvvm_add_rm_ftz_f:
3603 case Intrinsic::nvvm_add_rn_ftz_f:
3604 case Intrinsic::nvvm_add_rp_ftz_f:
3605 case Intrinsic::nvvm_add_rz_ftz_f: {
3606
3607 bool IsFTZ = nvvm::FAddShouldFTZ(IntrinsicID);
3608 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3609 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3610
3611 APFloat::roundingMode RoundMode =
3612 nvvm::GetFAddRoundingMode(IntrinsicID);
3613
3614 APFloat Res = A;
3615 APFloat::opStatus Status = Res.add(B, RoundMode);
3616
3617 if (!Res.isNaN() &&
3619 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3620 return ConstantFP::get(Ty, Res);
3621 }
3622 return nullptr;
3623 }
3624
3625 case Intrinsic::nvvm_mul_rm_f:
3626 case Intrinsic::nvvm_mul_rn_f:
3627 case Intrinsic::nvvm_mul_rp_f:
3628 case Intrinsic::nvvm_mul_rz_f:
3629 case Intrinsic::nvvm_mul_rm_d:
3630 case Intrinsic::nvvm_mul_rn_d:
3631 case Intrinsic::nvvm_mul_rp_d:
3632 case Intrinsic::nvvm_mul_rz_d:
3633 case Intrinsic::nvvm_mul_rm_ftz_f:
3634 case Intrinsic::nvvm_mul_rn_ftz_f:
3635 case Intrinsic::nvvm_mul_rp_ftz_f:
3636 case Intrinsic::nvvm_mul_rz_ftz_f: {
3637
3638 bool IsFTZ = nvvm::FMulShouldFTZ(IntrinsicID);
3639 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3640 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3641
3642 APFloat::roundingMode RoundMode =
3643 nvvm::GetFMulRoundingMode(IntrinsicID);
3644
3645 APFloat Res = A;
3646 APFloat::opStatus Status = Res.multiply(B, RoundMode);
3647
3648 if (!Res.isNaN() &&
3650 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3651 return ConstantFP::get(Ty, Res);
3652 }
3653 return nullptr;
3654 }
3655
3656 case Intrinsic::nvvm_div_rm_f:
3657 case Intrinsic::nvvm_div_rn_f:
3658 case Intrinsic::nvvm_div_rp_f:
3659 case Intrinsic::nvvm_div_rz_f:
3660 case Intrinsic::nvvm_div_rm_d:
3661 case Intrinsic::nvvm_div_rn_d:
3662 case Intrinsic::nvvm_div_rp_d:
3663 case Intrinsic::nvvm_div_rz_d:
3664 case Intrinsic::nvvm_div_rm_ftz_f:
3665 case Intrinsic::nvvm_div_rn_ftz_f:
3666 case Intrinsic::nvvm_div_rp_ftz_f:
3667 case Intrinsic::nvvm_div_rz_ftz_f: {
3668 bool IsFTZ = nvvm::FDivShouldFTZ(IntrinsicID);
3669 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3670 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3671 APFloat::roundingMode RoundMode =
3672 nvvm::GetFDivRoundingMode(IntrinsicID);
3673
3674 APFloat Res = A;
3675 APFloat::opStatus Status = Res.divide(B, RoundMode);
3676 if (!Res.isNaN() &&
3678 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3679 return ConstantFP::get(Ty, Res);
3680 }
3681 return nullptr;
3682 }
3683 }
3684
3685 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy())
3686 return nullptr;
3687
3688 switch (IntrinsicID) {
3689 default:
3690 break;
3691 case Intrinsic::pow:
3692 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3693 case Intrinsic::amdgcn_fmul_legacy:
3694 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3695 // NaN or infinity, gives +0.0.
3696 if (Op1V.isZero() || Op2V.isZero())
3697 return ConstantFP::getZero(Ty);
3698 return ConstantFP::get(Ty, Op1V * Op2V);
3699 }
3700
3701 } else if (auto *Op2C = dyn_cast<ConstantInt>(Operands[1])) {
3702 switch (IntrinsicID) {
3703 case Intrinsic::ldexp: {
3704 return ConstantFP::get(
3705 Ty->getContext(),
3706 scalbn(Op1V, Op2C->getSExtValue(), APFloat::rmNearestTiesToEven));
3707 }
3708 case Intrinsic::is_fpclass: {
3709 FPClassTest Mask = static_cast<FPClassTest>(Op2C->getZExtValue());
3710 bool Result =
3711 ((Mask & fcSNan) && Op1V.isNaN() && Op1V.isSignaling()) ||
3712 ((Mask & fcQNan) && Op1V.isNaN() && !Op1V.isSignaling()) ||
3713 ((Mask & fcNegInf) && Op1V.isNegInfinity()) ||
3714 ((Mask & fcNegNormal) && Op1V.isNormal() && Op1V.isNegative()) ||
3715 ((Mask & fcNegSubnormal) && Op1V.isDenormal() && Op1V.isNegative()) ||
3716 ((Mask & fcNegZero) && Op1V.isZero() && Op1V.isNegative()) ||
3717 ((Mask & fcPosZero) && Op1V.isZero() && !Op1V.isNegative()) ||
3718 ((Mask & fcPosSubnormal) && Op1V.isDenormal() && !Op1V.isNegative()) ||
3719 ((Mask & fcPosNormal) && Op1V.isNormal() && !Op1V.isNegative()) ||
3720 ((Mask & fcPosInf) && Op1V.isPosInfinity());
3721 return ConstantInt::get(Ty, Result);
3722 }
3723 case Intrinsic::powi: {
3724 int Exp = static_cast<int>(Op2C->getSExtValue());
3725 switch (Ty->getTypeID()) {
3726 case Type::HalfTyID:
3727 case Type::FloatTyID: {
3728 APFloat Res(static_cast<float>(std::pow(Op1V.convertToFloat(), Exp)));
3729 if (Ty->isHalfTy()) {
3730 bool Unused;
3732 &Unused);
3733 }
3734 return ConstantFP::get(Ty, Res);
3735 }
3736 case Type::DoubleTyID:
3737 return ConstantFP::get(Ty, std::pow(Op1V.convertToDouble(), Exp));
3738 default:
3739 return nullptr;
3740 }
3741 }
3742 default:
3743 break;
3744 }
3745 }
3746 return nullptr;
3747 }
3748
3749 if (Operands[0]->getType()->isIntegerTy() &&
3750 Operands[1]->getType()->isIntegerTy()) {
3751 const APInt *C0, *C1;
3752 if (!getConstIntOrUndef(Operands[0], C0) ||
3753 !getConstIntOrUndef(Operands[1], C1))
3754 return nullptr;
3755
3756 switch (IntrinsicID) {
3757 default: break;
3758 case Intrinsic::smax:
3759 case Intrinsic::smin:
3760 case Intrinsic::umax:
3761 case Intrinsic::umin:
3762 if (!C0 && !C1)
3763 return UndefValue::get(Ty);
3764 if (!C0 || !C1)
3765 return MinMaxIntrinsic::getSaturationPoint(IntrinsicID, Ty);
3766 return ConstantInt::get(
3767 Ty, ICmpInst::compare(*C0, *C1,
3768 MinMaxIntrinsic::getPredicate(IntrinsicID))
3769 ? *C0
3770 : *C1);
3771
3772 case Intrinsic::scmp:
3773 case Intrinsic::ucmp:
3774 if (!C0 || !C1)
3775 return ConstantInt::get(Ty, 0);
3776
3777 int Res;
3778 if (IntrinsicID == Intrinsic::scmp)
3779 Res = C0->sgt(*C1) ? 1 : C0->slt(*C1) ? -1 : 0;
3780 else
3781 Res = C0->ugt(*C1) ? 1 : C0->ult(*C1) ? -1 : 0;
3782 return ConstantInt::get(Ty, Res, /*IsSigned=*/true);
3783
3784 case Intrinsic::usub_with_overflow:
3785 case Intrinsic::ssub_with_overflow:
3786 // X - undef -> { 0, false }
3787 // undef - X -> { 0, false }
3788 if (!C0 || !C1)
3789 return Constant::getNullValue(Ty);
3790 [[fallthrough]];
3791 case Intrinsic::uadd_with_overflow:
3792 case Intrinsic::sadd_with_overflow:
3793 // X + undef -> { -1, false }
3794 // undef + x -> { -1, false }
3795 if (!C0 || !C1) {
3796 return ConstantStruct::get(
3797 cast<StructType>(Ty),
3798 {Constant::getAllOnesValue(Ty->getStructElementType(0)),
3799 Constant::getNullValue(Ty->getStructElementType(1))});
3800 }
3801 [[fallthrough]];
3802 case Intrinsic::smul_with_overflow:
3803 case Intrinsic::umul_with_overflow: {
3804 // undef * X -> { 0, false }
3805 // X * undef -> { 0, false }
3806 if (!C0 || !C1)
3807 return Constant::getNullValue(Ty);
3808
3809 APInt Res;
3810 bool Overflow;
3811 switch (IntrinsicID) {
3812 default: llvm_unreachable("Invalid case");
3813 case Intrinsic::sadd_with_overflow:
3814 Res = C0->sadd_ov(*C1, Overflow);
3815 break;
3816 case Intrinsic::uadd_with_overflow:
3817 Res = C0->uadd_ov(*C1, Overflow);
3818 break;
3819 case Intrinsic::ssub_with_overflow:
3820 Res = C0->ssub_ov(*C1, Overflow);
3821 break;
3822 case Intrinsic::usub_with_overflow:
3823 Res = C0->usub_ov(*C1, Overflow);
3824 break;
3825 case Intrinsic::smul_with_overflow:
3826 Res = C0->smul_ov(*C1, Overflow);
3827 break;
3828 case Intrinsic::umul_with_overflow:
3829 Res = C0->umul_ov(*C1, Overflow);
3830 break;
3831 }
3832 Constant *Ops[] = {
3833 ConstantInt::get(Ty->getContext(), Res),
3834 ConstantInt::get(Type::getInt1Ty(Ty->getContext()), Overflow)
3835 };
3837 }
3838 case Intrinsic::uadd_sat:
3839 case Intrinsic::sadd_sat:
3840 if (!C0 && !C1)
3841 return UndefValue::get(Ty);
3842 if (!C0 || !C1)
3843 return Constant::getAllOnesValue(Ty);
3844 if (IntrinsicID == Intrinsic::uadd_sat)
3845 return ConstantInt::get(Ty, C0->uadd_sat(*C1));
3846 else
3847 return ConstantInt::get(Ty, C0->sadd_sat(*C1));
3848 case Intrinsic::usub_sat:
3849 case Intrinsic::ssub_sat:
3850 if (!C0 && !C1)
3851 return UndefValue::get(Ty);
3852 if (!C0 || !C1)
3853 return Constant::getNullValue(Ty);
3854 if (IntrinsicID == Intrinsic::usub_sat)
3855 return ConstantInt::get(Ty, C0->usub_sat(*C1));
3856 else
3857 return ConstantInt::get(Ty, C0->ssub_sat(*C1));
3858 case Intrinsic::cttz:
3859 case Intrinsic::ctlz:
3860 assert(C1 && "Must be constant int");
3861
3862 // cttz(0, 1) and ctlz(0, 1) are poison.
3863 if (C1->isOne() && (!C0 || C0->isZero()))
3864 return PoisonValue::get(Ty);
3865 if (!C0)
3866 return Constant::getNullValue(Ty);
3867 if (IntrinsicID == Intrinsic::cttz)
3868 return ConstantInt::get(Ty, C0->countr_zero());
3869 else
3870 return ConstantInt::get(Ty, C0->countl_zero());
3871
3872 case Intrinsic::abs:
3873 assert(C1 && "Must be constant int");
3874 assert((C1->isOne() || C1->isZero()) && "Must be 0 or 1");
3875
3876 // Undef or minimum val operand with poison min --> poison
3877 if (C1->isOne() && (!C0 || C0->isMinSignedValue()))
3878 return PoisonValue::get(Ty);
3879
3880 // Undef operand with no poison min --> 0 (sign bit must be clear)
3881 if (!C0)
3882 return Constant::getNullValue(Ty);
3883
3884 return ConstantInt::get(Ty, C0->abs());
3885 case Intrinsic::amdgcn_wave_reduce_umin:
3886 case Intrinsic::amdgcn_wave_reduce_umax:
3887 case Intrinsic::amdgcn_wave_reduce_max:
3888 case Intrinsic::amdgcn_wave_reduce_min:
3889 case Intrinsic::amdgcn_wave_reduce_and:
3890 case Intrinsic::amdgcn_wave_reduce_or:
3891 return Operands[0];
3892 }
3893
3894 return nullptr;
3895 }
3896
3897 // Support ConstantVector in case we have an Undef in the top.
3898 if ((isa<ConstantVector>(Operands[0]) ||
3899 isa<ConstantDataVector>(Operands[0])) &&
3900 // Check for default rounding mode.
3901 // FIXME: Support other rounding modes?
3902 isa<ConstantInt>(Operands[1]) &&
3903 cast<ConstantInt>(Operands[1])->getValue() == 4) {
3904 auto *Op = cast<Constant>(Operands[0]);
3905 switch (IntrinsicID) {
3906 default: break;
3907 case Intrinsic::x86_avx512_vcvtss2si32:
3908 case Intrinsic::x86_avx512_vcvtss2si64:
3909 case Intrinsic::x86_avx512_vcvtsd2si32:
3910 case Intrinsic::x86_avx512_vcvtsd2si64:
3911 if (ConstantFP *FPOp =
3912 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3913 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3914 /*roundTowardZero=*/false, Ty,
3915 /*IsSigned*/true);
3916 break;
3917 case Intrinsic::x86_avx512_vcvtss2usi32:
3918 case Intrinsic::x86_avx512_vcvtss2usi64:
3919 case Intrinsic::x86_avx512_vcvtsd2usi32:
3920 case Intrinsic::x86_avx512_vcvtsd2usi64:
3921 if (ConstantFP *FPOp =
3922 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3923 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3924 /*roundTowardZero=*/false, Ty,
3925 /*IsSigned*/false);
3926 break;
3927 case Intrinsic::x86_avx512_cvttss2si:
3928 case Intrinsic::x86_avx512_cvttss2si64:
3929 case Intrinsic::x86_avx512_cvttsd2si:
3930 case Intrinsic::x86_avx512_cvttsd2si64:
3931 if (ConstantFP *FPOp =
3932 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3933 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3934 /*roundTowardZero=*/true, Ty,
3935 /*IsSigned*/true);
3936 break;
3937 case Intrinsic::x86_avx512_cvttss2usi:
3938 case Intrinsic::x86_avx512_cvttss2usi64:
3939 case Intrinsic::x86_avx512_cvttsd2usi:
3940 case Intrinsic::x86_avx512_cvttsd2usi64:
3941 if (ConstantFP *FPOp =
3942 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3943 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3944 /*roundTowardZero=*/true, Ty,
3945 /*IsSigned*/false);
3946 break;
3947 }
3948 }
3949
3950 if (IntrinsicID == Intrinsic::experimental_cttz_elts) {
3951 auto *FVTy = dyn_cast<FixedVectorType>(Operands[0]->getType());
3952 bool ZeroIsPoison = cast<ConstantInt>(Operands[1])->isOne();
3953 if (!FVTy)
3954 return nullptr;
3955 unsigned Width = Ty->getIntegerBitWidth();
3956 if (APInt::getMaxValue(Width).ult(FVTy->getNumElements()))
3957 return PoisonValue::get(Ty);
3958 for (unsigned I = 0; I < FVTy->getNumElements(); ++I) {
3959 Constant *Elt = Operands[0]->getAggregateElement(I);
3960 if (!Elt)
3961 return nullptr;
3962 if (isa<UndefValue>(Elt) || Elt->isNullValue())
3963 continue;
3964 return ConstantInt::get(Ty, I);
3965 }
3966 if (ZeroIsPoison)
3967 return PoisonValue::get(Ty);
3968 return ConstantInt::get(Ty, FVTy->getNumElements());
3969 }
3970 return nullptr;
3971}
3972
3973static APFloat ConstantFoldAMDGCNCubeIntrinsic(Intrinsic::ID IntrinsicID,
3974 const APFloat &S0,
3975 const APFloat &S1,
3976 const APFloat &S2) {
3977 unsigned ID;
3978 const fltSemantics &Sem = S0.getSemantics();
3979 APFloat MA(Sem), SC(Sem), TC(Sem);
3980 if (abs(S2) >= abs(S0) && abs(S2) >= abs(S1)) {
3981 if (S2.isNegative() && S2.isNonZero() && !S2.isNaN()) {
3982 // S2 < 0
3983 ID = 5;
3984 SC = -S0;
3985 } else {
3986 ID = 4;
3987 SC = S0;
3988 }
3989 MA = S2;
3990 TC = -S1;
3991 } else if (abs(S1) >= abs(S0)) {
3992 if (S1.isNegative() && S1.isNonZero() && !S1.isNaN()) {
3993 // S1 < 0
3994 ID = 3;
3995 TC = -S2;
3996 } else {
3997 ID = 2;
3998 TC = S2;
3999 }
4000 MA = S1;
4001 SC = S0;
4002 } else {
4003 if (S0.isNegative() && S0.isNonZero() && !S0.isNaN()) {
4004 // S0 < 0
4005 ID = 1;
4006 SC = S2;
4007 } else {
4008 ID = 0;
4009 SC = -S2;
4010 }
4011 MA = S0;
4012 TC = -S1;
4013 }
4014 switch (IntrinsicID) {
4015 default:
4016 llvm_unreachable("unhandled amdgcn cube intrinsic");
4017 case Intrinsic::amdgcn_cubeid:
4018 return APFloat(Sem, ID);
4019 case Intrinsic::amdgcn_cubema:
4020 return MA + MA;
4021 case Intrinsic::amdgcn_cubesc:
4022 return SC;
4023 case Intrinsic::amdgcn_cubetc:
4024 return TC;
4025 }
4026}
4027
4028static Constant *ConstantFoldAMDGCNPermIntrinsic(ArrayRef<Constant *> Operands,
4029 Type *Ty) {
4030 const APInt *C0, *C1, *C2;
4031 if (!getConstIntOrUndef(Operands[0], C0) ||
4032 !getConstIntOrUndef(Operands[1], C1) ||
4033 !getConstIntOrUndef(Operands[2], C2))
4034 return nullptr;
4035
4036 if (!C2)
4037 return UndefValue::get(Ty);
4038
4039 APInt Val(32, 0);
4040 unsigned NumUndefBytes = 0;
4041 for (unsigned I = 0; I < 32; I += 8) {
4042 unsigned Sel = C2->extractBitsAsZExtValue(8, I);
4043 unsigned B = 0;
4044
4045 if (Sel >= 13)
4046 B = 0xff;
4047 else if (Sel == 12)
4048 B = 0x00;
4049 else {
4050 const APInt *Src = ((Sel & 10) == 10 || (Sel & 12) == 4) ? C0 : C1;
4051 if (!Src)
4052 ++NumUndefBytes;
4053 else if (Sel < 8)
4054 B = Src->extractBitsAsZExtValue(8, (Sel & 3) * 8);
4055 else
4056 B = Src->extractBitsAsZExtValue(1, (Sel & 1) ? 31 : 15) * 0xff;
4057 }
4058
4059 Val.insertBits(B, I, 8);
4060 }
4061
4062 if (NumUndefBytes == 4)
4063 return UndefValue::get(Ty);
4064
4065 return ConstantInt::get(Ty, Val);
4066}
4067
4068static Constant *ConstantFoldScalarCall3(StringRef Name,
4069 Intrinsic::ID IntrinsicID,
4070 Type *Ty,
4071 ArrayRef<Constant *> Operands,
4072 const TargetLibraryInfo *TLI,
4073 const CallBase *Call) {
4074 assert(Operands.size() == 3 && "Wrong number of operands.");
4075
4076 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
4077 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
4078 if (const auto *Op3 = dyn_cast<ConstantFP>(Operands[2])) {
4079 const APFloat &C1 = Op1->getValueAPF();
4080 const APFloat &C2 = Op2->getValueAPF();
4081 const APFloat &C3 = Op3->getValueAPF();
4082
4083 if (const auto *ConstrIntr = dyn_cast<ConstrainedFPIntrinsic>(Call)) {
4084 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
4085 APFloat Res = C1;
4087 switch (IntrinsicID) {
4088 default:
4089 return nullptr;
4090 case Intrinsic::experimental_constrained_fma:
4091 case Intrinsic::experimental_constrained_fmuladd:
4092 St = Res.fusedMultiplyAdd(C2, C3, RM);
4093 break;
4094 }
4095 if (mayFoldConstrained(
4096 const_cast<ConstrainedFPIntrinsic *>(ConstrIntr), St))
4097 return ConstantFP::get(Ty, Res);
4098 return nullptr;
4099 }
4100
4101 switch (IntrinsicID) {
4102 default: break;
4103 case Intrinsic::amdgcn_fma_legacy: {
4104 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
4105 // NaN or infinity, gives +0.0.
4106 if (C1.isZero() || C2.isZero()) {
4107 // It's tempting to just return C3 here, but that would give the
4108 // wrong result if C3 was -0.0.
4109 return ConstantFP::get(Ty, APFloat(0.0f) + C3);
4110 }
4111 [[fallthrough]];
4112 }
4113 case Intrinsic::fma:
4114 case Intrinsic::fmuladd: {
4115 APFloat V = C1;
4117 return ConstantFP::get(Ty, V);
4118 }
4119
4120 case Intrinsic::nvvm_fma_rm_f:
4121 case Intrinsic::nvvm_fma_rn_f:
4122 case Intrinsic::nvvm_fma_rp_f:
4123 case Intrinsic::nvvm_fma_rz_f:
4124 case Intrinsic::nvvm_fma_rm_d:
4125 case Intrinsic::nvvm_fma_rn_d:
4126 case Intrinsic::nvvm_fma_rp_d:
4127 case Intrinsic::nvvm_fma_rz_d:
4128 case Intrinsic::nvvm_fma_rm_ftz_f:
4129 case Intrinsic::nvvm_fma_rn_ftz_f:
4130 case Intrinsic::nvvm_fma_rp_ftz_f:
4131 case Intrinsic::nvvm_fma_rz_ftz_f: {
4132 bool IsFTZ = nvvm::FMAShouldFTZ(IntrinsicID);
4133 APFloat A = IsFTZ ? FTZPreserveSign(C1) : C1;
4134 APFloat B = IsFTZ ? FTZPreserveSign(C2) : C2;
4135 APFloat C = IsFTZ ? FTZPreserveSign(C3) : C3;
4136
4137 APFloat::roundingMode RoundMode =
4138 nvvm::GetFMARoundingMode(IntrinsicID);
4139
4140 APFloat Res = A;
4141 APFloat::opStatus Status = Res.fusedMultiplyAdd(B, C, RoundMode);
4142
4143 if (!Res.isNaN() &&
4145 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
4146 return ConstantFP::get(Ty, Res);
4147 }
4148 return nullptr;
4149 }
4150
4151 case Intrinsic::amdgcn_cubeid:
4152 case Intrinsic::amdgcn_cubema:
4153 case Intrinsic::amdgcn_cubesc:
4154 case Intrinsic::amdgcn_cubetc: {
4155 APFloat V = ConstantFoldAMDGCNCubeIntrinsic(IntrinsicID, C1, C2, C3);
4156 return ConstantFP::get(Ty, V);
4157 }
4158 }
4159 }
4160 }
4161 }
4162
4163 if (IntrinsicID == Intrinsic::smul_fix ||
4164 IntrinsicID == Intrinsic::smul_fix_sat) {
4165 const APInt *C0, *C1;
4166 if (!getConstIntOrUndef(Operands[0], C0) ||
4167 !getConstIntOrUndef(Operands[1], C1))
4168 return nullptr;
4169
4170 // undef * C -> 0
4171 // C * undef -> 0
4172 if (!C0 || !C1)
4173 return Constant::getNullValue(Ty);
4174
4175 // This code performs rounding towards negative infinity in case the result
4176 // cannot be represented exactly for the given scale. Targets that do care
4177 // about rounding should use a target hook for specifying how rounding
4178 // should be done, and provide their own folding to be consistent with
4179 // rounding. This is the same approach as used by
4180 // DAGTypeLegalizer::ExpandIntRes_MULFIX.
4181 unsigned Scale = cast<ConstantInt>(Operands[2])->getZExtValue();
4182 unsigned Width = C0->getBitWidth();
4183 assert(Scale < Width && "Illegal scale.");
4184 unsigned ExtendedWidth = Width * 2;
4185 APInt Product =
4186 (C0->sext(ExtendedWidth) * C1->sext(ExtendedWidth)).ashr(Scale);
4187 if (IntrinsicID == Intrinsic::smul_fix_sat) {
4188 APInt Max = APInt::getSignedMaxValue(Width).sext(ExtendedWidth);
4189 APInt Min = APInt::getSignedMinValue(Width).sext(ExtendedWidth);
4190 Product = APIntOps::smin(Product, Max);
4191 Product = APIntOps::smax(Product, Min);
4192 }
4193 return ConstantInt::get(Ty->getContext(), Product.sextOrTrunc(Width));
4194 }
4195
4196 if (IntrinsicID == Intrinsic::fshl || IntrinsicID == Intrinsic::fshr) {
4197 const APInt *C0, *C1, *C2;
4198 if (!getConstIntOrUndef(Operands[0], C0) ||
4199 !getConstIntOrUndef(Operands[1], C1) ||
4200 !getConstIntOrUndef(Operands[2], C2))
4201 return nullptr;
4202
4203 bool IsRight = IntrinsicID == Intrinsic::fshr;
4204 if (!C2)
4205 return Operands[IsRight ? 1 : 0];
4206 if (!C0 && !C1)
4207 return UndefValue::get(Ty);
4208
4209 // The shift amount is interpreted as modulo the bitwidth. If the shift
4210 // amount is effectively 0, avoid UB due to oversized inverse shift below.
4211 unsigned BitWidth = C2->getBitWidth();
4212 unsigned ShAmt = C2->urem(BitWidth);
4213 if (!ShAmt)
4214 return Operands[IsRight ? 1 : 0];
4215
4216 // (C0 << ShlAmt) | (C1 >> LshrAmt)
4217 unsigned LshrAmt = IsRight ? ShAmt : BitWidth - ShAmt;
4218 unsigned ShlAmt = !IsRight ? ShAmt : BitWidth - ShAmt;
4219 if (!C0)
4220 return ConstantInt::get(Ty, C1->lshr(LshrAmt));
4221 if (!C1)
4222 return ConstantInt::get(Ty, C0->shl(ShlAmt));
4223 return ConstantInt::get(Ty, C0->shl(ShlAmt) | C1->lshr(LshrAmt));
4224 }
4225
4226 if (IntrinsicID == Intrinsic::amdgcn_perm)
4227 return ConstantFoldAMDGCNPermIntrinsic(Operands, Ty);
4228
4229 return nullptr;
4230}
4231
4232static Constant *ConstantFoldScalarCall(StringRef Name,
4233 Intrinsic::ID IntrinsicID,
4234 Type *Ty,
4235 ArrayRef<Constant *> Operands,
4236 const TargetLibraryInfo *TLI,
4237 const CallBase *Call) {
4238 if (IntrinsicID != Intrinsic::not_intrinsic &&
4239 any_of(Operands, IsaPred<PoisonValue>) &&
4240 intrinsicPropagatesPoison(IntrinsicID))
4241 return PoisonValue::get(Ty);
4242
4243 if (Operands.size() == 1)
4244 return ConstantFoldScalarCall1(Name, IntrinsicID, Ty, Operands, TLI, Call);
4245
4246 if (Operands.size() == 2) {
4247 if (Constant *FoldedLibCall =
4248 ConstantFoldLibCall2(Name, Ty, Operands, TLI)) {
4249 return FoldedLibCall;
4250 }
4251 return ConstantFoldIntrinsicCall2(IntrinsicID, Ty, Operands, Call);
4252 }
4253
4254 if (Operands.size() == 3)
4255 return ConstantFoldScalarCall3(Name, IntrinsicID, Ty, Operands, TLI, Call);
4256
4257 return nullptr;
4258}
4259
4260static Constant *ConstantFoldFixedVectorCall(
4261 StringRef Name, Intrinsic::ID IntrinsicID, FixedVectorType *FVTy,
4262 ArrayRef<Constant *> Operands, const DataLayout &DL,
4263 const TargetLibraryInfo *TLI, const CallBase *Call) {
4265 SmallVector<Constant *, 4> Lane(Operands.size());
4266 Type *Ty = FVTy->getElementType();
4267
4268 switch (IntrinsicID) {
4269 case Intrinsic::masked_load: {
4270 auto *SrcPtr = Operands[0];
4271 auto *Mask = Operands[1];
4272 auto *Passthru = Operands[2];
4273
4274 Constant *VecData = ConstantFoldLoadFromConstPtr(SrcPtr, FVTy, DL);
4275
4276 SmallVector<Constant *, 32> NewElements;
4277 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4278 auto *MaskElt = Mask->getAggregateElement(I);
4279 if (!MaskElt)
4280 break;
4281 auto *PassthruElt = Passthru->getAggregateElement(I);
4282 auto *VecElt = VecData ? VecData->getAggregateElement(I) : nullptr;
4283 if (isa<UndefValue>(MaskElt)) {
4284 if (PassthruElt)
4285 NewElements.push_back(PassthruElt);
4286 else if (VecElt)
4287 NewElements.push_back(VecElt);
4288 else
4289 return nullptr;
4290 }
4291 if (MaskElt->isNullValue()) {
4292 if (!PassthruElt)
4293 return nullptr;
4294 NewElements.push_back(PassthruElt);
4295 } else if (MaskElt->isOneValue()) {
4296 if (!VecElt)
4297 return nullptr;
4298 NewElements.push_back(VecElt);
4299 } else {
4300 return nullptr;
4301 }
4302 }
4303 if (NewElements.size() != FVTy->getNumElements())
4304 return nullptr;
4305 return ConstantVector::get(NewElements);
4306 }
4307 case Intrinsic::arm_mve_vctp8:
4308 case Intrinsic::arm_mve_vctp16:
4309 case Intrinsic::arm_mve_vctp32:
4310 case Intrinsic::arm_mve_vctp64: {
4311 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
4312 unsigned Lanes = FVTy->getNumElements();
4313 uint64_t Limit = Op->getZExtValue();
4314
4316 for (unsigned i = 0; i < Lanes; i++) {
4317 if (i < Limit)
4319 else
4321 }
4322 return ConstantVector::get(NCs);
4323 }
4324 return nullptr;
4325 }
4326 case Intrinsic::get_active_lane_mask: {
4327 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4328 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4329 if (Op0 && Op1) {
4330 unsigned Lanes = FVTy->getNumElements();
4331 uint64_t Base = Op0->getZExtValue();
4332 uint64_t Limit = Op1->getZExtValue();
4333
4335 for (unsigned i = 0; i < Lanes; i++) {
4336 if (Base + i < Limit)
4338 else
4340 }
4341 return ConstantVector::get(NCs);
4342 }
4343 return nullptr;
4344 }
4345 case Intrinsic::vector_extract: {
4346 auto *Idx = dyn_cast<ConstantInt>(Operands[1]);
4347 Constant *Vec = Operands[0];
4348 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4349 return nullptr;
4350
4351 unsigned NumElements = FVTy->getNumElements();
4352 unsigned VecNumElements =
4353 cast<FixedVectorType>(Vec->getType())->getNumElements();
4354 unsigned StartingIndex = Idx->getZExtValue();
4355
4356 // Extracting entire vector is nop
4357 if (NumElements == VecNumElements && StartingIndex == 0)
4358 return Vec;
4359
4360 for (unsigned I = StartingIndex, E = StartingIndex + NumElements; I < E;
4361 ++I) {
4362 Constant *Elt = Vec->getAggregateElement(I);
4363 if (!Elt)
4364 return nullptr;
4365 Result[I - StartingIndex] = Elt;
4366 }
4367
4368 return ConstantVector::get(Result);
4369 }
4370 case Intrinsic::vector_insert: {
4371 Constant *Vec = Operands[0];
4372 Constant *SubVec = Operands[1];
4373 auto *Idx = dyn_cast<ConstantInt>(Operands[2]);
4374 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4375 return nullptr;
4376
4377 unsigned SubVecNumElements =
4378 cast<FixedVectorType>(SubVec->getType())->getNumElements();
4379 unsigned VecNumElements =
4380 cast<FixedVectorType>(Vec->getType())->getNumElements();
4381 unsigned IdxN = Idx->getZExtValue();
4382 // Replacing entire vector with a subvec is nop
4383 if (SubVecNumElements == VecNumElements && IdxN == 0)
4384 return SubVec;
4385
4386 for (unsigned I = 0; I < VecNumElements; ++I) {
4387 Constant *Elt;
4388 if (I < IdxN + SubVecNumElements)
4389 Elt = SubVec->getAggregateElement(I - IdxN);
4390 else
4391 Elt = Vec->getAggregateElement(I);
4392 if (!Elt)
4393 return nullptr;
4394 Result[I] = Elt;
4395 }
4396 return ConstantVector::get(Result);
4397 }
4398 case Intrinsic::vector_interleave2:
4399 case Intrinsic::vector_interleave3:
4400 case Intrinsic::vector_interleave4:
4401 case Intrinsic::vector_interleave5:
4402 case Intrinsic::vector_interleave6:
4403 case Intrinsic::vector_interleave7:
4404 case Intrinsic::vector_interleave8: {
4405 unsigned NumElements =
4406 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4407 unsigned NumOperands = Operands.size();
4408 for (unsigned I = 0; I < NumElements; ++I) {
4409 for (unsigned J = 0; J < NumOperands; ++J) {
4410 Constant *Elt = Operands[J]->getAggregateElement(I);
4411 if (!Elt)
4412 return nullptr;
4413 Result[NumOperands * I + J] = Elt;
4414 }
4415 }
4416 return ConstantVector::get(Result);
4417 }
4418 case Intrinsic::wasm_dot: {
4419 unsigned NumElements =
4420 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4421
4422 assert(NumElements == 8 && Result.size() == 4 &&
4423 "wasm dot takes i16x8 and produces i32x4");
4424 assert(Ty->isIntegerTy());
4425 int32_t MulVector[8];
4426
4427 for (unsigned I = 0; I < NumElements; ++I) {
4428 ConstantInt *Elt0 =
4429 cast<ConstantInt>(Operands[0]->getAggregateElement(I));
4430 ConstantInt *Elt1 =
4431 cast<ConstantInt>(Operands[1]->getAggregateElement(I));
4432
4433 MulVector[I] = Elt0->getSExtValue() * Elt1->getSExtValue();
4434 }
4435 for (unsigned I = 0; I < Result.size(); I++) {
4436 int64_t IAdd = (int64_t)MulVector[I * 2] + (int64_t)MulVector[I * 2 + 1];
4437 Result[I] = ConstantInt::getSigned(Ty, IAdd, /*ImplicitTrunc=*/true);
4438 }
4439
4440 return ConstantVector::get(Result);
4441 }
4442 default:
4443 break;
4444 }
4445
4446 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4447 // Gather a column of constants.
4448 for (unsigned J = 0, JE = Operands.size(); J != JE; ++J) {
4449 // Some intrinsics use a scalar type for certain arguments.
4450 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, J, /*TTI=*/nullptr)) {
4451 Lane[J] = Operands[J];
4452 continue;
4453 }
4454
4455 Constant *Agg = Operands[J]->getAggregateElement(I);
4456 if (!Agg)
4457 return nullptr;
4458
4459 Lane[J] = Agg;
4460 }
4461
4462 // Use the regular scalar folding to simplify this column.
4463 Constant *Folded =
4464 ConstantFoldScalarCall(Name, IntrinsicID, Ty, Lane, TLI, Call);
4465 if (!Folded)
4466 return nullptr;
4467 Result[I] = Folded;
4468 }
4469
4470 return ConstantVector::get(Result);
4471}
4472
4473static Constant *ConstantFoldScalableVectorCall(
4474 StringRef Name, Intrinsic::ID IntrinsicID, ScalableVectorType *SVTy,
4475 ArrayRef<Constant *> Operands, const DataLayout &DL,
4476 const TargetLibraryInfo *TLI, const CallBase *Call) {
4477 switch (IntrinsicID) {
4478 case Intrinsic::aarch64_sve_convert_from_svbool: {
4479 Constant *Src = Operands[0];
4480 if (!Src->isNullValue())
4481 break;
4482
4483 return ConstantInt::getFalse(SVTy);
4484 }
4485 case Intrinsic::get_active_lane_mask: {
4486 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4487 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4488 if (Op0 && Op1 && Op0->getValue().uge(Op1->getValue()))
4489 return ConstantVector::getNullValue(SVTy);
4490 break;
4491 }
4492 case Intrinsic::vector_interleave2:
4493 case Intrinsic::vector_interleave3:
4494 case Intrinsic::vector_interleave4:
4495 case Intrinsic::vector_interleave5:
4496 case Intrinsic::vector_interleave6:
4497 case Intrinsic::vector_interleave7:
4498 case Intrinsic::vector_interleave8: {
4499 Constant *SplatVal = Operands[0]->getSplatValue();
4500 if (!SplatVal)
4501 return nullptr;
4502
4503 if (!llvm::all_equal(Operands))
4504 return nullptr;
4505
4506 return ConstantVector::getSplat(SVTy->getElementCount(), SplatVal);
4507 }
4508 default:
4509 break;
4510 }
4511
4512 // If trivially vectorizable, try folding it via the scalar call if all
4513 // operands are splats.
4514
4515 // TODO: ConstantFoldFixedVectorCall should probably check this too?
4516 if (!isTriviallyVectorizable(IntrinsicID))
4517 return nullptr;
4518
4520 for (auto [I, Op] : enumerate(Operands)) {
4521 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, I, /*TTI=*/nullptr)) {
4522 SplatOps.push_back(Op);
4523 continue;
4524 }
4525 Constant *Splat = Op->getSplatValue();
4526 if (!Splat)
4527 return nullptr;
4528 SplatOps.push_back(Splat);
4529 }
4530 Constant *Folded = ConstantFoldScalarCall(
4531 Name, IntrinsicID, SVTy->getElementType(), SplatOps, TLI, Call);
4532 if (!Folded)
4533 return nullptr;
4534 return ConstantVector::getSplat(SVTy->getElementCount(), Folded);
4535}
4536
4537static std::pair<Constant *, Constant *>
4538ConstantFoldScalarFrexpCall(Constant *Op, Type *IntTy) {
4539 if (isa<PoisonValue>(Op))
4540 return {Op, PoisonValue::get(IntTy)};
4541
4542 auto *ConstFP = dyn_cast<ConstantFP>(Op);
4543 if (!ConstFP)
4544 return {};
4545
4546 const APFloat &U = ConstFP->getValueAPF();
4547 int FrexpExp;
4548 APFloat FrexpMant = frexp(U, FrexpExp, APFloat::rmNearestTiesToEven);
4549 Constant *Result0 = ConstantFP::get(ConstFP->getType(), FrexpMant);
4550
4551 // The exponent is an "unspecified value" for inf/nan. We use zero to avoid
4552 // using undef.
4553 Constant *Result1 = FrexpMant.isFinite()
4554 ? ConstantInt::getSigned(IntTy, FrexpExp)
4555 : ConstantInt::getNullValue(IntTy);
4556 return {Result0, Result1};
4557}
4558
4559/// Handle intrinsics that return tuples, which may be tuples of vectors.
4560static Constant *
4561ConstantFoldStructCall(StringRef Name, Intrinsic::ID IntrinsicID,
4562 StructType *StTy, ArrayRef<Constant *> Operands,
4563 const DataLayout &DL, const TargetLibraryInfo *TLI,
4564 const CallBase *Call) {
4565
4566 switch (IntrinsicID) {
4567 case Intrinsic::frexp: {
4568 Type *Ty0 = StTy->getContainedType(0);
4569 Type *Ty1 = StTy->getContainedType(1)->getScalarType();
4570
4571 if (auto *FVTy0 = dyn_cast<FixedVectorType>(Ty0)) {
4572 SmallVector<Constant *, 4> Results0(FVTy0->getNumElements());
4573 SmallVector<Constant *, 4> Results1(FVTy0->getNumElements());
4574
4575 for (unsigned I = 0, E = FVTy0->getNumElements(); I != E; ++I) {
4576 Constant *Lane = Operands[0]->getAggregateElement(I);
4577 std::tie(Results0[I], Results1[I]) =
4578 ConstantFoldScalarFrexpCall(Lane, Ty1);
4579 if (!Results0[I])
4580 return nullptr;
4581 }
4582
4583 return ConstantStruct::get(StTy, ConstantVector::get(Results0),
4584 ConstantVector::get(Results1));
4585 }
4586
4587 auto [Result0, Result1] = ConstantFoldScalarFrexpCall(Operands[0], Ty1);
4588 if (!Result0)
4589 return nullptr;
4590 return ConstantStruct::get(StTy, Result0, Result1);
4591 }
4592 case Intrinsic::sincos: {
4593 Type *Ty = StTy->getContainedType(0);
4594 Type *TyScalar = Ty->getScalarType();
4595
4596 auto ConstantFoldScalarSincosCall =
4597 [&](Constant *Op) -> std::pair<Constant *, Constant *> {
4598 Constant *SinResult =
4599 ConstantFoldScalarCall(Name, Intrinsic::sin, TyScalar, Op, TLI, Call);
4600 Constant *CosResult =
4601 ConstantFoldScalarCall(Name, Intrinsic::cos, TyScalar, Op, TLI, Call);
4602 return std::make_pair(SinResult, CosResult);
4603 };
4604
4605 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty)) {
4606 SmallVector<Constant *> SinResults(FVTy->getNumElements());
4607 SmallVector<Constant *> CosResults(FVTy->getNumElements());
4608
4609 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4610 Constant *Lane = Operands[0]->getAggregateElement(I);
4611 std::tie(SinResults[I], CosResults[I]) =
4612 ConstantFoldScalarSincosCall(Lane);
4613 if (!SinResults[I] || !CosResults[I])
4614 return nullptr;
4615 }
4616
4617 return ConstantStruct::get(StTy, ConstantVector::get(SinResults),
4618 ConstantVector::get(CosResults));
4619 }
4620
4621 auto [SinResult, CosResult] = ConstantFoldScalarSincosCall(Operands[0]);
4622 if (!SinResult || !CosResult)
4623 return nullptr;
4624 return ConstantStruct::get(StTy, SinResult, CosResult);
4625 }
4626 case Intrinsic::vector_deinterleave2:
4627 case Intrinsic::vector_deinterleave3:
4628 case Intrinsic::vector_deinterleave4:
4629 case Intrinsic::vector_deinterleave5:
4630 case Intrinsic::vector_deinterleave6:
4631 case Intrinsic::vector_deinterleave7:
4632 case Intrinsic::vector_deinterleave8: {
4633 unsigned NumResults = StTy->getNumElements();
4634 auto *Vec = Operands[0];
4635 auto *VecTy = cast<VectorType>(Vec->getType());
4636
4637 ElementCount ResultEC =
4638 VecTy->getElementCount().divideCoefficientBy(NumResults);
4639
4640 if (auto *EltC = Vec->getSplatValue()) {
4641 auto *ResultVec = ConstantVector::getSplat(ResultEC, EltC);
4642 SmallVector<Constant *, 8> Results(NumResults, ResultVec);
4643 return ConstantStruct::get(StTy, Results);
4644 }
4645
4646 if (!ResultEC.isFixed())
4647 return nullptr;
4648
4649 unsigned NumElements = ResultEC.getFixedValue();
4651 SmallVector<Constant *> Elements(NumElements);
4652 for (unsigned I = 0; I != NumResults; ++I) {
4653 for (unsigned J = 0; J != NumElements; ++J) {
4654 Constant *Elt = Vec->getAggregateElement(J * NumResults + I);
4655 if (!Elt)
4656 return nullptr;
4657 Elements[J] = Elt;
4658 }
4659 Results[I] = ConstantVector::get(Elements);
4660 }
4661 return ConstantStruct::get(StTy, Results);
4662 }
4663 default:
4664 // TODO: Constant folding of vector intrinsics that fall through here does
4665 // not work (e.g. overflow intrinsics)
4666 return ConstantFoldScalarCall(Name, IntrinsicID, StTy, Operands, TLI, Call);
4667 }
4668
4669 return nullptr;
4670}
4671
4672} // end anonymous namespace
4673
4675 Constant *RHS, Type *Ty,
4678 // Ensure we check flags like StrictFP that might prevent this from getting
4679 // folded before generating a result.
4680 if (Call && !canConstantFoldCallTo(Call, Call->getCalledFunction()))
4681 return nullptr;
4682 return ConstantFoldIntrinsicCall2(ID, Ty, {LHS, RHS}, Call);
4683}
4684
4686 ArrayRef<Constant *> Operands,
4687 const TargetLibraryInfo *TLI,
4688 bool AllowNonDeterministic) {
4689 if (Call->isNoBuiltin())
4690 return nullptr;
4691 if (!F->hasName())
4692 return nullptr;
4693
4694 // If this is not an intrinsic and not recognized as a library call, bail out.
4695 Intrinsic::ID IID = F->getIntrinsicID();
4696 if (IID == Intrinsic::not_intrinsic) {
4697 if (!TLI)
4698 return nullptr;
4699 LibFunc LibF;
4700 if (!TLI->getLibFunc(*F, LibF))
4701 return nullptr;
4702 }
4703
4704 // Conservatively assume that floating-point libcalls may be
4705 // non-deterministic.
4706 Type *Ty = F->getReturnType();
4707 if (!AllowNonDeterministic && Ty->isFPOrFPVectorTy())
4708 return nullptr;
4709
4710 StringRef Name = F->getName();
4711 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty))
4712 return ConstantFoldFixedVectorCall(
4713 Name, IID, FVTy, Operands, F->getDataLayout(), TLI, Call);
4714
4715 if (auto *SVTy = dyn_cast<ScalableVectorType>(Ty))
4716 return ConstantFoldScalableVectorCall(
4717 Name, IID, SVTy, Operands, F->getDataLayout(), TLI, Call);
4718
4719 if (auto *StTy = dyn_cast<StructType>(Ty))
4720 return ConstantFoldStructCall(Name, IID, StTy, Operands,
4721 F->getDataLayout(), TLI, Call);
4722
4723 // TODO: If this is a library function, we already discovered that above,
4724 // so we should pass the LibFunc, not the name (and it might be better
4725 // still to separate intrinsic handling from libcalls).
4726 return ConstantFoldScalarCall(Name, IID, Ty, Operands, TLI, Call);
4727}
4728
4730 const TargetLibraryInfo *TLI) {
4731 // FIXME: Refactor this code; this duplicates logic in LibCallsShrinkWrap
4732 // (and to some extent ConstantFoldScalarCall).
4733 if (Call->isNoBuiltin() || Call->isStrictFP())
4734 return false;
4735 Function *F = Call->getCalledFunction();
4736 if (!F)
4737 return false;
4738
4739 LibFunc Func;
4740 if (!TLI || !TLI->getLibFunc(*F, Func))
4741 return false;
4742
4743 if (Call->arg_size() == 1) {
4744 if (ConstantFP *OpC = dyn_cast<ConstantFP>(Call->getArgOperand(0))) {
4745 const APFloat &Op = OpC->getValueAPF();
4746 switch (Func) {
4747 case LibFunc_logl:
4748 case LibFunc_log:
4749 case LibFunc_logf:
4750 case LibFunc_log2l:
4751 case LibFunc_log2:
4752 case LibFunc_log2f:
4753 case LibFunc_log10l:
4754 case LibFunc_log10:
4755 case LibFunc_log10f:
4756 return Op.isNaN() || (!Op.isZero() && !Op.isNegative());
4757
4758 case LibFunc_ilogb:
4759 return !Op.isNaN() && !Op.isZero() && !Op.isInfinity();
4760
4761 case LibFunc_expl:
4762 case LibFunc_exp:
4763 case LibFunc_expf:
4764 // FIXME: These boundaries are slightly conservative.
4765 if (OpC->getType()->isDoubleTy())
4766 return !(Op < APFloat(-745.0) || Op > APFloat(709.0));
4767 if (OpC->getType()->isFloatTy())
4768 return !(Op < APFloat(-103.0f) || Op > APFloat(88.0f));
4769 break;
4770
4771 case LibFunc_exp2l:
4772 case LibFunc_exp2:
4773 case LibFunc_exp2f:
4774 // FIXME: These boundaries are slightly conservative.
4775 if (OpC->getType()->isDoubleTy())
4776 return !(Op < APFloat(-1074.0) || Op > APFloat(1023.0));
4777 if (OpC->getType()->isFloatTy())
4778 return !(Op < APFloat(-149.0f) || Op > APFloat(127.0f));
4779 break;
4780
4781 case LibFunc_sinl:
4782 case LibFunc_sin:
4783 case LibFunc_sinf:
4784 case LibFunc_cosl:
4785 case LibFunc_cos:
4786 case LibFunc_cosf:
4787 return !Op.isInfinity();
4788
4789 case LibFunc_tanl:
4790 case LibFunc_tan:
4791 case LibFunc_tanf: {
4792 // FIXME: Stop using the host math library.
4793 // FIXME: The computation isn't done in the right precision.
4794 Type *Ty = OpC->getType();
4795 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy())
4796 return ConstantFoldFP(tan, OpC->getValueAPF(), Ty) != nullptr;
4797 break;
4798 }
4799
4800 case LibFunc_atan:
4801 case LibFunc_atanf:
4802 case LibFunc_atanl:
4803 // Per POSIX, this MAY fail if Op is denormal. We choose not failing.
4804 return true;
4805
4806 case LibFunc_asinl:
4807 case LibFunc_asin:
4808 case LibFunc_asinf:
4809 case LibFunc_acosl:
4810 case LibFunc_acos:
4811 case LibFunc_acosf:
4812 return !(Op < APFloat::getOne(Op.getSemantics(), true) ||
4813 Op > APFloat::getOne(Op.getSemantics()));
4814
4815 case LibFunc_sinh:
4816 case LibFunc_cosh:
4817 case LibFunc_sinhf:
4818 case LibFunc_coshf:
4819 case LibFunc_sinhl:
4820 case LibFunc_coshl:
4821 // FIXME: These boundaries are slightly conservative.
4822 if (OpC->getType()->isDoubleTy())
4823 return !(Op < APFloat(-710.0) || Op > APFloat(710.0));
4824 if (OpC->getType()->isFloatTy())
4825 return !(Op < APFloat(-89.0f) || Op > APFloat(89.0f));
4826 break;
4827
4828 case LibFunc_sqrtl:
4829 case LibFunc_sqrt:
4830 case LibFunc_sqrtf:
4831 return Op.isNaN() || Op.isZero() || !Op.isNegative();
4832
4833 // FIXME: Add more functions: sqrt_finite, atanh, expm1, log1p,
4834 // maybe others?
4835 default:
4836 break;
4837 }
4838 }
4839 }
4840
4841 if (Call->arg_size() == 2) {
4842 ConstantFP *Op0C = dyn_cast<ConstantFP>(Call->getArgOperand(0));
4843 ConstantFP *Op1C = dyn_cast<ConstantFP>(Call->getArgOperand(1));
4844 if (Op0C && Op1C) {
4845 const APFloat &Op0 = Op0C->getValueAPF();
4846 const APFloat &Op1 = Op1C->getValueAPF();
4847
4848 switch (Func) {
4849 case LibFunc_powl:
4850 case LibFunc_pow:
4851 case LibFunc_powf: {
4852 // FIXME: Stop using the host math library.
4853 // FIXME: The computation isn't done in the right precision.
4854 Type *Ty = Op0C->getType();
4855 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy()) {
4856 if (Ty == Op1C->getType())
4857 return ConstantFoldBinaryFP(pow, Op0, Op1, Ty) != nullptr;
4858 }
4859 break;
4860 }
4861
4862 case LibFunc_fmodl:
4863 case LibFunc_fmod:
4864 case LibFunc_fmodf:
4865 case LibFunc_remainderl:
4866 case LibFunc_remainder:
4867 case LibFunc_remainderf:
4868 return Op0.isNaN() || Op1.isNaN() ||
4869 (!Op0.isInfinity() && !Op1.isZero());
4870
4871 case LibFunc_atan2:
4872 case LibFunc_atan2f:
4873 case LibFunc_atan2l:
4874 // Although IEEE-754 says atan2(+/-0.0, +/-0.0) are well-defined, and
4875 // GLIBC and MSVC do not appear to raise an error on those, we
4876 // cannot rely on that behavior. POSIX and C11 say that a domain error
4877 // may occur, so allow for that possibility.
4878 return !Op0.isZero() || !Op1.isZero();
4879
4880 case LibFunc_nextafter:
4881 case LibFunc_nextafterf:
4882 case LibFunc_nextafterl:
4883 case LibFunc_nexttoward:
4884 case LibFunc_nexttowardf:
4885 case LibFunc_nexttowardl: {
4886 return ConstantFoldNextToward(Op0, Op1, F->getReturnType()) != nullptr;
4887 }
4888 default:
4889 break;
4890 }
4891 }
4892 }
4893
4894 return false;
4895}
4896
4898 unsigned CastOp, const DataLayout &DL,
4899 PreservedCastFlags *Flags) {
4900 switch (CastOp) {
4901 case Instruction::BitCast:
4902 // Bitcast is always lossless.
4903 return ConstantFoldCastOperand(Instruction::BitCast, C, InvCastTo, DL);
4904 case Instruction::Trunc: {
4905 auto *ZExtC = ConstantFoldCastOperand(Instruction::ZExt, C, InvCastTo, DL);
4906 if (Flags) {
4907 // Truncation back on ZExt value is always NUW.
4908 Flags->NUW = true;
4909 // Test positivity of C.
4910 auto *SExtC =
4911 ConstantFoldCastOperand(Instruction::SExt, C, InvCastTo, DL);
4912 Flags->NSW = ZExtC == SExtC;
4913 }
4914 return ZExtC;
4915 }
4916 case Instruction::SExt:
4917 case Instruction::ZExt: {
4918 auto *InvC = ConstantExpr::getTrunc(C, InvCastTo);
4919 auto *CastInvC = ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4920 // Must satisfy CastOp(InvC) == C.
4921 if (!CastInvC || CastInvC != C)
4922 return nullptr;
4923 if (Flags && CastOp == Instruction::ZExt) {
4924 auto *SExtInvC =
4925 ConstantFoldCastOperand(Instruction::SExt, InvC, C->getType(), DL);
4926 // Test positivity of InvC.
4927 Flags->NNeg = CastInvC == SExtInvC;
4928 }
4929 return InvC;
4930 }
4931 case Instruction::FPExt: {
4932 Constant *InvC =
4933 ConstantFoldCastOperand(Instruction::FPTrunc, C, InvCastTo, DL);
4934 if (InvC) {
4935 Constant *CastInvC =
4936 ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4937 if (CastInvC == C)
4938 return InvC;
4939 }
4940 return nullptr;
4941 }
4942 default:
4943 return nullptr;
4944 }
4945}
4946
4948 const DataLayout &DL,
4949 PreservedCastFlags *Flags) {
4950 return getLosslessInvCast(C, DestTy, Instruction::ZExt, DL, Flags);
4951}
4952
4954 const DataLayout &DL,
4955 PreservedCastFlags *Flags) {
4956 return getLosslessInvCast(C, DestTy, Instruction::SExt, DL, Flags);
4957}
4958
4959void TargetFolder::anchor() {}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
#define X(NUM, ENUM, NAME)
Definition ELF.h:851
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static Constant * FoldBitCast(Constant *V, Type *DestTy)
Constant * getConstantAtOffset(Constant *Base, APInt Offset, const DataLayout &DL)
If this Offset points exactly to the start of an aggregate element, return that element,...
static cl::opt< bool > DisableFPCallFolding("disable-fp-call-folding", cl::desc("Disable constant-folding of FP intrinsics and libcalls."), cl::init(false), cl::Hidden)
static Constant * flushDenormalConstant(Type *Ty, const APFloat &APF, DenormalMode::DenormalModeKind Mode)
static Constant * flushDenormalConstantFP(ConstantFP *CFP, const Instruction *Inst, bool IsOutput)
static DenormalMode getInstrDenormalMode(const Instruction *CtxI, Type *Ty)
Return the denormal mode that can be assumed when executing a floating point operation at CtxI.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
This file defines the DenseMap class.
Hexagon Common GEP
amode Optimize addressing mode
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
static bool InRange(int64_t Value, unsigned short Shift, int LBound, int HBound)
This file contains the definitions of the enumerations and flags associated with NVVM Intrinsics,...
if(PassOpts->AAPipeline)
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
This file contains some templates that are useful if you are working with the STL at all.
This file implements the SmallBitVector class.
This file defines the SmallVector class.
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39
The Input class is used to parse a yaml document into in-memory structs and vectors.
cmpResult
IEEE-754R 5.11: Floating Point Comparison Relations.
Definition APFloat.h:334
static constexpr roundingMode rmTowardZero
Definition APFloat.h:348
llvm::RoundingMode roundingMode
IEEE-754R 4.3: Rounding-direction attributes.
Definition APFloat.h:342
static const fltSemantics & IEEEdouble()
Definition APFloat.h:297
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:347
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:344
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:346
static const fltSemantics & IEEEhalf()
Definition APFloat.h:294
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:349
opStatus
IEEE-754R 7: Default exception handling.
Definition APFloat.h:360
static APFloat getQNaN(const fltSemantics &Sem, bool Negative=false, const APInt *payload=nullptr)
Factory for QNaN values.
Definition APFloat.h:1175
opStatus divide(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1263
void copySign(const APFloat &RHS)
Definition APFloat.h:1357
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:5890
opStatus subtract(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1245
bool isNegative() const
Definition APFloat.h:1516
LLVM_ABI double convertToDouble() const
Converts this APFloat to host double value.
Definition APFloat.cpp:5949
bool isPosInfinity() const
Definition APFloat.h:1529
bool isNormal() const
Definition APFloat.h:1520
bool isDenormal() const
Definition APFloat.h:1517
opStatus add(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1236
const fltSemantics & getSemantics() const
Definition APFloat.h:1524
bool isNonZero() const
Definition APFloat.h:1525
bool isFinite() const
Definition APFloat.h:1521
bool isNaN() const
Definition APFloat.h:1514
static APFloat getOne(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative One.
Definition APFloat.h:1143
opStatus multiply(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1254
LLVM_ABI float convertToFloat() const
Converts this APFloat to host float value.
Definition APFloat.cpp:5977
bool isSignaling() const
Definition APFloat.h:1518
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
Definition APFloat.h:1290
bool isZero() const
Definition APFloat.h:1512
opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.h:1387
opStatus mod(const APFloat &RHS)
Definition APFloat.h:1281
bool isNegInfinity() const
Definition APFloat.h:1530
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1303
void changeSign()
Definition APFloat.h:1352
static APFloat getZero(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Zero.
Definition APFloat.h:1134
bool isInfinity() const
Definition APFloat.h:1513
Class for arbitrary precision integers.
Definition APInt.h:78
LLVM_ABI APInt umul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2022
LLVM_ABI APInt usub_sat(const APInt &RHS) const
Definition APInt.cpp:2106
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition APInt.h:424
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1563
LLVM_ABI uint64_t extractBitsAsZExtValue(unsigned numBits, unsigned bitPosition) const
Definition APInt.cpp:520
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1075
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:207
APInt abs() const
Get the absolute value.
Definition APInt.h:1818
LLVM_ABI APInt sadd_sat(const APInt &RHS) const
Definition APInt.cpp:2077
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1208
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1999
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1189
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
Definition APInt.cpp:1708
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1511
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1118
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1979
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1986
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1662
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition APInt.h:1621
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:220
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition APInt.cpp:1083
LLVM_ABI APInt uadd_sat(const APInt &RHS) const
Definition APInt.cpp:2087
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition APInt.h:834
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2011
LLVM_ABI APInt sext(unsigned width) const
Sign extend to a new width.
Definition APInt.cpp:1027
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
bool slt(const APInt &RHS) const
Signed less than comparison.
Definition APInt.h:1137
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201
LLVM_ABI APInt extractBits(unsigned numBits, unsigned bitPosition) const
Return an APInt with the extracted bits [bitPosition,bitPosition+numBits).
Definition APInt.cpp:482
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1992
bool isOne() const
Determine if this is a value of 1.
Definition APInt.h:390
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:858
LLVM_ABI APInt ssub_sat(const APInt &RHS) const
Definition APInt.cpp:2096
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
size_t size() const
size - Get the array size.
Definition ArrayRef.h:142
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
static LLVM_ABI unsigned isEliminableCastPair(Instruction::CastOps firstOpcode, Instruction::CastOps secondOpcode, Type *SrcTy, Type *MidTy, Type *DstTy, const DataLayout *DL)
Determine how a pair of casts can be eliminated, if they can be at all.
static LLVM_ABI bool castIsValid(Instruction::CastOps op, Type *SrcTy, Type *DstTy)
This method can be used to determine if a cast from SrcTy to DstTy using Opcode op is valid or not.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676
bool isSigned() const
Definition InstrTypes.h:930
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:827
static bool isFPPredicate(Predicate P)
Definition InstrTypes.h:770
static Constant * get(LLVMContext &Context, ArrayRef< ElementTy > Elts)
get() constructor - Return a constant with array type with an element count and element type matching...
Definition Constants.h:859
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getExtractElement(Constant *Vec, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI bool isDesirableCastOp(unsigned Opcode)
Whether creating a constant expression for this cast is desirable.
static LLVM_ABI Constant * getCast(unsigned ops, Constant *C, Type *Ty, bool OnlyIfReduced=false)
Convenience function for getting a Cast operation.
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
static Constant * getPtrAdd(Constant *Ptr, Constant *Offset, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReduced=nullptr)
Create a getelementptr i8, ptr, offset constant expression.
Definition Constants.h:1472
static LLVM_ABI Constant * getInsertElement(Constant *Vec, Constant *Elt, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI Constant * getShuffleVector(Constant *V1, Constant *V2, ArrayRef< int > Mask, Type *OnlyIfReducedTy=nullptr)
static bool isSupportedGetElementPtr(const Type *SrcElemTy)
Whether creating a constant expression for this getelementptr type is supported.
Definition Constants.h:1573
static LLVM_ABI Constant * get(unsigned Opcode, Constant *C1, Constant *C2, unsigned Flags=0, Type *OnlyIfReducedTy=nullptr)
get - Return a binary or shift operator constant expression, folding if possible.
static LLVM_ABI bool isDesirableBinOp(unsigned Opcode)
Whether creating a constant expression for this binary operator is desirable.
static Constant * getGetElementPtr(Type *Ty, Constant *C, ArrayRef< Constant * > IdxList, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReducedTy=nullptr)
Getelementptr form.
Definition Constants.h:1445
static LLVM_ABI Constant * getBitCast(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getTrunc(Constant *C, Type *Ty, bool OnlyIfReduced=false)
ConstantFP - Floating Point Values [float, double].
Definition Constants.h:420
const APFloat & getValueAPF() const
Definition Constants.h:463
static LLVM_ABI Constant * getInfinity(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getNaN(Type *Ty, bool Negative=false, uint64_t Payload=0)
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=false)
Return a ConstantInt with the specified value for the specified type.
Definition Constants.h:135
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
Definition Constants.h:174
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
static LLVM_ABI Constant * get(ArrayRef< Constant * > V)
This is an important base class in LLVM.
Definition Constant.h:43
LLVM_ABI Constant * getSplatValue(bool AllowPoison=false) const
If all elements of the vector constant have the same value, return that value.
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI Constant * getAggregateElement(unsigned Elt) const
For aggregates (struct/array/vector) return the constant that corresponds to the specified element if...
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition Constants.cpp:74
Constrained floating point compare intrinsics.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI std::optional< RoundingMode > getRoundingMode() const
Wrapper for a function that represents a value that functionally represents the original function.
Definition Constants.h:1118
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:178
iterator end()
Definition DenseMap.h:81
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:241
static LLVM_ABI bool compare(const APFloat &LHS, const APFloat &RHS, FCmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
This provides a helper for copying FMF from an instruction or setting specified flags.
Definition IRBuilder.h:93
Class to represent fixed width SIMD vectors.
unsigned getNumElements() const
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:873
DenormalMode getDenormalMode(const fltSemantics &FPType) const
Returns the denormal handling type for the default rounding mode of the function.
Definition Function.cpp:804
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags inBounds()
GEPNoWrapFlags withoutNoUnsignedSignedWrap() const
static GEPNoWrapFlags noUnsignedWrap()
bool hasNoUnsignedSignedWrap() const
bool isInBounds() const
static LLVM_ABI Type * getIndexedType(Type *Ty, ArrayRef< Value * > IdxList)
Returns the result type of a getelementptr with the given source element type and indexes.
PointerType * getType() const
Global values are always pointers.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this global belongs to.
Definition Globals.cpp:141
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
bool isEquality() const
Return true if this predicate is either EQ or NE.
bool isCast() const
bool isBinaryOp() const
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
bool isUnaryOp() const
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:354
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
static APInt getSaturationPoint(Intrinsic::ID ID, unsigned numBits)
Min/max intrinsics are monotonic, they operate on a fixed-bitwidth values, so there is a certain thre...
static ICmpInst::Predicate getPredicate(Intrinsic::ID ID)
Returns the comparison predicate underlying the intrinsic.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Class to represent scalable SIMD vectors.
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
SmallBitVector & set()
iterator_range< const_set_bits_iterator > set_bits() const
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
Used to lazily calculate structure layout information for a target machine, based on the DataLayout s...
Definition DataLayout.h:736
LLVM_ABI unsigned getElementContainingOffset(uint64_t FixedOffset) const
Given a valid byte offset into the structure, returns the structure index that contains it.
TypeSize getElementOffset(unsigned Idx) const
Definition DataLayout.h:767
Class to represent struct types.
unsigned getNumElements() const
Random access to the elements.
Provides information about what library functions are available for the current target.
bool has(LibFunc F) const
Tests whether a library function is available.
bool getLibFunc(StringRef funcName, LibFunc &F) const
Searches for a particular function name.
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI IntegerType * getInt64Ty(LLVMContext &C)
Definition Type.cpp:314
bool isByteTy() const
True if this is an instance of ByteType.
Definition Type.h:242
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:290
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:313
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:284
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
Definition Type.h:57
@ FloatTyID
32-bit floating point type
Definition Type.h:59
@ DoubleTyID
64-bit floating point type
Definition Type.h:60
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:370
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:201
static LLVM_ABI IntegerType * getInt16Ty(LLVMContext &C)
Definition Type.cpp:312
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:328
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:130
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:236
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
Definition Type.cpp:310
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition Type.h:186
bool isPtrOrPtrVectorTy() const
Return true if this is a pointer type or a vector of pointer types.
Definition Type.h:287
bool isX86_AMXTy() const
Return true if this is X86 AMX.
Definition Type.h:202
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:317
Type * getContainedType(unsigned i) const
This method is used to implement the type iterator (defined at the end of the file).
Definition Type.h:399
LLVM_ABI const fltSemantics & getFltSemantics() const
Definition Type.cpp:110
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
A Use represents the edge between a Value definition and its users.
Definition Use.h:35
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
LLVM_ABI uint64_t getPointerDereferenceableBytes(const DataLayout &DL, bool &CanBeNull, bool &CanBeFreed) const
Returns the number of bytes known to be dereferenceable for the pointer value.
Definition Value.cpp:890
Base class of all SIMD vector types.
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Type * getElementType() const
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition TypeSize.h:171
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
Definition TypeSize.h:252
static constexpr bool isKnownGE(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:237
const ParentTy * getParent() const
Definition ilist_node.h:34
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
const APInt & smin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be signed.
Definition APInt.h:2277
const APInt & smax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be signed.
Definition APInt.h:2282
const APInt & umin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be unsigned.
Definition APInt.h:2287
const APInt & umax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be unsigned.
Definition APInt.h:2292
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:48
initializer< Ty > init(const Ty &Val)
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:431
static constexpr cmpResult cmpEqual
Definition APFloat.h:439
@ ebStrict
This corresponds to "fpexcept.strict".
Definition FPEnv.h:42
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
constexpr double pi
APFloat::roundingMode GetFMARoundingMode(Intrinsic::ID IntrinsicID)
DenormalMode GetNVVMDenormMode(bool ShouldFTZ)
bool FPToIntegerIntrinsicNaNZero(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFDivRoundingMode(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicResultIsSigned(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFPToIntegerRoundingMode(Intrinsic::ID IntrinsicID)
bool RCPShouldFTZ(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FDivShouldFTZ(Intrinsic::ID IntrinsicID)
bool FAddShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxIsXorSignAbs(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFMulRoundingMode(Intrinsic::ID IntrinsicID)
bool UnaryMathIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFAddRoundingMode(Intrinsic::ID IntrinsicID)
bool FMAShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMulShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetRCPRoundingMode(Intrinsic::ID IntrinsicID)
bool FMinFMaxPropagatesNaNs(Intrinsic::ID IntrinsicID)
NodeAddr< FuncNode * > Func
Definition RDFGraph.h:393
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:316
@ Offset
Definition DWP.cpp:532
LLVM_ABI Constant * ConstantFoldBinaryIntrinsic(Intrinsic::ID ID, Constant *LHS, Constant *RHS, Type *Ty, Instruction *FMFSource)
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1739
LLVM_ABI Constant * ConstantFoldLoadThroughBitcast(Constant *C, Type *DestTy, const DataLayout &DL)
ConstantFoldLoadThroughBitcast - try to cast constant to destination type returning null if unsuccess...
static double log2(double V)
LLVM_ABI Constant * ConstantFoldSelectInstruction(Constant *Cond, Constant *V1, Constant *V2)
Attempt to constant fold a select instruction with the specified operands.
LLVM_ABI Constant * ConstantFoldFPInstOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL, const Instruction *I, bool AllowNonDeterministic=true)
Attempt to constant fold a floating point binary operation with the specified operands,...
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2554
LLVM_ABI bool canConstantFoldCallTo(const CallBase *Call, const Function *F)
canConstantFoldCallTo - Return true if its even possible to fold a call to the specified function.
unsigned getPointerAddressSpace(const Type *T)
Definition SPIRVUtils.h:378
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
LLVM_ABI Constant * ConstantFoldInstruction(const Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
APFloat abs(APFloat X)
Returns the absolute value of the argument.
Definition APFloat.h:1630
LLVM_ABI Constant * ConstantFoldCompareInstruction(CmpInst::Predicate Predicate, Constant *C1, Constant *C2)
LLVM_ABI Constant * ConstantFoldUnaryInstruction(unsigned Opcode, Constant *V)
LLVM_ABI bool IsConstantOffsetFromGlobal(Constant *C, GlobalValue *&GV, APInt &Offset, const DataLayout &DL, DSOLocalEquivalent **DSOEquiv=nullptr)
If this constant is a constant offset from a global, return the global and the constant.
LLVM_ABI bool isMathLibCallNoop(const CallBase *Call, const TargetLibraryInfo *TLI)
Check whether the given call has no side-effects.
LLVM_ABI Constant * ReadByteArrayFromGlobal(const GlobalVariable *GV, uint64_t Offset)
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition APFloat.h:1710
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1601
bool isa_and_nonnull(const Y &Val)
Definition Casting.h:676
LLVM_ABI Constant * ConstantFoldCall(const CallBase *Call, Function *F, ArrayRef< Constant * > Operands, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldCall - Attempt to constant fold a call to the specified function with the specified argum...
APFloat frexp(const APFloat &X, int &Exp, APFloat::roundingMode RM)
Equivalent of C standard library function.
Definition APFloat.h:1622
LLVM_ABI Constant * ConstantFoldExtractValueInstruction(Constant *Agg, ArrayRef< unsigned > Idxs)
Attempt to constant fold an extractvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1746
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 maxNum semantics.
Definition APFloat.h:1665
LLVM_ABI Constant * ConstantFoldLoadFromUniformValue(Constant *C, Type *Ty, const DataLayout &DL)
If C is a uniform value where all bits are the same (either all zero, all ones, all undef or all pois...
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
LLVM_ABI Constant * FlushFPConstant(Constant *Operand, const Instruction *I, bool IsOutput)
Attempt to flush float point constant according to denormal mode set in the instruction's parent func...
LLVM_ABI Constant * getLosslessUnsignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_READONLY APFloat minimumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimumNumber semantics.
Definition APFloat.h:1696
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1610
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI Constant * getLosslessSignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
LLVM_ABI bool intrinsicPropagatesPoison(Intrinsic::ID IID)
Return whether this intrinsic propagates poison for all operands.
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 minNum semantics.
Definition APFloat.h:1646
@ Sub
Subtraction of integers.
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
FunctionAddr VTableAddr Next
Definition InstrProf.h:141
DWARFExpression::Operation Op
RoundingMode
Rounding mode.
@ NearestTiesToEven
roundTiesToEven.
@ Dynamic
Denotes mode unknown at compile time.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
constexpr unsigned BitWidth
LLVM_ABI Constant * getLosslessInvCast(Constant *C, Type *InvCastTo, unsigned CastOp, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Try to cast C to InvC losslessly, satisfying CastOp(InvC) equals C, or CastOp(InvC) is a refined valu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list.
Definition STLExtras.h:2166
LLVM_ABI Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
LLVM_ABI Constant * ConstantFoldInsertValueInstruction(Constant *Agg, Constant *Val, ArrayRef< unsigned > Idxs)
Attempt to constant fold an insertvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty, APInt Offset, const DataLayout &DL)
Return the value that a load from C with offset Offset would produce if it is constant and determinab...
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition APFloat.h:1683
LLVM_READONLY APFloat maximumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximumNumber semantics.
Definition APFloat.h:1723
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
LLVM_ABI bool isTriviallyVectorizable(Intrinsic::ID ID)
Identify if the intrinsic is trivially vectorizable.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
Definition Casting.h:866
LLVM_ABI Constant * ConstantFoldBinaryInstruction(unsigned Opcode, Constant *V1, Constant *V2)
Represent subnormal handling kind for floating point instruction inputs and outputs.
DenormalModeKind Input
Denormal treatment kind for floating point instruction inputs in the default floating-point environme...
DenormalModeKind
Represent handled modes for denormal (aka subnormal) modes in the floating point environment.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
@ PositiveZero
Denormals are flushed to positive zero.
@ Dynamic
Denormals have unknown treatment.
@ IEEE
IEEE-754 denormal numbers preserved.
DenormalModeKind Output
Denormal flushing mode for floating point instruction results in the default floating point environme...
static constexpr DenormalMode getDynamic()
static constexpr DenormalMode getIEEE()
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:58