LLVM 23.0.0git
ConstantFolding.cpp
Go to the documentation of this file.
1//===-- ConstantFolding.cpp - Fold instructions into constants ------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines routines for folding instructions into constants.
10//
11// Also, to supplement the basic IR ConstantExpr simplifications,
12// this file defines some additional folding routines that can make use of
13// DataLayout information. These functions cannot go in IR due to library
14// dependency issues.
15//
16//===----------------------------------------------------------------------===//
17
19#include "llvm/ADT/APFloat.h"
20#include "llvm/ADT/APInt.h"
21#include "llvm/ADT/APSInt.h"
22#include "llvm/ADT/ArrayRef.h"
23#include "llvm/ADT/DenseMap.h"
24#include "llvm/ADT/STLExtras.h"
27#include "llvm/ADT/StringRef.h"
32#include "llvm/Config/config.h"
33#include "llvm/IR/Constant.h"
35#include "llvm/IR/Constants.h"
36#include "llvm/IR/DataLayout.h"
38#include "llvm/IR/Function.h"
39#include "llvm/IR/GlobalValue.h"
41#include "llvm/IR/InstrTypes.h"
42#include "llvm/IR/Instruction.h"
45#include "llvm/IR/Intrinsics.h"
46#include "llvm/IR/IntrinsicsAArch64.h"
47#include "llvm/IR/IntrinsicsAMDGPU.h"
48#include "llvm/IR/IntrinsicsARM.h"
49#include "llvm/IR/IntrinsicsNVPTX.h"
50#include "llvm/IR/IntrinsicsWebAssembly.h"
51#include "llvm/IR/IntrinsicsX86.h"
53#include "llvm/IR/Operator.h"
54#include "llvm/IR/Type.h"
55#include "llvm/IR/Value.h"
60#include <cassert>
61#include <cerrno>
62#include <cfenv>
63#include <cmath>
64#include <cstdint>
65
66using namespace llvm;
67
69 "disable-fp-call-folding",
70 cl::desc("Disable constant-folding of FP intrinsics and libcalls."),
71 cl::init(false), cl::Hidden);
72
73namespace {
74
75//===----------------------------------------------------------------------===//
76// Constant Folding internal helper functions
77//===----------------------------------------------------------------------===//
78
79static Constant *foldConstVectorToAPInt(APInt &Result, Type *DestTy,
80 Constant *C, Type *SrcEltTy,
81 unsigned NumSrcElts,
82 const DataLayout &DL) {
83 // Now that we know that the input value is a vector of integers, just shift
84 // and insert them into our result.
85 unsigned BitShift = DL.getTypeSizeInBits(SrcEltTy);
86 for (unsigned i = 0; i != NumSrcElts; ++i) {
87 Constant *Element;
88 if (DL.isLittleEndian())
89 Element = C->getAggregateElement(NumSrcElts - i - 1);
90 else
91 Element = C->getAggregateElement(i);
92
93 if (isa_and_nonnull<UndefValue>(Element)) {
94 Result <<= BitShift;
95 continue;
96 }
97
98 auto *ElementCI = dyn_cast_or_null<ConstantInt>(Element);
99 if (!ElementCI)
100 return ConstantExpr::getBitCast(C, DestTy);
101
102 Result <<= BitShift;
103 Result |= ElementCI->getValue().zext(Result.getBitWidth());
104 }
105
106 return nullptr;
107}
108
109/// Check whether folding this bitcast into a byte vector would mix poison and
110/// non-poison bits in the same output lane. While integer types track poison on
111/// a per-value basis, byte types track it on a per-bit basis. However,
112/// `ConstantByte` cannot represent values with both poison and non-poison bits.
113///
114/// Source elements are grouped by the output lane they map to. Returns true if
115/// any group contains both poison and non-poison elements.
116static bool foldMixesPoisonBits(Constant *C, unsigned NumSrcElt,
117 unsigned NumDstElt) {
118 // If element counts don't divide evenly, bail out if a poison source element
119 // might span multiple destination lanes.
120 if (NumSrcElt % NumDstElt != 0)
121 return C->containsPoisonElement();
122 unsigned Ratio = NumSrcElt / NumDstElt;
123 for (unsigned i = 0; i != NumSrcElt; i += Ratio) {
124 bool HasPoison = false;
125 bool HasNonPoison = false;
126 for (unsigned j = 0; j != Ratio; ++j) {
127 Constant *Src = C->getAggregateElement(i + j);
128 // Conservatively bail out.
129 if (!Src)
130 return true;
131 if (isa<PoisonValue>(Src))
132 HasPoison = true;
133 else
134 HasNonPoison = true;
135 }
136 if (HasPoison && HasNonPoison)
137 return true;
138 }
139 return false;
140}
141
142/// Track which destination lanes of a bitcast are produced from poison bytes.
143/// A destination lane is marked if any source element mapped to it is poison.
144/// Returns false if an aggregate element cannot be inspected. The caller should
145/// bail out of folding.
146static bool computePoisonDstLanes(Constant *C, unsigned NumSrcElt,
147 unsigned NumDstElt,
148 SmallBitVector &PoisonDstElts) {
149 // If element counts don't divide evenly, bail out if a poison source element
150 // might span multiple destination lanes.
151 if ((NumDstElt < NumSrcElt ? NumSrcElt % NumDstElt : NumDstElt % NumSrcElt))
152 return !C->containsPoisonElement();
153 if (NumDstElt < NumSrcElt) {
154 unsigned Ratio = NumSrcElt / NumDstElt;
155 for (unsigned i = 0; i != NumDstElt; ++i) {
156 for (unsigned j = 0; j != Ratio; ++j) {
157 Constant *Src = C->getAggregateElement(i * Ratio + j);
158 if (!Src)
159 return false;
160 if (isa<PoisonValue>(Src)) {
161 PoisonDstElts[i] = true;
162 break;
163 }
164 }
165 }
166 } else {
167 unsigned Ratio = NumDstElt / NumSrcElt;
168 for (unsigned i = 0; i != NumSrcElt; ++i) {
169 Constant *Src = C->getAggregateElement(i);
170 if (!Src)
171 return false;
172 if (isa<PoisonValue>(Src))
173 PoisonDstElts.set(i * Ratio, (i + 1) * Ratio);
174 }
175 }
176 return true;
177}
178
179/// Constant fold bitcast, symbolically evaluating it with DataLayout.
180/// This always returns a non-null constant, but it may be a
181/// ConstantExpr if unfoldable.
182Constant *FoldBitCast(Constant *C, Type *DestTy, const DataLayout &DL) {
183 assert(CastInst::castIsValid(Instruction::BitCast, C, DestTy) &&
184 "Invalid constantexpr bitcast!");
185
186 // Catch the obvious splat cases.
187 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
188 return Res;
189
190 if (auto *VTy = dyn_cast<VectorType>(C->getType())) {
191 // Handle a vector->scalar integer/fp cast.
192 if (isa<IntegerType>(DestTy) || DestTy->isFloatingPointTy()) {
193 unsigned NumSrcElts = cast<FixedVectorType>(VTy)->getNumElements();
194 Type *SrcEltTy = VTy->getElementType();
195
196 // Bitcasting a byte containing any poison bit to an integer or fp type
197 // yields poison.
198 if (SrcEltTy->isByteTy() && C->containsPoisonElement())
199 return PoisonValue::get(DestTy);
200
201 // If the vector is a vector of floating point or bytes, convert it to a
202 // vector of int to simplify things.
203 if (SrcEltTy->isFloatingPointTy() || SrcEltTy->isByteTy()) {
204 unsigned Width = SrcEltTy->getPrimitiveSizeInBits();
205 auto *SrcIVTy = FixedVectorType::get(
206 IntegerType::get(C->getContext(), Width), NumSrcElts);
207 // Ask IR to do the conversion now that #elts line up.
208 C = ConstantExpr::getBitCast(C, SrcIVTy);
209 }
210
211 APInt Result(DL.getTypeSizeInBits(DestTy), 0);
212 if (Constant *CE = foldConstVectorToAPInt(Result, DestTy, C,
213 SrcEltTy, NumSrcElts, DL))
214 return CE;
215
216 if (isa<IntegerType>(DestTy))
217 return ConstantInt::get(DestTy, Result);
218
219 APFloat FP(DestTy->getFltSemantics(), Result);
220 return ConstantFP::get(DestTy->getContext(), FP);
221 }
222 }
223
224 // The code below only handles casts to vectors currently.
225 auto *DestVTy = dyn_cast<VectorType>(DestTy);
226 if (!DestVTy)
227 return ConstantExpr::getBitCast(C, DestTy);
228
229 // If this is a scalar -> vector cast, convert the input into a <1 x scalar>
230 // vector so the code below can handle it uniformly.
231 if (!isa<VectorType>(C->getType()) &&
233 Constant *Ops = C; // don't take the address of C!
234 return FoldBitCast(ConstantVector::get(Ops), DestTy, DL);
235 }
236
237 // Some of what follows may extend to cover scalable vectors but the current
238 // implementation is fixed length specific.
239 if (!isa<FixedVectorType>(C->getType()))
240 return ConstantExpr::getBitCast(C, DestTy);
241
242 // If this is a bitcast from constant vector -> vector, fold it.
245 return ConstantExpr::getBitCast(C, DestTy);
246
247 // If the element types match, IR can fold it.
248 unsigned NumDstElt = cast<FixedVectorType>(DestVTy)->getNumElements();
249 unsigned NumSrcElt = cast<FixedVectorType>(C->getType())->getNumElements();
250 if (NumDstElt == NumSrcElt)
251 return ConstantExpr::getBitCast(C, DestTy);
252
253 Type *SrcEltTy = cast<VectorType>(C->getType())->getElementType();
254 Type *DstEltTy = DestVTy->getElementType();
255
256 // Otherwise, we're changing the number of elements in a vector, which
257 // requires endianness information to do the right thing. For example,
258 // bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
259 // folds to (little endian):
260 // <4 x i32> <i32 0, i32 0, i32 1, i32 0>
261 // and to (big endian):
262 // <4 x i32> <i32 0, i32 0, i32 0, i32 1>
263
264 // First thing is first. We only want to think about integer here, so if
265 // we have something in FP form, recast it as integer.
266 if (DstEltTy->isFloatingPointTy()) {
267 // Fold to an vector of integers with same size as our FP type.
268 unsigned FPWidth = DstEltTy->getPrimitiveSizeInBits();
269 auto *DestIVTy = FixedVectorType::get(
270 IntegerType::get(C->getContext(), FPWidth), NumDstElt);
271 // Recursively handle this integer conversion, if possible.
272 C = FoldBitCast(C, DestIVTy, DL);
273
274 // Finally, IR can handle this now that #elts line up.
275 return ConstantExpr::getBitCast(C, DestTy);
276 }
277
278 // Handle byte destination type by folding through integers.
279 if (DstEltTy->isByteTy()) {
280 // When combining elements into larger byte values, bail out if the fold
281 // mixes poison and non-poison bits in the same destination element. Byte
282 // types track poison per bit, and no constant value can represent that.
283 if (NumDstElt < NumSrcElt && foldMixesPoisonBits(C, NumSrcElt, NumDstElt))
284 return ConstantExpr::getBitCast(C, DestTy);
285
286 // Fold to a vector of integers with same size as the byte type.
287 unsigned ByteWidth = DstEltTy->getPrimitiveSizeInBits();
288 auto *DestIVTy = FixedVectorType::get(
289 IntegerType::get(C->getContext(), ByteWidth), NumDstElt);
290 C = FoldBitCast(C, DestIVTy, DL);
291 return ConstantExpr::getBitCast(C, DestTy);
292 }
293
294 // Okay, we know the destination is integer, if the input is FP, convert
295 // it to integer first.
296 if (SrcEltTy->isFloatingPointTy()) {
297 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
298 auto *SrcIVTy = FixedVectorType::get(
299 IntegerType::get(C->getContext(), FPWidth), NumSrcElt);
300 // Ask IR to do the conversion now that #elts line up.
301 C = ConstantExpr::getBitCast(C, SrcIVTy);
302 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
304 "Constant folding cannot fail for plain fp->int bitcast!");
305 }
306
307 // Handle byte source type by folding through integers. Byte types track
308 // poison per bit, so any poison bit makes the destination lane poison.
309 // Record which destination lanes contain poison bits, before the generic
310 // fold below refines them to undef/zero, so they can be restored.
311 SmallBitVector PoisonDstElts(NumDstElt);
312 if (SrcEltTy->isByteTy()) {
313 if (!computePoisonDstLanes(C, NumSrcElt, NumDstElt, PoisonDstElts))
314 return ConstantExpr::getBitCast(C, DestTy);
315
316 unsigned ByteWidth = SrcEltTy->getPrimitiveSizeInBits();
317 auto *SrcIVTy = FixedVectorType::get(
318 IntegerType::get(C->getContext(), ByteWidth), NumSrcElt);
319 // Ask IR to do the conversion now that #elts line up.
320 C = ConstantExpr::getBitCast(C, SrcIVTy);
321 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
323 "Constant folding cannot fail for plain byte->int bitcast!");
324 }
325
326 // Now we know that the input and output vectors are both integer vectors
327 // of the same size, and that their #elements is not the same.
328 // Use data buffer for easy non-integer element ratio vectors handling,
329 // For example: <4 x i24> to <3 x i32>.
330 bool isLittleEndian = DL.isLittleEndian();
331 unsigned SrcBitSize = SrcEltTy->getPrimitiveSizeInBits();
332 unsigned DstBitSize = DstEltTy->getPrimitiveSizeInBits();
334 unsigned SrcElt = 0;
335
336 APInt Buffer(2 * std::max(SrcBitSize, DstBitSize), 0);
337 APInt UndefMask(Buffer.getBitWidth(), 0);
338 APInt PoisonMask(Buffer.getBitWidth(), 0);
339 unsigned BufferBitSize = 0;
340
341 while (Result.size() != NumDstElt) {
342 // Load SrcElts into Buffer.
343 while (BufferBitSize < DstBitSize) {
344 Constant *Element = C->getAggregateElement(SrcElt++);
345 if (!Element) // Reject constantexpr elements
346 return ConstantExpr::getBitCast(C, DestTy);
347
348 // Shift Buffer & Masks to fit next SrcElt.
349 if (!isLittleEndian) {
350 Buffer <<= SrcBitSize;
351 UndefMask <<= SrcBitSize;
352 PoisonMask <<= SrcBitSize;
353 }
354
355 APInt SrcValue;
356 unsigned BitPosition = isLittleEndian ? BufferBitSize : 0;
357 if (isa<UndefValue>(Element)) {
358 // Set masks fragments bits.
359 UndefMask.setBits(BitPosition, BitPosition + SrcBitSize);
360 if (isa<PoisonValue>(Element))
361 PoisonMask.setBits(BitPosition, BitPosition + SrcBitSize);
362 SrcValue = APInt::getZero(DstBitSize);
363 } else {
364 auto *Src = dyn_cast<ConstantInt>(Element);
365 if (!Src)
366 return ConstantExpr::getBitCast(C, DestTy);
367 SrcValue = Src->getValue();
368 }
369
370 // Insert src element bits into Buffer on correct position.
371 Buffer.insertBits(SrcValue, BitPosition);
372 BufferBitSize += SrcBitSize;
373 }
374
375 // Create DstElts from Buffer.
376 while (BufferBitSize >= DstBitSize) {
377 unsigned ShiftAmt = isLittleEndian ? 0 : BufferBitSize - DstBitSize;
378 // Emit undef/poison, if all undef mask fragment bits are set.
379 if (UndefMask.extractBits(DstBitSize, ShiftAmt).isAllOnes()) {
380 // Push poison, if any bit in poison mask fragment is set.
381 if (!PoisonMask.extractBits(DstBitSize, ShiftAmt).isZero()) {
382 Result.push_back(PoisonValue::get(DstEltTy));
383 } else {
384 Result.push_back(UndefValue::get(DstEltTy));
385 }
386 } else {
387 // Create and push DstElt.
388 APInt Elt = Buffer.extractBits(DstBitSize, ShiftAmt);
389 Result.push_back(ConstantInt::get(DstEltTy, Elt));
390 }
391
392 // Shift unused Buffer fragment to lower bits.
393 if (isLittleEndian) {
394 Buffer.lshrInPlace(DstBitSize);
395 UndefMask.lshrInPlace(DstBitSize);
396 PoisonMask.lshrInPlace(DstBitSize);
397 }
398 BufferBitSize -= DstBitSize;
399 }
400 }
401
402 // Restore destination lanes whose source bytes contained poison bits.
403 for (unsigned I : PoisonDstElts.set_bits())
404 Result[I] = PoisonValue::get(DstEltTy);
405
406 return ConstantVector::get(Result);
407}
408
409} // end anonymous namespace
410
411/// If this constant is a constant offset from a global, return the global and
412/// the constant. Because of constantexprs, this function is recursive.
414 APInt &Offset, const DataLayout &DL,
415 DSOLocalEquivalent **DSOEquiv) {
416 if (DSOEquiv)
417 *DSOEquiv = nullptr;
418
419 // Trivial case, constant is the global.
420 if ((GV = dyn_cast<GlobalValue>(C))) {
421 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
422 Offset = APInt(BitWidth, 0);
423 return true;
424 }
425
426 if (auto *FoundDSOEquiv = dyn_cast<DSOLocalEquivalent>(C)) {
427 if (DSOEquiv)
428 *DSOEquiv = FoundDSOEquiv;
429 GV = FoundDSOEquiv->getGlobalValue();
430 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
431 Offset = APInt(BitWidth, 0);
432 return true;
433 }
434
435 // Otherwise, if this isn't a constant expr, bail out.
436 auto *CE = dyn_cast<ConstantExpr>(C);
437 if (!CE) return false;
438
439 // Look through ptr->int and ptr->ptr casts.
440 if (CE->getOpcode() == Instruction::PtrToInt ||
441 CE->getOpcode() == Instruction::PtrToAddr)
442 return IsConstantOffsetFromGlobal(CE->getOperand(0), GV, Offset, DL,
443 DSOEquiv);
444
445 // i32* getelementptr ([5 x i32]* @a, i32 0, i32 5)
446 auto *GEP = dyn_cast<GEPOperator>(CE);
447 if (!GEP)
448 return false;
449
450 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
451 APInt TmpOffset(BitWidth, 0);
452
453 // If the base isn't a global+constant, we aren't either.
454 if (!IsConstantOffsetFromGlobal(CE->getOperand(0), GV, TmpOffset, DL,
455 DSOEquiv))
456 return false;
457
458 // Otherwise, add any offset that our operands provide.
459 if (!GEP->accumulateConstantOffset(DL, TmpOffset))
460 return false;
461
462 Offset = TmpOffset;
463 return true;
464}
465
467 const DataLayout &DL) {
468 do {
469 Type *SrcTy = C->getType();
470 if (SrcTy == DestTy)
471 return C;
472
473 TypeSize DestSize = DL.getTypeSizeInBits(DestTy);
474 TypeSize SrcSize = DL.getTypeSizeInBits(SrcTy);
475 if (!TypeSize::isKnownGE(SrcSize, DestSize))
476 return nullptr;
477
478 // Catch the obvious splat cases (since all-zeros can coerce non-integral
479 // pointers legally).
480 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
481 return Res;
482
483 // If the type sizes are the same and a cast is legal, just directly
484 // cast the constant.
485 // But be careful not to coerce non-integral pointers illegally.
486 if (SrcSize == DestSize &&
487 DL.isNonIntegralPointerType(SrcTy->getScalarType()) ==
488 DL.isNonIntegralPointerType(DestTy->getScalarType())) {
489 Instruction::CastOps Cast = Instruction::BitCast;
490 // If we are going from a pointer to int or vice versa, we spell the cast
491 // differently.
492 if (SrcTy->isIntegerTy() && DestTy->isPointerTy())
493 Cast = Instruction::IntToPtr;
494 else if (SrcTy->isPointerTy() && DestTy->isIntegerTy())
495 Cast = Instruction::PtrToInt;
496
497 if (CastInst::castIsValid(Cast, C, DestTy))
498 return ConstantFoldCastOperand(Cast, C, DestTy, DL);
499 }
500
501 // If this isn't an aggregate type, there is nothing we can do to drill down
502 // and find a bitcastable constant.
503 if (!SrcTy->isAggregateType() && !SrcTy->isVectorTy())
504 return nullptr;
505
506 // We're simulating a load through a pointer that was bitcast to point to
507 // a different type, so we can try to walk down through the initial
508 // elements of an aggregate to see if some part of the aggregate is
509 // castable to implement the "load" semantic model.
510 if (SrcTy->isStructTy()) {
511 // Struct types might have leading zero-length elements like [0 x i32],
512 // which are certainly not what we are looking for, so skip them.
513 unsigned Elem = 0;
514 Constant *ElemC;
515 do {
516 ElemC = C->getAggregateElement(Elem++);
517 } while (ElemC && DL.getTypeSizeInBits(ElemC->getType()).isZero());
518 C = ElemC;
519 } else {
520 // For non-byte-sized vector elements, the first element is not
521 // necessarily located at the vector base address.
522 if (auto *VT = dyn_cast<VectorType>(SrcTy))
523 if (!DL.typeSizeEqualsStoreSize(VT->getElementType()))
524 return nullptr;
525
526 C = C->getAggregateElement(0u);
527 }
528 } while (C);
529
530 return nullptr;
531}
532
533namespace {
534
535/// Recursive helper to read bits out of global. C is the constant being copied
536/// out of. ByteOffset is an offset into C. CurPtr is the pointer to copy
537/// results into and BytesLeft is the number of bytes left in
538/// the CurPtr buffer. DL is the DataLayout.
539bool ReadDataFromGlobal(Constant *C, uint64_t ByteOffset, unsigned char *CurPtr,
540 unsigned BytesLeft, const DataLayout &DL) {
541 assert(ByteOffset <= DL.getTypeAllocSize(C->getType()) &&
542 "Out of range access");
543
544 // Reading type padding, return zero.
545 if (ByteOffset >= DL.getTypeStoreSize(C->getType()))
546 return true;
547
548 // If this element is zero or undefined, we can just return since *CurPtr is
549 // zero initialized.
551 return true;
552
553 auto *CI = dyn_cast<ConstantInt>(C);
554 if (CI && CI->getType()->isIntegerTy()) {
555 if ((CI->getBitWidth() & 7) != 0)
556 return false;
557 const APInt &Val = CI->getValue();
558 unsigned IntBytes = unsigned(CI->getBitWidth()/8);
559
560 for (unsigned i = 0; i != BytesLeft && ByteOffset != IntBytes; ++i) {
561 unsigned n = ByteOffset;
562 if (!DL.isLittleEndian())
563 n = IntBytes - n - 1;
564 CurPtr[i] = Val.extractBits(8, n * 8).getZExtValue();
565 ++ByteOffset;
566 }
567 return true;
568 }
569
570 auto *CFP = dyn_cast<ConstantFP>(C);
571 if (CFP && CFP->getType()->isFloatingPointTy()) {
572 if (CFP->getType()->isDoubleTy()) {
573 C = FoldBitCast(C, Type::getInt64Ty(C->getContext()), DL);
574 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
575 }
576 if (CFP->getType()->isFloatTy()){
577 C = FoldBitCast(C, Type::getInt32Ty(C->getContext()), DL);
578 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
579 }
580 if (CFP->getType()->isHalfTy()){
581 C = FoldBitCast(C, Type::getInt16Ty(C->getContext()), DL);
582 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL);
583 }
584 return false;
585 }
586
587 if (auto *CS = dyn_cast<ConstantStruct>(C)) {
588 const StructLayout *SL = DL.getStructLayout(CS->getType());
589 unsigned Index = SL->getElementContainingOffset(ByteOffset);
590 uint64_t CurEltOffset = SL->getElementOffset(Index);
591 ByteOffset -= CurEltOffset;
592
593 while (true) {
594 // If the element access is to the element itself and not to tail padding,
595 // read the bytes from the element.
596 uint64_t EltSize = DL.getTypeAllocSize(CS->getOperand(Index)->getType());
597
598 if (ByteOffset < EltSize &&
599 !ReadDataFromGlobal(CS->getOperand(Index), ByteOffset, CurPtr,
600 BytesLeft, DL))
601 return false;
602
603 ++Index;
604
605 // Check to see if we read from the last struct element, if so we're done.
606 if (Index == CS->getType()->getNumElements())
607 return true;
608
609 // If we read all of the bytes we needed from this element we're done.
610 uint64_t NextEltOffset = SL->getElementOffset(Index);
611
612 if (BytesLeft <= NextEltOffset - CurEltOffset - ByteOffset)
613 return true;
614
615 // Move to the next element of the struct.
616 CurPtr += NextEltOffset - CurEltOffset - ByteOffset;
617 BytesLeft -= NextEltOffset - CurEltOffset - ByteOffset;
618 ByteOffset = 0;
619 CurEltOffset = NextEltOffset;
620 }
621 // not reached.
622 }
623
627 uint64_t NumElts, EltSize;
628 Type *EltTy;
629 if (auto *AT = dyn_cast<ArrayType>(C->getType())) {
630 NumElts = AT->getNumElements();
631 EltTy = AT->getElementType();
632 EltSize = DL.getTypeAllocSize(EltTy);
633 } else {
634 NumElts = cast<FixedVectorType>(C->getType())->getNumElements();
635 EltTy = cast<FixedVectorType>(C->getType())->getElementType();
636 // TODO: For non-byte-sized vectors, current implementation assumes there is
637 // padding to the next byte boundary between elements.
638 if (!DL.typeSizeEqualsStoreSize(EltTy))
639 return false;
640
641 EltSize = DL.getTypeStoreSize(EltTy);
642 }
643 uint64_t Index = ByteOffset / EltSize;
644 uint64_t Offset = ByteOffset - Index * EltSize;
645
646 for (; Index != NumElts; ++Index) {
647 if (!ReadDataFromGlobal(C->getAggregateElement(Index), Offset, CurPtr,
648 BytesLeft, DL))
649 return false;
650
651 uint64_t BytesWritten = EltSize - Offset;
652 assert(BytesWritten <= EltSize && "Not indexing into this element?");
653 if (BytesWritten >= BytesLeft)
654 return true;
655
656 Offset = 0;
657 BytesLeft -= BytesWritten;
658 CurPtr += BytesWritten;
659 }
660 return true;
661 }
662
663 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
664 if (CE->getOpcode() == Instruction::IntToPtr &&
665 CE->getOperand(0)->getType() == DL.getIntPtrType(CE->getType())) {
666 return ReadDataFromGlobal(CE->getOperand(0), ByteOffset, CurPtr,
667 BytesLeft, DL);
668 }
669 }
670
671 // Otherwise, unknown initializer type.
672 return false;
673}
674
675Constant *FoldReinterpretLoadFromConst(Constant *C, Type *LoadTy,
676 int64_t Offset, const DataLayout &DL) {
677 // Bail out early. Not expect to load from scalable global variable.
678 if (isa<ScalableVectorType>(LoadTy))
679 return nullptr;
680
681 auto *IntType = dyn_cast<IntegerType>(LoadTy);
682
683 // If this isn't an integer load we can't fold it directly.
684 if (!IntType) {
685 // If this is a non-integer load, we can try folding it as an int load and
686 // then bitcast the result. This can be useful for union cases. Note
687 // that address spaces don't matter here since we're not going to result in
688 // an actual new load.
689 if (!LoadTy->isFloatingPointTy() && !LoadTy->isPointerTy() &&
690 !LoadTy->isVectorTy())
691 return nullptr;
692
693 Type *MapTy = Type::getIntNTy(C->getContext(),
694 DL.getTypeSizeInBits(LoadTy).getFixedValue());
695 if (Constant *Res = FoldReinterpretLoadFromConst(C, MapTy, Offset, DL)) {
696 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
697 // Materializing a zero can be done trivially without a bitcast
698 return Constant::getNullValue(LoadTy);
699 Type *CastTy = LoadTy->isPtrOrPtrVectorTy() ? DL.getIntPtrType(LoadTy) : LoadTy;
700 Res = FoldBitCast(Res, CastTy, DL);
701 if (LoadTy->isPtrOrPtrVectorTy()) {
702 // For vector of pointer, we needed to first convert to a vector of integer, then do vector inttoptr
703 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
704 return Constant::getNullValue(LoadTy);
705 if (DL.isNonIntegralPointerType(LoadTy->getScalarType()))
706 // Be careful not to replace a load of an addrspace value with an inttoptr here
707 return nullptr;
708 Res = ConstantExpr::getIntToPtr(Res, LoadTy);
709 }
710 return Res;
711 }
712 return nullptr;
713 }
714
715 unsigned BytesLoaded = (IntType->getBitWidth() + 7) / 8;
716 if (BytesLoaded > 32 || BytesLoaded == 0)
717 return nullptr;
718
719 // If we're not accessing anything in this constant, the result is undefined.
720 if (Offset <= -1 * static_cast<int64_t>(BytesLoaded))
721 return PoisonValue::get(IntType);
722
723 // TODO: We should be able to support scalable types.
724 TypeSize InitializerSize = DL.getTypeAllocSize(C->getType());
725 if (InitializerSize.isScalable())
726 return nullptr;
727
728 // If we're not accessing anything in this constant, the result is undefined.
729 if (Offset >= (int64_t)InitializerSize.getFixedValue())
730 return PoisonValue::get(IntType);
731
732 unsigned char RawBytes[32] = {0};
733 unsigned char *CurPtr = RawBytes;
734 unsigned BytesLeft = BytesLoaded;
735
736 // If we're loading off the beginning of the global, some bytes may be valid.
737 if (Offset < 0) {
738 CurPtr += -Offset;
739 BytesLeft += Offset;
740 Offset = 0;
741 }
742
743 if (!ReadDataFromGlobal(C, Offset, CurPtr, BytesLeft, DL))
744 return nullptr;
745
746 APInt ResultVal = APInt(IntType->getBitWidth(), 0);
747 if (DL.isLittleEndian()) {
748 ResultVal = RawBytes[BytesLoaded - 1];
749 for (unsigned i = 1; i != BytesLoaded; ++i) {
750 ResultVal <<= 8;
751 ResultVal |= RawBytes[BytesLoaded - 1 - i];
752 }
753 } else {
754 ResultVal = RawBytes[0];
755 for (unsigned i = 1; i != BytesLoaded; ++i) {
756 ResultVal <<= 8;
757 ResultVal |= RawBytes[i];
758 }
759 }
760
761 return ConstantInt::get(IntType->getContext(), ResultVal);
762}
763
764} // anonymous namespace
765
766// If GV is a constant with an initializer read its representation starting
767// at Offset and return it as a constant array of unsigned char. Otherwise
768// return null.
771 if (!GV->isConstant() || !GV->hasDefinitiveInitializer())
772 return nullptr;
773
774 const DataLayout &DL = GV->getDataLayout();
775 Constant *Init = const_cast<Constant *>(GV->getInitializer());
776 TypeSize InitSize = DL.getTypeAllocSize(Init->getType());
777 if (InitSize < Offset)
778 return nullptr;
779
780 uint64_t NBytes = InitSize - Offset;
781 if (NBytes > UINT16_MAX)
782 // Bail for large initializers in excess of 64K to avoid allocating
783 // too much memory.
784 // Offset is assumed to be less than or equal than InitSize (this
785 // is enforced in ReadDataFromGlobal).
786 return nullptr;
787
788 SmallVector<unsigned char, 256> RawBytes(static_cast<size_t>(NBytes));
789 unsigned char *CurPtr = RawBytes.data();
790
791 if (!ReadDataFromGlobal(Init, Offset, CurPtr, NBytes, DL))
792 return nullptr;
793
794 return ConstantDataArray::get(GV->getContext(), RawBytes);
795}
796
797/// If this Offset points exactly to the start of an aggregate element, return
798/// that element, otherwise return nullptr.
800 const DataLayout &DL) {
801 if (Offset.isZero())
802 return Base;
803
805 return nullptr;
806
807 Type *ElemTy = Base->getType();
808 SmallVector<APInt> Indices = DL.getGEPIndicesForOffset(ElemTy, Offset);
809 if (!Offset.isZero() || !Indices[0].isZero())
810 return nullptr;
811
812 Constant *C = Base;
813 for (const APInt &Index : drop_begin(Indices)) {
814 if (Index.isNegative() || Index.getActiveBits() >= 32)
815 return nullptr;
816
817 C = C->getAggregateElement(Index.getZExtValue());
818 if (!C)
819 return nullptr;
820 }
821
822 return C;
823}
824
826 const APInt &Offset,
827 const DataLayout &DL) {
828 if (Constant *AtOffset = getConstantAtOffset(C, Offset, DL))
829 if (Constant *Result = ConstantFoldLoadThroughBitcast(AtOffset, Ty, DL))
830 return Result;
831
832 // Explicitly check for out-of-bounds access, so we return poison even if the
833 // constant is a uniform value.
834 TypeSize Size = DL.getTypeAllocSize(C->getType());
835 if (!Size.isScalable() && Offset.sge(Size.getFixedValue()))
836 return PoisonValue::get(Ty);
837
838 // Try an offset-independent fold of a uniform value.
839 if (Constant *Result = ConstantFoldLoadFromUniformValue(C, Ty, DL))
840 return Result;
841
842 // Try hard to fold loads from bitcasted strange and non-type-safe things.
843 if (Offset.getSignificantBits() <= 64)
844 if (Constant *Result =
845 FoldReinterpretLoadFromConst(C, Ty, Offset.getSExtValue(), DL))
846 return Result;
847
848 return nullptr;
849}
850
855
858 const DataLayout &DL) {
859 // We can only fold loads from constant globals with a definitive initializer.
860 // Check this upfront, to skip expensive offset calculations.
862 if (!GV || !GV->isConstant() || !GV->hasDefinitiveInitializer())
863 return nullptr;
864
865 C = cast<Constant>(C->stripAndAccumulateConstantOffsets(
866 DL, Offset, /* AllowNonInbounds */ true));
867
868 if (C == GV)
869 if (Constant *Result = ConstantFoldLoadFromConst(GV->getInitializer(), Ty,
870 Offset, DL))
871 return Result;
872
873 // If this load comes from anywhere in a uniform constant global, the value
874 // is always the same, regardless of the loaded offset.
875 return ConstantFoldLoadFromUniformValue(GV->getInitializer(), Ty, DL);
876}
877
879 const DataLayout &DL) {
880 APInt Offset(DL.getIndexTypeSizeInBits(C->getType()), 0);
881 return ConstantFoldLoadFromConstPtr(C, Ty, std::move(Offset), DL);
882}
883
885 const DataLayout &DL) {
886 if (isa<PoisonValue>(C))
887 return PoisonValue::get(Ty);
888 if (isa<UndefValue>(C))
889 return UndefValue::get(Ty);
890 // If padding is needed when storing C to memory, then it isn't considered as
891 // uniform.
892 if (!DL.typeSizeEqualsStoreSize(C->getType()))
893 return nullptr;
894 if (C->isNullValue() && !Ty->isX86_AMXTy())
895 return Constant::getNullValue(Ty);
896 if (C->isAllOnesValue() &&
897 (Ty->isIntOrIntVectorTy() || Ty->isFPOrFPVectorTy()))
898 return Constant::getAllOnesValue(Ty);
899 return nullptr;
900}
901
902namespace {
903
904/// One of Op0/Op1 is a constant expression.
905/// Attempt to symbolically evaluate the result of a binary operator merging
906/// these together. If target data info is available, it is provided as DL,
907/// otherwise DL is null.
908Constant *SymbolicallyEvaluateBinop(unsigned Opc, Constant *Op0, Constant *Op1,
909 const DataLayout &DL) {
910 // SROA
911
912 // Fold (and 0xffffffff00000000, (shl x, 32)) -> shl.
913 // Fold (lshr (or X, Y), 32) -> (lshr [X/Y], 32) if one doesn't contribute
914 // bits.
915
916 if (Opc == Instruction::And) {
917 KnownBits Known0 = computeKnownBits(Op0, DL);
918 KnownBits Known1 = computeKnownBits(Op1, DL);
919 if ((Known1.One | Known0.Zero).isAllOnes()) {
920 // All the bits of Op0 that the 'and' could be masking are already zero.
921 return Op0;
922 }
923 if ((Known0.One | Known1.Zero).isAllOnes()) {
924 // All the bits of Op1 that the 'and' could be masking are already zero.
925 return Op1;
926 }
927
928 Known0 &= Known1;
929 if (Known0.isConstant())
930 return ConstantInt::get(Op0->getType(), Known0.getConstant());
931 }
932
933 // If the constant expr is something like &A[123] - &A[4].f, fold this into a
934 // constant. This happens frequently when iterating over a global array.
935 if (Opc == Instruction::Sub) {
936 GlobalValue *GV1, *GV2;
937 APInt Offs1, Offs2;
938
939 if (IsConstantOffsetFromGlobal(Op0, GV1, Offs1, DL))
940 if (IsConstantOffsetFromGlobal(Op1, GV2, Offs2, DL) && GV1 == GV2) {
941 unsigned OpSize = DL.getTypeSizeInBits(Op0->getType());
942
943 // (&GV+C1) - (&GV+C2) -> C1-C2, pointer arithmetic cannot overflow.
944 // PtrToInt may change the bitwidth so we have convert to the right size
945 // first.
946 return ConstantInt::get(Op0->getType(), Offs1.zextOrTrunc(OpSize) -
947 Offs2.zextOrTrunc(OpSize));
948 }
949 }
950
951 return nullptr;
952}
953
954/// If array indices are not pointer-sized integers, explicitly cast them so
955/// that they aren't implicitly casted by the getelementptr.
956Constant *CastGEPIndices(Type *SrcElemTy, ArrayRef<Constant *> Ops,
957 Type *ResultTy, GEPNoWrapFlags NW,
958 std::optional<ConstantRange> InRange,
959 const DataLayout &DL, const TargetLibraryInfo *TLI) {
960 Type *IntIdxTy = DL.getIndexType(ResultTy);
961 Type *IntIdxScalarTy = IntIdxTy->getScalarType();
962
963 bool Any = false;
965 for (unsigned i = 1, e = Ops.size(); i != e; ++i) {
966 if ((i == 1 ||
968 SrcElemTy, Ops.slice(1, i - 1)))) &&
969 Ops[i]->getType()->getScalarType() != IntIdxScalarTy) {
970 Any = true;
971 Type *NewType =
972 Ops[i]->getType()->isVectorTy() ? IntIdxTy : IntIdxScalarTy;
974 CastInst::getCastOpcode(Ops[i], true, NewType, true), Ops[i], NewType,
975 DL);
976 if (!NewIdx)
977 return nullptr;
978 NewIdxs.push_back(NewIdx);
979 } else
980 NewIdxs.push_back(Ops[i]);
981 }
982
983 if (!Any)
984 return nullptr;
985
986 Constant *C =
987 ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], NewIdxs, NW, InRange);
988 return ConstantFoldConstant(C, DL, TLI);
989}
990
991/// If we can symbolically evaluate the GEP constant expression, do so.
992Constant *SymbolicallyEvaluateGEP(const GEPOperator *GEP,
994 const DataLayout &DL,
995 const TargetLibraryInfo *TLI) {
996 Type *SrcElemTy = GEP->getSourceElementType();
997 Type *ResTy = GEP->getType();
998 if (!SrcElemTy->isSized() || isa<ScalableVectorType>(SrcElemTy))
999 return nullptr;
1000
1001 if (Constant *C = CastGEPIndices(SrcElemTy, Ops, ResTy, GEP->getNoWrapFlags(),
1002 GEP->getInRange(), DL, TLI))
1003 return C;
1004
1005 Constant *Ptr = Ops[0];
1006 if (!Ptr->getType()->isPointerTy())
1007 return nullptr;
1008
1009 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1010
1011 for (unsigned i = 1, e = Ops.size(); i != e; ++i)
1012 if (!isa<ConstantInt>(Ops[i]) || !Ops[i]->getType()->isIntegerTy())
1013 return nullptr;
1014
1015 unsigned BitWidth = DL.getTypeSizeInBits(IntIdxTy);
1016 APInt Offset = APInt(
1017 BitWidth,
1018 DL.getIndexedOffsetInType(
1019 SrcElemTy, ArrayRef((Value *const *)Ops.data() + 1, Ops.size() - 1)),
1020 /*isSigned=*/true, /*implicitTrunc=*/true);
1021
1022 std::optional<ConstantRange> InRange = GEP->getInRange();
1023 if (InRange)
1024 InRange = InRange->sextOrTrunc(BitWidth);
1025
1026 // If this is a GEP of a GEP, fold it all into a single GEP.
1027 GEPNoWrapFlags NW = GEP->getNoWrapFlags();
1028 bool Overflow = false;
1029 while (auto *GEP = dyn_cast<GEPOperator>(Ptr)) {
1030 NW &= GEP->getNoWrapFlags();
1031
1032 SmallVector<Value *, 4> NestedOps(llvm::drop_begin(GEP->operands()));
1033
1034 // Do not try the incorporate the sub-GEP if some index is not a number.
1035 bool AllConstantInt = true;
1036 for (Value *NestedOp : NestedOps)
1037 if (!isa<ConstantInt>(NestedOp)) {
1038 AllConstantInt = false;
1039 break;
1040 }
1041 if (!AllConstantInt)
1042 break;
1043
1044 // Adjust inrange offset and intersect inrange attributes
1045 if (auto GEPRange = GEP->getInRange()) {
1046 auto AdjustedGEPRange = GEPRange->sextOrTrunc(BitWidth).subtract(Offset);
1047 InRange =
1048 InRange ? InRange->intersectWith(AdjustedGEPRange) : AdjustedGEPRange;
1049 }
1050
1051 Ptr = cast<Constant>(GEP->getOperand(0));
1052 SrcElemTy = GEP->getSourceElementType();
1053 Offset = Offset.sadd_ov(
1054 APInt(BitWidth, DL.getIndexedOffsetInType(SrcElemTy, NestedOps),
1055 /*isSigned=*/true, /*implicitTrunc=*/true),
1056 Overflow);
1057 }
1058
1059 // Preserving nusw (without inbounds) also requires that the offset
1060 // additions did not overflow.
1061 if (NW.hasNoUnsignedSignedWrap() && !NW.isInBounds() && Overflow)
1063
1064 // If the base value for this address is a literal integer value, fold the
1065 // getelementptr to the resulting integer value casted to the pointer type.
1066 APInt BaseIntVal(DL.getPointerTypeSizeInBits(Ptr->getType()), 0);
1067 if (auto *CE = dyn_cast<ConstantExpr>(Ptr)) {
1068 if (CE->getOpcode() == Instruction::IntToPtr) {
1069 if (auto *Base = dyn_cast<ConstantInt>(CE->getOperand(0)))
1070 BaseIntVal = Base->getValue().zextOrTrunc(BaseIntVal.getBitWidth());
1071 }
1072 }
1073
1074 if ((Ptr->isNullValue() || BaseIntVal != 0) &&
1075 !DL.mustNotIntroduceIntToPtr(Ptr->getType())) {
1076
1077 // If the index size is smaller than the pointer size, add to the low
1078 // bits only.
1079 BaseIntVal.insertBits(BaseIntVal.trunc(BitWidth) + Offset, 0);
1080 Constant *C = ConstantInt::get(Ptr->getContext(), BaseIntVal);
1081 return ConstantExpr::getIntToPtr(C, ResTy);
1082 }
1083
1084 // Try to infer inbounds for GEPs of globals.
1085 if (!NW.isInBounds() && Offset.isNonNegative()) {
1086 bool CanBeNull, CanBeFreed;
1087 uint64_t DerefBytes =
1088 Ptr->getPointerDereferenceableBytes(DL, CanBeNull, CanBeFreed);
1089 if (DerefBytes != 0 && !CanBeNull && Offset.sle(DerefBytes))
1091 }
1092
1093 // nusw + nneg -> nuw
1094 if (NW.hasNoUnsignedSignedWrap() && Offset.isNonNegative())
1096
1097 // Otherwise canonicalize this to a single ptradd.
1098 LLVMContext &Ctx = Ptr->getContext();
1099 return ConstantExpr::getPtrAdd(Ptr, ConstantInt::get(Ctx, Offset), NW,
1100 InRange);
1101}
1102
1103/// Attempt to constant fold an instruction with the
1104/// specified opcode and operands. If successful, the constant result is
1105/// returned, if not, null is returned. Note that this function can fail when
1106/// attempting to fold instructions like loads and stores, which have no
1107/// constant expression form.
1108Constant *ConstantFoldInstOperandsImpl(const Value *InstOrCE, unsigned Opcode,
1110 const DataLayout &DL,
1111 const TargetLibraryInfo *TLI,
1112 bool AllowNonDeterministic) {
1113 Type *DestTy = InstOrCE->getType();
1114
1115 if (Instruction::isUnaryOp(Opcode))
1116 return ConstantFoldUnaryOpOperand(Opcode, Ops[0], DL);
1117
1118 if (Instruction::isBinaryOp(Opcode)) {
1119 switch (Opcode) {
1120 default:
1121 break;
1122 case Instruction::FAdd:
1123 case Instruction::FSub:
1124 case Instruction::FMul:
1125 case Instruction::FDiv:
1126 case Instruction::FRem:
1127 // Handle floating point instructions separately to account for denormals
1128 // TODO: If a constant expression is being folded rather than an
1129 // instruction, denormals will not be flushed/treated as zero
1130 if (const auto *I = dyn_cast<Instruction>(InstOrCE)) {
1131 return ConstantFoldFPInstOperands(Opcode, Ops[0], Ops[1], DL, I,
1132 AllowNonDeterministic);
1133 }
1134 }
1135 return ConstantFoldBinaryOpOperands(Opcode, Ops[0], Ops[1], DL);
1136 }
1137
1138 if (Instruction::isCast(Opcode))
1139 return ConstantFoldCastOperand(Opcode, Ops[0], DestTy, DL);
1140
1141 if (auto *GEP = dyn_cast<GEPOperator>(InstOrCE)) {
1142 Type *SrcElemTy = GEP->getSourceElementType();
1144 return nullptr;
1145
1146 if (Constant *C = SymbolicallyEvaluateGEP(GEP, Ops, DL, TLI))
1147 return C;
1148
1149 return ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], Ops.slice(1),
1150 GEP->getNoWrapFlags(),
1151 GEP->getInRange());
1152 }
1153
1154 if (auto *CE = dyn_cast<ConstantExpr>(InstOrCE))
1155 return CE->getWithOperands(Ops);
1156
1157 switch (Opcode) {
1158 default: return nullptr;
1159 case Instruction::ICmp:
1160 case Instruction::FCmp: {
1161 auto *C = cast<CmpInst>(InstOrCE);
1162 return ConstantFoldCompareInstOperands(C->getPredicate(), Ops[0], Ops[1],
1163 DL, TLI, C);
1164 }
1165 case Instruction::Freeze:
1166 return isGuaranteedNotToBeUndefOrPoison(Ops[0]) ? Ops[0] : nullptr;
1167 case Instruction::Call:
1168 if (auto *F = dyn_cast<Function>(Ops.back())) {
1169 const auto *Call = cast<CallBase>(InstOrCE);
1171 return ConstantFoldCall(Call, F, Ops.slice(0, Ops.size() - 1), TLI,
1172 AllowNonDeterministic);
1173 }
1174 return nullptr;
1175 case Instruction::Select:
1176 return ConstantFoldSelectInstruction(Ops[0], Ops[1], Ops[2]);
1177 case Instruction::ExtractElement:
1179 case Instruction::ExtractValue:
1181 Ops[0], cast<ExtractValueInst>(InstOrCE)->getIndices());
1182 case Instruction::InsertElement:
1183 return ConstantExpr::getInsertElement(Ops[0], Ops[1], Ops[2]);
1184 case Instruction::InsertValue:
1186 Ops[0], Ops[1], cast<InsertValueInst>(InstOrCE)->getIndices());
1187 case Instruction::ShuffleVector:
1189 Ops[0], Ops[1], cast<ShuffleVectorInst>(InstOrCE)->getShuffleMask());
1190 case Instruction::Load: {
1191 const auto *LI = dyn_cast<LoadInst>(InstOrCE);
1192 if (LI->isVolatile())
1193 return nullptr;
1194 return ConstantFoldLoadFromConstPtr(Ops[0], LI->getType(), DL);
1195 }
1196 }
1197}
1198
1199} // end anonymous namespace
1200
1201//===----------------------------------------------------------------------===//
1202// Constant Folding public APIs
1203//===----------------------------------------------------------------------===//
1204
1205namespace {
1206
1207Constant *
1208ConstantFoldConstantImpl(const Constant *C, const DataLayout &DL,
1209 const TargetLibraryInfo *TLI,
1212 return const_cast<Constant *>(C);
1213
1215 for (const Use &OldU : C->operands()) {
1216 Constant *OldC = cast<Constant>(&OldU);
1217 Constant *NewC = OldC;
1218 // Recursively fold the ConstantExpr's operands. If we have already folded
1219 // a ConstantExpr, we don't have to process it again.
1220 if (isa<ConstantVector>(OldC) || isa<ConstantExpr>(OldC)) {
1221 auto It = FoldedOps.find(OldC);
1222 if (It == FoldedOps.end()) {
1223 NewC = ConstantFoldConstantImpl(OldC, DL, TLI, FoldedOps);
1224 FoldedOps.insert({OldC, NewC});
1225 } else {
1226 NewC = It->second;
1227 }
1228 }
1229 Ops.push_back(NewC);
1230 }
1231
1232 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1233 if (Constant *Res = ConstantFoldInstOperandsImpl(
1234 CE, CE->getOpcode(), Ops, DL, TLI, /*AllowNonDeterministic=*/true))
1235 return Res;
1236 return const_cast<Constant *>(C);
1237 }
1238
1240 return ConstantVector::get(Ops);
1241}
1242
1243} // end anonymous namespace
1244
1246 const DataLayout &DL,
1247 const TargetLibraryInfo *TLI) {
1248 // Handle PHI nodes quickly here...
1249 if (auto *PN = dyn_cast<PHINode>(I)) {
1250 Constant *CommonValue = nullptr;
1251
1253 for (Value *Incoming : PN->incoming_values()) {
1254 // If the incoming value is undef then skip it. Note that while we could
1255 // skip the value if it is equal to the phi node itself we choose not to
1256 // because that would break the rule that constant folding only applies if
1257 // all operands are constants.
1258 if (isa<UndefValue>(Incoming))
1259 continue;
1260 // If the incoming value is not a constant, then give up.
1261 auto *C = dyn_cast<Constant>(Incoming);
1262 if (!C)
1263 return nullptr;
1264 // Fold the PHI's operands.
1265 C = ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1266 // If the incoming value is a different constant to
1267 // the one we saw previously, then give up.
1268 if (CommonValue && C != CommonValue)
1269 return nullptr;
1270 CommonValue = C;
1271 }
1272
1273 // If we reach here, all incoming values are the same constant or undef.
1274 return CommonValue ? CommonValue : UndefValue::get(PN->getType());
1275 }
1276
1277 // Scan the operand list, checking to see if they are all constants, if so,
1278 // hand off to ConstantFoldInstOperandsImpl.
1279 if (!all_of(I->operands(), [](const Use &U) { return isa<Constant>(U); }))
1280 return nullptr;
1281
1284 for (const Use &OpU : I->operands()) {
1285 auto *Op = cast<Constant>(&OpU);
1286 // Fold the Instruction's operands.
1287 Op = ConstantFoldConstantImpl(Op, DL, TLI, FoldedOps);
1288 Ops.push_back(Op);
1289 }
1290
1291 return ConstantFoldInstOperands(I, Ops, DL, TLI);
1292}
1293
1295 const TargetLibraryInfo *TLI) {
1297 return ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1298}
1299
1302 const DataLayout &DL,
1303 const TargetLibraryInfo *TLI,
1304 bool AllowNonDeterministic) {
1305 return ConstantFoldInstOperandsImpl(I, I->getOpcode(), Ops, DL, TLI,
1306 AllowNonDeterministic);
1307}
1308
1310 unsigned IntPredicate, Constant *Ops0, Constant *Ops1, const DataLayout &DL,
1311 const TargetLibraryInfo *TLI, const Instruction *I) {
1312 CmpInst::Predicate Predicate = (CmpInst::Predicate)IntPredicate;
1313 // fold: icmp (inttoptr x), null -> icmp x, 0
1314 // fold: icmp null, (inttoptr x) -> icmp 0, x
1315 // fold: icmp (ptrtoint x), 0 -> icmp x, null
1316 // fold: icmp 0, (ptrtoint x) -> icmp null, x
1317 // fold: icmp (inttoptr x), (inttoptr y) -> icmp trunc/zext x, trunc/zext y
1318 // fold: icmp (ptrtoint x), (ptrtoint y) -> icmp x, y
1319 //
1320 // FIXME: The following comment is out of data and the DataLayout is here now.
1321 // ConstantExpr::getCompare cannot do this, because it doesn't have DL
1322 // around to know if bit truncation is happening.
1323 if (auto *CE0 = dyn_cast<ConstantExpr>(Ops0)) {
1324 if (Ops1->isNullValue()) {
1325 if (CE0->getOpcode() == Instruction::IntToPtr) {
1326 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1327 // Convert the integer value to the right size to ensure we get the
1328 // proper extension or truncation.
1329 if (Constant *C = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1330 /*IsSigned*/ false, DL)) {
1331 Constant *Null = Constant::getNullValue(C->getType());
1332 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1333 }
1334 }
1335
1336 // icmp only compares the address part of the pointer, so only do this
1337 // transform if the integer size matches the address size.
1338 if (CE0->getOpcode() == Instruction::PtrToInt ||
1339 CE0->getOpcode() == Instruction::PtrToAddr) {
1340 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1341 if (CE0->getType() == AddrTy) {
1342 Constant *C = CE0->getOperand(0);
1343 Constant *Null = Constant::getNullValue(C->getType());
1344 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1345 }
1346 }
1347 }
1348
1349 if (auto *CE1 = dyn_cast<ConstantExpr>(Ops1)) {
1350 if (CE0->getOpcode() == CE1->getOpcode()) {
1351 if (CE0->getOpcode() == Instruction::IntToPtr) {
1352 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1353
1354 // Convert the integer value to the right size to ensure we get the
1355 // proper extension or truncation.
1356 Constant *C0 = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1357 /*IsSigned*/ false, DL);
1358 Constant *C1 = ConstantFoldIntegerCast(CE1->getOperand(0), IntPtrTy,
1359 /*IsSigned*/ false, DL);
1360 if (C0 && C1)
1361 return ConstantFoldCompareInstOperands(Predicate, C0, C1, DL, TLI);
1362 }
1363
1364 // icmp only compares the address part of the pointer, so only do this
1365 // transform if the integer size matches the address size.
1366 if (CE0->getOpcode() == Instruction::PtrToInt ||
1367 CE0->getOpcode() == Instruction::PtrToAddr) {
1368 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1369 if (CE0->getType() == AddrTy &&
1370 CE0->getOperand(0)->getType() == CE1->getOperand(0)->getType()) {
1372 Predicate, CE0->getOperand(0), CE1->getOperand(0), DL, TLI);
1373 }
1374 }
1375 }
1376 }
1377
1378 // Convert pointer comparison (base+offset1) pred (base+offset2) into
1379 // offset1 pred offset2, for the case where the offset is inbounds. This
1380 // only works for equality and unsigned comparison, as inbounds permits
1381 // crossing the sign boundary. However, the offset comparison itself is
1382 // signed.
1383 if (Ops0->getType()->isPointerTy() && !ICmpInst::isSigned(Predicate)) {
1384 unsigned IndexWidth = DL.getIndexTypeSizeInBits(Ops0->getType());
1385 APInt Offset0(IndexWidth, 0);
1386 bool IsEqPred = ICmpInst::isEquality(Predicate);
1387 Value *Stripped0 = Ops0->stripAndAccumulateConstantOffsets(
1388 DL, Offset0, /*AllowNonInbounds=*/IsEqPred,
1389 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1390 /*LookThroughIntToPtr=*/IsEqPred);
1391 APInt Offset1(IndexWidth, 0);
1392 Value *Stripped1 = Ops1->stripAndAccumulateConstantOffsets(
1393 DL, Offset1, /*AllowNonInbounds=*/IsEqPred,
1394 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1395 /*LookThroughIntToPtr=*/IsEqPred);
1396 if (Stripped0 == Stripped1)
1397 return ConstantInt::getBool(
1398 Ops0->getContext(),
1399 ICmpInst::compare(Offset0, Offset1,
1400 ICmpInst::getSignedPredicate(Predicate)));
1401 }
1402 } else if (isa<ConstantExpr>(Ops1)) {
1403 // If RHS is a constant expression, but the left side isn't, swap the
1404 // operands and try again.
1405 Predicate = ICmpInst::getSwappedPredicate(Predicate);
1406 return ConstantFoldCompareInstOperands(Predicate, Ops1, Ops0, DL, TLI);
1407 }
1408
1409 if (CmpInst::isFPPredicate(Predicate)) {
1410 // Flush any denormal constant float input according to denormal handling
1411 // mode.
1412 Ops0 = FlushFPConstant(Ops0, I, /*IsOutput=*/false);
1413 if (!Ops0)
1414 return nullptr;
1415 Ops1 = FlushFPConstant(Ops1, I, /*IsOutput=*/false);
1416 if (!Ops1)
1417 return nullptr;
1418 }
1419
1420 return ConstantFoldCompareInstruction(Predicate, Ops0, Ops1);
1421}
1422
1424 const DataLayout &DL) {
1426
1427 return ConstantFoldUnaryInstruction(Opcode, Op);
1428}
1429
1431 Constant *RHS,
1432 const DataLayout &DL) {
1434 if (isa<ConstantExpr>(LHS) || isa<ConstantExpr>(RHS))
1435 if (Constant *C = SymbolicallyEvaluateBinop(Opcode, LHS, RHS, DL))
1436 return C;
1437
1439 return ConstantExpr::get(Opcode, LHS, RHS);
1440 return ConstantFoldBinaryInstruction(Opcode, LHS, RHS);
1441}
1442
1445 switch (Mode) {
1447 return nullptr;
1448 case DenormalMode::IEEE:
1449 return ConstantFP::get(Ty->getContext(), APF);
1451 return ConstantFP::get(
1452 Ty->getContext(),
1455 return ConstantFP::get(Ty->getContext(),
1456 APFloat::getZero(APF.getSemantics(), false));
1457 default:
1458 break;
1459 }
1460
1461 llvm_unreachable("unknown denormal mode");
1462}
1463
1464/// Return the denormal mode that can be assumed when executing a floating point
1465/// operation at \p CtxI.
1467 if (!CtxI || !CtxI->getParent() || !CtxI->getFunction())
1468 return DenormalMode::getDynamic();
1469 return CtxI->getFunction()->getDenormalMode(
1470 Ty->getScalarType()->getFltSemantics());
1471}
1472
1474 const Instruction *Inst,
1475 bool IsOutput) {
1476 const APFloat &APF = CFP->getValueAPF();
1477 if (!APF.isDenormal())
1478 return CFP;
1479
1481 return flushDenormalConstant(CFP->getType(), APF,
1482 IsOutput ? Mode.Output : Mode.Input);
1483}
1484
1486 bool IsOutput) {
1487 if (ConstantFP *CFP = dyn_cast<ConstantFP>(Operand))
1488 return flushDenormalConstantFP(CFP, Inst, IsOutput);
1489
1491 return Operand;
1492
1493 Type *Ty = Operand->getType();
1494 VectorType *VecTy = dyn_cast<VectorType>(Ty);
1495 if (VecTy) {
1496 if (auto *Splat = dyn_cast_or_null<ConstantFP>(Operand->getSplatValue())) {
1497 ConstantFP *Folded = flushDenormalConstantFP(Splat, Inst, IsOutput);
1498 if (!Folded)
1499 return nullptr;
1500 return ConstantVector::getSplat(VecTy->getElementCount(), Folded);
1501 }
1502
1503 Ty = VecTy->getElementType();
1504 }
1505
1506 if (isa<ConstantExpr>(Operand))
1507 return Operand;
1508
1509 if (const auto *CV = dyn_cast<ConstantVector>(Operand)) {
1511 for (unsigned i = 0, e = CV->getNumOperands(); i != e; ++i) {
1512 Constant *Element = CV->getAggregateElement(i);
1513 if (isa<UndefValue>(Element)) {
1514 NewElts.push_back(Element);
1515 continue;
1516 }
1517
1518 ConstantFP *CFP = dyn_cast<ConstantFP>(Element);
1519 if (!CFP)
1520 return nullptr;
1521
1522 ConstantFP *Folded = flushDenormalConstantFP(CFP, Inst, IsOutput);
1523 if (!Folded)
1524 return nullptr;
1525 NewElts.push_back(Folded);
1526 }
1527
1528 return ConstantVector::get(NewElts);
1529 }
1530
1531 if (const auto *CDV = dyn_cast<ConstantDataVector>(Operand)) {
1533 for (unsigned I = 0, E = CDV->getNumElements(); I < E; ++I) {
1534 const APFloat &Elt = CDV->getElementAsAPFloat(I);
1535 if (!Elt.isDenormal()) {
1536 NewElts.push_back(ConstantFP::get(Ty, Elt));
1537 } else {
1538 DenormalMode Mode = getInstrDenormalMode(Inst, Ty);
1539 ConstantFP *Folded =
1540 flushDenormalConstant(Ty, Elt, IsOutput ? Mode.Output : Mode.Input);
1541 if (!Folded)
1542 return nullptr;
1543 NewElts.push_back(Folded);
1544 }
1545 }
1546
1547 return ConstantVector::get(NewElts);
1548 }
1549
1550 return nullptr;
1551}
1552
1554 Constant *RHS, const DataLayout &DL,
1555 const Instruction *I,
1556 bool AllowNonDeterministic) {
1557 if (Instruction::isBinaryOp(Opcode)) {
1558 // Flush denormal inputs if needed.
1559 Constant *Op0 = FlushFPConstant(LHS, I, /* IsOutput */ false);
1560 if (!Op0)
1561 return nullptr;
1562 Constant *Op1 = FlushFPConstant(RHS, I, /* IsOutput */ false);
1563 if (!Op1)
1564 return nullptr;
1565
1566 // If nsz or an algebraic FMF flag is set, the result of the FP operation
1567 // may change due to future optimization. Don't constant fold them if
1568 // non-deterministic results are not allowed.
1569 if (!AllowNonDeterministic)
1571 if (FP->hasNoSignedZeros() || FP->hasAllowReassoc() ||
1572 FP->hasAllowContract() || FP->hasAllowReciprocal())
1573 return nullptr;
1574
1575 // Calculate constant result.
1576 Constant *C = ConstantFoldBinaryOpOperands(Opcode, Op0, Op1, DL);
1577 if (!C)
1578 return nullptr;
1579
1580 // Flush denormal output if needed.
1581 C = FlushFPConstant(C, I, /* IsOutput */ true);
1582 if (!C)
1583 return nullptr;
1584
1585 // The precise NaN value is non-deterministic.
1586 if (!AllowNonDeterministic && C->isNaN())
1587 return nullptr;
1588
1589 return C;
1590 }
1591 // If instruction lacks a parent/function and the denormal mode cannot be
1592 // determined, use the default (IEEE).
1593 return ConstantFoldBinaryOpOperands(Opcode, LHS, RHS, DL);
1594}
1595
1597 Type *DestTy, const DataLayout &DL) {
1598 assert(Instruction::isCast(Opcode));
1599
1600 if (auto *CE = dyn_cast<ConstantExpr>(C))
1601 if (CE->isCast())
1602 if (unsigned NewOp = CastInst::isEliminableCastPair(
1603 Instruction::CastOps(CE->getOpcode()),
1604 Instruction::CastOps(Opcode), CE->getOperand(0)->getType(),
1605 C->getType(), DestTy, &DL))
1606 return ConstantFoldCastOperand(NewOp, CE->getOperand(0), DestTy, DL);
1607
1608 switch (Opcode) {
1609 default:
1610 llvm_unreachable("Missing case");
1611 case Instruction::PtrToAddr:
1612 case Instruction::PtrToInt:
1613 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1614 Constant *FoldedValue = nullptr;
1615 // If the input is an inttoptr, eliminate the pair. This requires knowing
1616 // the width of a pointer, so it can't be done in ConstantExpr::getCast.
1617 if (CE->getOpcode() == Instruction::IntToPtr) {
1618 // zext/trunc the inttoptr to pointer/address size.
1619 Type *MidTy = Opcode == Instruction::PtrToInt
1620 ? DL.getAddressType(CE->getType())
1621 : DL.getIntPtrType(CE->getType());
1622 FoldedValue = ConstantFoldIntegerCast(CE->getOperand(0), MidTy,
1623 /*IsSigned=*/false, DL);
1624 } else if (auto *GEP = dyn_cast<GEPOperator>(CE)) {
1625 // If we have GEP, we can perform the following folds:
1626 // (ptrtoint/ptrtoaddr (gep null, x)) -> x
1627 // (ptrtoint/ptrtoaddr (gep (gep null, x), y) -> x + y, etc.
1628 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
1629 APInt BaseOffset(BitWidth, 0);
1630 auto *Base = cast<Constant>(GEP->stripAndAccumulateConstantOffsets(
1631 DL, BaseOffset, /*AllowNonInbounds=*/true));
1632 if (Base->isNullValue()) {
1633 FoldedValue = ConstantInt::get(CE->getContext(), BaseOffset);
1634 } else {
1635 // ptrtoint/ptrtoaddr (gep i8, Ptr, (sub 0, V))
1636 // -> sub (ptrtoint/ptrtoaddr Ptr), V
1637 if (GEP->getNumIndices() == 1 &&
1638 GEP->getSourceElementType()->isIntegerTy(8)) {
1639 auto *Ptr = cast<Constant>(GEP->getPointerOperand());
1640 auto *Sub = dyn_cast<ConstantExpr>(GEP->getOperand(1));
1641 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1642 if (Sub && Sub->getType() == IntIdxTy &&
1643 Sub->getOpcode() == Instruction::Sub &&
1644 Sub->getOperand(0)->isNullValue())
1645 FoldedValue = ConstantExpr::getSub(
1646 ConstantExpr::getCast(Opcode, Ptr, IntIdxTy),
1647 Sub->getOperand(1));
1648 }
1649 }
1650 }
1651 if (FoldedValue) {
1652 // Do a zext or trunc to get to the ptrtoint/ptrtoaddr dest size.
1653 return ConstantFoldIntegerCast(FoldedValue, DestTy, /*IsSigned=*/false,
1654 DL);
1655 }
1656 }
1657 break;
1658 case Instruction::IntToPtr:
1659 // If the input is a ptrtoint, turn the pair into a ptr to ptr bitcast if
1660 // the int size is >= the ptr size and the address spaces are the same.
1661 // This requires knowing the width of a pointer, so it can't be done in
1662 // ConstantExpr::getCast.
1663 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1664 if (CE->getOpcode() == Instruction::PtrToInt) {
1665 Constant *SrcPtr = CE->getOperand(0);
1666 unsigned SrcPtrSize = DL.getPointerTypeSizeInBits(SrcPtr->getType());
1667 unsigned MidIntSize = CE->getType()->getScalarSizeInBits();
1668
1669 if (MidIntSize >= SrcPtrSize) {
1670 unsigned SrcAS = SrcPtr->getType()->getPointerAddressSpace();
1671 if (SrcAS == DestTy->getPointerAddressSpace())
1672 return FoldBitCast(CE->getOperand(0), DestTy, DL);
1673 }
1674 }
1675 }
1676 break;
1677 case Instruction::Trunc:
1678 case Instruction::ZExt:
1679 case Instruction::SExt:
1680 case Instruction::FPTrunc:
1681 case Instruction::FPExt:
1682 case Instruction::UIToFP:
1683 case Instruction::SIToFP:
1684 case Instruction::FPToUI:
1685 case Instruction::FPToSI:
1686 case Instruction::AddrSpaceCast:
1687 break;
1688 case Instruction::BitCast:
1689 return FoldBitCast(C, DestTy, DL);
1690 }
1691
1693 return ConstantExpr::getCast(Opcode, C, DestTy);
1694 return ConstantFoldCastInstruction(Opcode, C, DestTy);
1695}
1696
1698 bool IsSigned, const DataLayout &DL) {
1699 Type *SrcTy = C->getType();
1700 if (SrcTy == DestTy)
1701 return C;
1702 if (SrcTy->getScalarSizeInBits() > DestTy->getScalarSizeInBits())
1703 return ConstantFoldCastOperand(Instruction::Trunc, C, DestTy, DL);
1704 if (IsSigned)
1705 return ConstantFoldCastOperand(Instruction::SExt, C, DestTy, DL);
1706 return ConstantFoldCastOperand(Instruction::ZExt, C, DestTy, DL);
1707}
1708
1709//===----------------------------------------------------------------------===//
1710// Constant Folding for Calls
1711//
1712
1714 if (Call->isNoBuiltin())
1715 return false;
1716 if (Call->getFunctionType() != F->getFunctionType())
1717 return false;
1718
1719 // Allow FP calls (both libcalls and intrinsics) to avoid being folded.
1720 // This can be useful for GPU targets or in cross-compilation scenarios
1721 // when the exact target FP behaviour is required, and the host compiler's
1722 // behaviour may be slightly different from the device's run-time behaviour.
1723 if (DisableFPCallFolding && (F->getReturnType()->isFloatingPointTy() ||
1724 any_of(F->args(), [](const Argument &Arg) {
1725 return Arg.getType()->isFloatingPointTy();
1726 })))
1727 return false;
1728
1729 switch (F->getIntrinsicID()) {
1730 // Operations that do not operate floating-point numbers and do not depend on
1731 // FP environment can be folded even in strictfp functions.
1732 case Intrinsic::bswap:
1733 case Intrinsic::ctpop:
1734 case Intrinsic::ctlz:
1735 case Intrinsic::cttz:
1736 case Intrinsic::fshl:
1737 case Intrinsic::fshr:
1738 case Intrinsic::launder_invariant_group:
1739 case Intrinsic::strip_invariant_group:
1740 case Intrinsic::masked_load:
1741 case Intrinsic::get_active_lane_mask:
1742 case Intrinsic::abs:
1743 case Intrinsic::smax:
1744 case Intrinsic::smin:
1745 case Intrinsic::umax:
1746 case Intrinsic::umin:
1747 case Intrinsic::scmp:
1748 case Intrinsic::ucmp:
1749 case Intrinsic::sadd_with_overflow:
1750 case Intrinsic::uadd_with_overflow:
1751 case Intrinsic::ssub_with_overflow:
1752 case Intrinsic::usub_with_overflow:
1753 case Intrinsic::smul_with_overflow:
1754 case Intrinsic::umul_with_overflow:
1755 case Intrinsic::sadd_sat:
1756 case Intrinsic::uadd_sat:
1757 case Intrinsic::ssub_sat:
1758 case Intrinsic::usub_sat:
1759 case Intrinsic::smul_fix:
1760 case Intrinsic::smul_fix_sat:
1761 case Intrinsic::bitreverse:
1762 case Intrinsic::is_constant:
1763 case Intrinsic::vector_reduce_add:
1764 case Intrinsic::vector_reduce_mul:
1765 case Intrinsic::vector_reduce_and:
1766 case Intrinsic::vector_reduce_or:
1767 case Intrinsic::vector_reduce_xor:
1768 case Intrinsic::vector_reduce_smin:
1769 case Intrinsic::vector_reduce_smax:
1770 case Intrinsic::vector_reduce_umin:
1771 case Intrinsic::vector_reduce_umax:
1772 case Intrinsic::vector_extract:
1773 case Intrinsic::vector_insert:
1774 case Intrinsic::vector_interleave2:
1775 case Intrinsic::vector_interleave3:
1776 case Intrinsic::vector_interleave4:
1777 case Intrinsic::vector_interleave5:
1778 case Intrinsic::vector_interleave6:
1779 case Intrinsic::vector_interleave7:
1780 case Intrinsic::vector_interleave8:
1781 case Intrinsic::vector_deinterleave2:
1782 case Intrinsic::vector_deinterleave3:
1783 case Intrinsic::vector_deinterleave4:
1784 case Intrinsic::vector_deinterleave5:
1785 case Intrinsic::vector_deinterleave6:
1786 case Intrinsic::vector_deinterleave7:
1787 case Intrinsic::vector_deinterleave8:
1788 // Target intrinsics
1789 case Intrinsic::amdgcn_perm:
1790 case Intrinsic::amdgcn_wave_reduce_umin:
1791 case Intrinsic::amdgcn_wave_reduce_umax:
1792 case Intrinsic::amdgcn_wave_reduce_max:
1793 case Intrinsic::amdgcn_wave_reduce_min:
1794 case Intrinsic::amdgcn_wave_reduce_and:
1795 case Intrinsic::amdgcn_wave_reduce_or:
1796 case Intrinsic::amdgcn_s_wqm:
1797 case Intrinsic::amdgcn_s_quadmask:
1798 case Intrinsic::amdgcn_s_bitreplicate:
1799 case Intrinsic::arm_mve_vctp8:
1800 case Intrinsic::arm_mve_vctp16:
1801 case Intrinsic::arm_mve_vctp32:
1802 case Intrinsic::arm_mve_vctp64:
1803 case Intrinsic::aarch64_sve_convert_from_svbool:
1804 case Intrinsic::wasm_alltrue:
1805 case Intrinsic::wasm_anytrue:
1806 case Intrinsic::wasm_dot:
1807 // WebAssembly float semantics are always known
1808 case Intrinsic::wasm_trunc_signed:
1809 case Intrinsic::wasm_trunc_unsigned:
1810 return true;
1811
1812 // Floating point operations cannot be folded in strictfp functions in
1813 // general case. They can be folded if FP environment is known to compiler.
1814 case Intrinsic::minnum:
1815 case Intrinsic::maxnum:
1816 case Intrinsic::minimum:
1817 case Intrinsic::maximum:
1818 case Intrinsic::minimumnum:
1819 case Intrinsic::maximumnum:
1820 case Intrinsic::log:
1821 case Intrinsic::log2:
1822 case Intrinsic::log10:
1823 case Intrinsic::exp:
1824 case Intrinsic::exp2:
1825 case Intrinsic::exp10:
1826 case Intrinsic::sqrt:
1827 case Intrinsic::sin:
1828 case Intrinsic::cos:
1829 case Intrinsic::sincos:
1830 case Intrinsic::sinh:
1831 case Intrinsic::cosh:
1832 case Intrinsic::atan:
1833 case Intrinsic::pow:
1834 case Intrinsic::powi:
1835 case Intrinsic::ldexp:
1836 case Intrinsic::fma:
1837 case Intrinsic::fmuladd:
1838 case Intrinsic::frexp:
1839 case Intrinsic::fptoui_sat:
1840 case Intrinsic::fptosi_sat:
1841 case Intrinsic::amdgcn_cos:
1842 case Intrinsic::amdgcn_cubeid:
1843 case Intrinsic::amdgcn_cubema:
1844 case Intrinsic::amdgcn_cubesc:
1845 case Intrinsic::amdgcn_cubetc:
1846 case Intrinsic::amdgcn_fmul_legacy:
1847 case Intrinsic::amdgcn_fma_legacy:
1848 case Intrinsic::amdgcn_fract:
1849 case Intrinsic::amdgcn_sin:
1850 // The intrinsics below depend on rounding mode in MXCSR.
1851 case Intrinsic::x86_sse_cvtss2si:
1852 case Intrinsic::x86_sse_cvtss2si64:
1853 case Intrinsic::x86_sse_cvttss2si:
1854 case Intrinsic::x86_sse_cvttss2si64:
1855 case Intrinsic::x86_sse2_cvtsd2si:
1856 case Intrinsic::x86_sse2_cvtsd2si64:
1857 case Intrinsic::x86_sse2_cvttsd2si:
1858 case Intrinsic::x86_sse2_cvttsd2si64:
1859 case Intrinsic::x86_avx512_vcvtss2si32:
1860 case Intrinsic::x86_avx512_vcvtss2si64:
1861 case Intrinsic::x86_avx512_cvttss2si:
1862 case Intrinsic::x86_avx512_cvttss2si64:
1863 case Intrinsic::x86_avx512_vcvtsd2si32:
1864 case Intrinsic::x86_avx512_vcvtsd2si64:
1865 case Intrinsic::x86_avx512_cvttsd2si:
1866 case Intrinsic::x86_avx512_cvttsd2si64:
1867 case Intrinsic::x86_avx512_vcvtss2usi32:
1868 case Intrinsic::x86_avx512_vcvtss2usi64:
1869 case Intrinsic::x86_avx512_cvttss2usi:
1870 case Intrinsic::x86_avx512_cvttss2usi64:
1871 case Intrinsic::x86_avx512_vcvtsd2usi32:
1872 case Intrinsic::x86_avx512_vcvtsd2usi64:
1873 case Intrinsic::x86_avx512_cvttsd2usi:
1874 case Intrinsic::x86_avx512_cvttsd2usi64:
1875
1876 // NVVM FMax intrinsics
1877 case Intrinsic::nvvm_fmax_d:
1878 case Intrinsic::nvvm_fmax_f:
1879 case Intrinsic::nvvm_fmax_ftz_f:
1880 case Intrinsic::nvvm_fmax_ftz_nan_f:
1881 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
1882 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
1883 case Intrinsic::nvvm_fmax_nan_f:
1884 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
1885 case Intrinsic::nvvm_fmax_xorsign_abs_f:
1886
1887 // NVVM FMin intrinsics
1888 case Intrinsic::nvvm_fmin_d:
1889 case Intrinsic::nvvm_fmin_f:
1890 case Intrinsic::nvvm_fmin_ftz_f:
1891 case Intrinsic::nvvm_fmin_ftz_nan_f:
1892 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
1893 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
1894 case Intrinsic::nvvm_fmin_nan_f:
1895 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
1896 case Intrinsic::nvvm_fmin_xorsign_abs_f:
1897
1898 // NVVM float/double to int32/uint32 conversion intrinsics
1899 case Intrinsic::nvvm_f2i_rm:
1900 case Intrinsic::nvvm_f2i_rn:
1901 case Intrinsic::nvvm_f2i_rp:
1902 case Intrinsic::nvvm_f2i_rz:
1903 case Intrinsic::nvvm_f2i_rm_ftz:
1904 case Intrinsic::nvvm_f2i_rn_ftz:
1905 case Intrinsic::nvvm_f2i_rp_ftz:
1906 case Intrinsic::nvvm_f2i_rz_ftz:
1907 case Intrinsic::nvvm_f2ui_rm:
1908 case Intrinsic::nvvm_f2ui_rn:
1909 case Intrinsic::nvvm_f2ui_rp:
1910 case Intrinsic::nvvm_f2ui_rz:
1911 case Intrinsic::nvvm_f2ui_rm_ftz:
1912 case Intrinsic::nvvm_f2ui_rn_ftz:
1913 case Intrinsic::nvvm_f2ui_rp_ftz:
1914 case Intrinsic::nvvm_f2ui_rz_ftz:
1915 case Intrinsic::nvvm_d2i_rm:
1916 case Intrinsic::nvvm_d2i_rn:
1917 case Intrinsic::nvvm_d2i_rp:
1918 case Intrinsic::nvvm_d2i_rz:
1919 case Intrinsic::nvvm_d2ui_rm:
1920 case Intrinsic::nvvm_d2ui_rn:
1921 case Intrinsic::nvvm_d2ui_rp:
1922 case Intrinsic::nvvm_d2ui_rz:
1923
1924 // NVVM float/double to int64/uint64 conversion intrinsics
1925 case Intrinsic::nvvm_f2ll_rm:
1926 case Intrinsic::nvvm_f2ll_rn:
1927 case Intrinsic::nvvm_f2ll_rp:
1928 case Intrinsic::nvvm_f2ll_rz:
1929 case Intrinsic::nvvm_f2ll_rm_ftz:
1930 case Intrinsic::nvvm_f2ll_rn_ftz:
1931 case Intrinsic::nvvm_f2ll_rp_ftz:
1932 case Intrinsic::nvvm_f2ll_rz_ftz:
1933 case Intrinsic::nvvm_f2ull_rm:
1934 case Intrinsic::nvvm_f2ull_rn:
1935 case Intrinsic::nvvm_f2ull_rp:
1936 case Intrinsic::nvvm_f2ull_rz:
1937 case Intrinsic::nvvm_f2ull_rm_ftz:
1938 case Intrinsic::nvvm_f2ull_rn_ftz:
1939 case Intrinsic::nvvm_f2ull_rp_ftz:
1940 case Intrinsic::nvvm_f2ull_rz_ftz:
1941 case Intrinsic::nvvm_d2ll_rm:
1942 case Intrinsic::nvvm_d2ll_rn:
1943 case Intrinsic::nvvm_d2ll_rp:
1944 case Intrinsic::nvvm_d2ll_rz:
1945 case Intrinsic::nvvm_d2ull_rm:
1946 case Intrinsic::nvvm_d2ull_rn:
1947 case Intrinsic::nvvm_d2ull_rp:
1948 case Intrinsic::nvvm_d2ull_rz:
1949
1950 // NVVM math intrinsics:
1951 case Intrinsic::nvvm_ceil_d:
1952 case Intrinsic::nvvm_ceil_f:
1953 case Intrinsic::nvvm_ceil_ftz_f:
1954
1955 case Intrinsic::nvvm_fabs:
1956 case Intrinsic::nvvm_fabs_ftz:
1957
1958 case Intrinsic::nvvm_floor_d:
1959 case Intrinsic::nvvm_floor_f:
1960 case Intrinsic::nvvm_floor_ftz_f:
1961
1962 case Intrinsic::nvvm_rcp_rm_d:
1963 case Intrinsic::nvvm_rcp_rm_f:
1964 case Intrinsic::nvvm_rcp_rm_ftz_f:
1965 case Intrinsic::nvvm_rcp_rn_d:
1966 case Intrinsic::nvvm_rcp_rn_f:
1967 case Intrinsic::nvvm_rcp_rn_ftz_f:
1968 case Intrinsic::nvvm_rcp_rp_d:
1969 case Intrinsic::nvvm_rcp_rp_f:
1970 case Intrinsic::nvvm_rcp_rp_ftz_f:
1971 case Intrinsic::nvvm_rcp_rz_d:
1972 case Intrinsic::nvvm_rcp_rz_f:
1973 case Intrinsic::nvvm_rcp_rz_ftz_f:
1974
1975 case Intrinsic::nvvm_round_d:
1976 case Intrinsic::nvvm_round_f:
1977 case Intrinsic::nvvm_round_ftz_f:
1978
1979 case Intrinsic::nvvm_saturate_d:
1980 case Intrinsic::nvvm_saturate_f:
1981 case Intrinsic::nvvm_saturate_ftz_f:
1982
1983 case Intrinsic::nvvm_sqrt_f:
1984 case Intrinsic::nvvm_sqrt_rn_d:
1985 case Intrinsic::nvvm_sqrt_rn_f:
1986 case Intrinsic::nvvm_sqrt_rn_ftz_f:
1987 return !Call->isStrictFP();
1988
1989 // NVVM add intrinsics with explicit rounding modes
1990 case Intrinsic::nvvm_add_rm_d:
1991 case Intrinsic::nvvm_add_rn_d:
1992 case Intrinsic::nvvm_add_rp_d:
1993 case Intrinsic::nvvm_add_rz_d:
1994 case Intrinsic::nvvm_add_rm_f:
1995 case Intrinsic::nvvm_add_rn_f:
1996 case Intrinsic::nvvm_add_rp_f:
1997 case Intrinsic::nvvm_add_rz_f:
1998 case Intrinsic::nvvm_add_rm_ftz_f:
1999 case Intrinsic::nvvm_add_rn_ftz_f:
2000 case Intrinsic::nvvm_add_rp_ftz_f:
2001 case Intrinsic::nvvm_add_rz_ftz_f:
2002
2003 // NVVM div intrinsics with explicit rounding modes
2004 case Intrinsic::nvvm_div_rm_d:
2005 case Intrinsic::nvvm_div_rn_d:
2006 case Intrinsic::nvvm_div_rp_d:
2007 case Intrinsic::nvvm_div_rz_d:
2008 case Intrinsic::nvvm_div_rm_f:
2009 case Intrinsic::nvvm_div_rn_f:
2010 case Intrinsic::nvvm_div_rp_f:
2011 case Intrinsic::nvvm_div_rz_f:
2012 case Intrinsic::nvvm_div_rm_ftz_f:
2013 case Intrinsic::nvvm_div_rn_ftz_f:
2014 case Intrinsic::nvvm_div_rp_ftz_f:
2015 case Intrinsic::nvvm_div_rz_ftz_f:
2016
2017 // NVVM mul intrinsics with explicit rounding modes
2018 case Intrinsic::nvvm_mul_rm_d:
2019 case Intrinsic::nvvm_mul_rn_d:
2020 case Intrinsic::nvvm_mul_rp_d:
2021 case Intrinsic::nvvm_mul_rz_d:
2022 case Intrinsic::nvvm_mul_rm_f:
2023 case Intrinsic::nvvm_mul_rn_f:
2024 case Intrinsic::nvvm_mul_rp_f:
2025 case Intrinsic::nvvm_mul_rz_f:
2026 case Intrinsic::nvvm_mul_rm_ftz_f:
2027 case Intrinsic::nvvm_mul_rn_ftz_f:
2028 case Intrinsic::nvvm_mul_rp_ftz_f:
2029 case Intrinsic::nvvm_mul_rz_ftz_f:
2030
2031 // NVVM fma intrinsics with explicit rounding modes
2032 case Intrinsic::nvvm_fma_rm_d:
2033 case Intrinsic::nvvm_fma_rn_d:
2034 case Intrinsic::nvvm_fma_rp_d:
2035 case Intrinsic::nvvm_fma_rz_d:
2036 case Intrinsic::nvvm_fma_rm_f:
2037 case Intrinsic::nvvm_fma_rn_f:
2038 case Intrinsic::nvvm_fma_rp_f:
2039 case Intrinsic::nvvm_fma_rz_f:
2040 case Intrinsic::nvvm_fma_rm_ftz_f:
2041 case Intrinsic::nvvm_fma_rn_ftz_f:
2042 case Intrinsic::nvvm_fma_rp_ftz_f:
2043 case Intrinsic::nvvm_fma_rz_ftz_f:
2044
2045 // Sign operations are actually bitwise operations, they do not raise
2046 // exceptions even for SNANs.
2047 case Intrinsic::fabs:
2048 case Intrinsic::copysign:
2049 case Intrinsic::is_fpclass:
2050 // Non-constrained variants of rounding operations means default FP
2051 // environment, they can be folded in any case.
2052 case Intrinsic::ceil:
2053 case Intrinsic::floor:
2054 case Intrinsic::round:
2055 case Intrinsic::roundeven:
2056 case Intrinsic::trunc:
2057 case Intrinsic::nearbyint:
2058 case Intrinsic::rint:
2059 case Intrinsic::canonicalize:
2060
2061 // Constrained intrinsics can be folded if FP environment is known
2062 // to compiler.
2063 case Intrinsic::experimental_constrained_fma:
2064 case Intrinsic::experimental_constrained_fmuladd:
2065 case Intrinsic::experimental_constrained_fadd:
2066 case Intrinsic::experimental_constrained_fsub:
2067 case Intrinsic::experimental_constrained_fmul:
2068 case Intrinsic::experimental_constrained_fdiv:
2069 case Intrinsic::experimental_constrained_frem:
2070 case Intrinsic::experimental_constrained_ceil:
2071 case Intrinsic::experimental_constrained_floor:
2072 case Intrinsic::experimental_constrained_round:
2073 case Intrinsic::experimental_constrained_roundeven:
2074 case Intrinsic::experimental_constrained_trunc:
2075 case Intrinsic::experimental_constrained_nearbyint:
2076 case Intrinsic::experimental_constrained_rint:
2077 case Intrinsic::experimental_constrained_fcmp:
2078 case Intrinsic::experimental_constrained_fcmps:
2079
2080 case Intrinsic::experimental_cttz_elts:
2081 return true;
2082 default:
2083 return false;
2084 case Intrinsic::not_intrinsic: break;
2085 }
2086
2087 if (!F->hasName() || Call->isStrictFP())
2088 return false;
2089
2090 // In these cases, the check of the length is required. We don't want to
2091 // return true for a name like "cos\0blah" which strcmp would return equal to
2092 // "cos", but has length 8.
2093 StringRef Name = F->getName();
2094 switch (Name[0]) {
2095 default:
2096 return false;
2097 // clang-format off
2098 case 'a':
2099 return Name == "acos" || Name == "acosf" ||
2100 Name == "asin" || Name == "asinf" ||
2101 Name == "atan" || Name == "atanf" ||
2102 Name == "atan2" || Name == "atan2f";
2103 case 'c':
2104 return Name == "ceil" || Name == "ceilf" ||
2105 Name == "cos" || Name == "cosf" ||
2106 Name == "cosh" || Name == "coshf";
2107 case 'e':
2108 return Name == "exp" || Name == "expf" || Name == "exp2" ||
2109 Name == "exp2f" || Name == "erf" || Name == "erff";
2110 case 'f':
2111 return Name == "fabs" || Name == "fabsf" ||
2112 Name == "floor" || Name == "floorf" ||
2113 Name == "fmod" || Name == "fmodf";
2114 case 'i':
2115 return Name == "ilogb" || Name == "ilogbf";
2116 case 'l':
2117 return Name == "log" || Name == "logf" || Name == "logl" ||
2118 Name == "log2" || Name == "log2f" || Name == "log10" ||
2119 Name == "log10f" || Name == "logb" || Name == "logbf" ||
2120 Name == "log1p" || Name == "log1pf";
2121 case 'n':
2122 return Name == "nearbyint" || Name == "nearbyintf";
2123 case 'p':
2124 return Name == "pow" || Name == "powf";
2125 case 'r':
2126 return Name == "remainder" || Name == "remainderf" ||
2127 Name == "rint" || Name == "rintf" ||
2128 Name == "round" || Name == "roundf" ||
2129 Name == "roundeven" || Name == "roundevenf";
2130 case 's':
2131 return Name == "sin" || Name == "sinf" ||
2132 Name == "sinh" || Name == "sinhf" ||
2133 Name == "sqrt" || Name == "sqrtf";
2134 case 't':
2135 return Name == "tan" || Name == "tanf" ||
2136 Name == "tanh" || Name == "tanhf" ||
2137 Name == "trunc" || Name == "truncf";
2138 case '_':
2139 // Check for various function names that get used for the math functions
2140 // when the header files are preprocessed with the macro
2141 // __FINITE_MATH_ONLY__ enabled.
2142 // The '12' here is the length of the shortest name that can match.
2143 // We need to check the size before looking at Name[1] and Name[2]
2144 // so we may as well check a limit that will eliminate mismatches.
2145 if (Name.size() < 12 || Name[1] != '_')
2146 return false;
2147 switch (Name[2]) {
2148 default:
2149 return false;
2150 case 'a':
2151 return Name == "__acos_finite" || Name == "__acosf_finite" ||
2152 Name == "__asin_finite" || Name == "__asinf_finite" ||
2153 Name == "__atan2_finite" || Name == "__atan2f_finite";
2154 case 'c':
2155 return Name == "__cosh_finite" || Name == "__coshf_finite";
2156 case 'e':
2157 return Name == "__exp_finite" || Name == "__expf_finite" ||
2158 Name == "__exp2_finite" || Name == "__exp2f_finite";
2159 case 'l':
2160 return Name == "__log_finite" || Name == "__logf_finite" ||
2161 Name == "__log10_finite" || Name == "__log10f_finite";
2162 case 'p':
2163 return Name == "__pow_finite" || Name == "__powf_finite";
2164 case 's':
2165 return Name == "__sinh_finite" || Name == "__sinhf_finite";
2166 }
2167 // clang-format on
2168 }
2169}
2170
2171namespace {
2172
2173Constant *GetConstantFoldFPValue(double V, Type *Ty) {
2174 if (Ty->isHalfTy() || Ty->isFloatTy()) {
2175 APFloat APF(V);
2176 bool unused;
2177 APF.convert(Ty->getFltSemantics(), APFloat::rmNearestTiesToEven, &unused);
2178 return ConstantFP::get(Ty->getContext(), APF);
2179 }
2180 if (Ty->isDoubleTy())
2181 return ConstantFP::get(Ty->getContext(), APFloat(V));
2182 llvm_unreachable("Can only constant fold half/float/double");
2183}
2184
2185#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2186Constant *GetConstantFoldFPValue128(float128 V, Type *Ty) {
2187 if (Ty->isFP128Ty())
2188 return ConstantFP::get(Ty, V);
2189 llvm_unreachable("Can only constant fold fp128");
2190}
2191#endif
2192
2193/// Clear the floating-point exception state.
2194inline void llvm_fenv_clearexcept() {
2195#if HAVE_DECL_FE_ALL_EXCEPT
2196 feclearexcept(FE_ALL_EXCEPT);
2197#endif
2198 errno = 0;
2199}
2200
2201/// Test if a floating-point exception was raised.
2202inline bool llvm_fenv_testexcept() {
2203 int errno_val = errno;
2204 if (errno_val == ERANGE || errno_val == EDOM)
2205 return true;
2206#if HAVE_DECL_FE_ALL_EXCEPT && HAVE_DECL_FE_INEXACT
2207 if (fetestexcept(FE_ALL_EXCEPT & ~FE_INEXACT))
2208 return true;
2209#endif
2210 return false;
2211}
2212
2213static APFloat FTZPreserveSign(const APFloat &V) {
2214 if (V.isDenormal())
2215 return APFloat::getZero(V.getSemantics(), V.isNegative());
2216 return V;
2217}
2218
2219static APFloat FlushToPositiveZero(const APFloat &V) {
2220 if (V.isDenormal())
2221 return APFloat::getZero(V.getSemantics(), false);
2222 return V;
2223}
2224
2225static APFloat FlushWithDenormKind(const APFloat &V,
2226 DenormalMode::DenormalModeKind DenormKind) {
2229 switch (DenormKind) {
2231 return V;
2233 return FTZPreserveSign(V);
2235 return FlushToPositiveZero(V);
2236 default:
2237 llvm_unreachable("Invalid denormal mode!");
2238 }
2239}
2240
2241Constant *ConstantFoldFP(double (*NativeFP)(double), const APFloat &V, Type *Ty,
2242 DenormalMode DenormMode = DenormalMode::getIEEE()) {
2243 if (!DenormMode.isValid() ||
2244 DenormMode.Input == DenormalMode::DenormalModeKind::Dynamic ||
2245 DenormMode.Output == DenormalMode::DenormalModeKind::Dynamic)
2246 return nullptr;
2247
2248 llvm_fenv_clearexcept();
2249 auto Input = FlushWithDenormKind(V, DenormMode.Input);
2250 double Result = NativeFP(Input.convertToDouble());
2251 if (llvm_fenv_testexcept()) {
2252 llvm_fenv_clearexcept();
2253 return nullptr;
2254 }
2255
2256 Constant *Output = GetConstantFoldFPValue(Result, Ty);
2257 if (DenormMode.Output == DenormalMode::DenormalModeKind::IEEE)
2258 return Output;
2259 const auto *CFP = static_cast<ConstantFP *>(Output);
2260 const auto Res = FlushWithDenormKind(CFP->getValueAPF(), DenormMode.Output);
2261 return ConstantFP::get(Ty->getContext(), Res);
2262}
2263
2264#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2265Constant *ConstantFoldFP128(float128 (*NativeFP)(float128), const APFloat &V,
2266 Type *Ty) {
2267 llvm_fenv_clearexcept();
2268 float128 Result = NativeFP(V.convertToQuad());
2269 if (llvm_fenv_testexcept()) {
2270 llvm_fenv_clearexcept();
2271 return nullptr;
2272 }
2273
2274 return GetConstantFoldFPValue128(Result, Ty);
2275}
2276#endif
2277
2278Constant *ConstantFoldBinaryFP(double (*NativeFP)(double, double),
2279 const APFloat &V, const APFloat &W, Type *Ty) {
2280 llvm_fenv_clearexcept();
2281 double Result = NativeFP(V.convertToDouble(), W.convertToDouble());
2282 if (llvm_fenv_testexcept()) {
2283 llvm_fenv_clearexcept();
2284 return nullptr;
2285 }
2286
2287 return GetConstantFoldFPValue(Result, Ty);
2288}
2289
2290Constant *constantFoldVectorReduce(Intrinsic::ID IID, Constant *Op) {
2291 auto *OpVT = cast<VectorType>(Op->getType());
2292
2293 // This is the same as the underlying binops - poison propagates.
2294 if (Op->containsPoisonElement())
2295 return PoisonValue::get(OpVT->getElementType());
2296
2297 // Shortcut non-accumulating reductions.
2298 if (Constant *SplatVal = Op->getSplatValue()) {
2299 switch (IID) {
2300 case Intrinsic::vector_reduce_and:
2301 case Intrinsic::vector_reduce_or:
2302 case Intrinsic::vector_reduce_smin:
2303 case Intrinsic::vector_reduce_smax:
2304 case Intrinsic::vector_reduce_umin:
2305 case Intrinsic::vector_reduce_umax:
2306 return SplatVal;
2307 case Intrinsic::vector_reduce_add:
2308 if (SplatVal->isNullValue())
2309 return SplatVal;
2310 break;
2311 case Intrinsic::vector_reduce_mul:
2312 if (SplatVal->isNullValue() || SplatVal->isOneValue())
2313 return SplatVal;
2314 break;
2315 case Intrinsic::vector_reduce_xor:
2316 if (SplatVal->isNullValue())
2317 return SplatVal;
2318 if (OpVT->getElementCount().isKnownMultipleOf(2))
2319 return Constant::getNullValue(OpVT->getElementType());
2320 break;
2321 }
2322 }
2323
2325 if (!VT)
2326 return nullptr;
2327
2328 // TODO: Handle undef.
2329 auto *EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(0U));
2330 if (!EltC)
2331 return nullptr;
2332
2333 APInt Acc = EltC->getValue();
2334 for (unsigned I = 1, E = VT->getNumElements(); I != E; I++) {
2335 if (!(EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(I))))
2336 return nullptr;
2337 const APInt &X = EltC->getValue();
2338 switch (IID) {
2339 case Intrinsic::vector_reduce_add:
2340 Acc = Acc + X;
2341 break;
2342 case Intrinsic::vector_reduce_mul:
2343 Acc = Acc * X;
2344 break;
2345 case Intrinsic::vector_reduce_and:
2346 Acc = Acc & X;
2347 break;
2348 case Intrinsic::vector_reduce_or:
2349 Acc = Acc | X;
2350 break;
2351 case Intrinsic::vector_reduce_xor:
2352 Acc = Acc ^ X;
2353 break;
2354 case Intrinsic::vector_reduce_smin:
2355 Acc = APIntOps::smin(Acc, X);
2356 break;
2357 case Intrinsic::vector_reduce_smax:
2358 Acc = APIntOps::smax(Acc, X);
2359 break;
2360 case Intrinsic::vector_reduce_umin:
2361 Acc = APIntOps::umin(Acc, X);
2362 break;
2363 case Intrinsic::vector_reduce_umax:
2364 Acc = APIntOps::umax(Acc, X);
2365 break;
2366 }
2367 }
2368
2369 return ConstantInt::get(Op->getContext(), Acc);
2370}
2371
2372/// Attempt to fold an SSE floating point to integer conversion of a constant
2373/// floating point. If roundTowardZero is false, the default IEEE rounding is
2374/// used (toward nearest, ties to even). This matches the behavior of the
2375/// non-truncating SSE instructions in the default rounding mode. The desired
2376/// integer type Ty is used to select how many bits are available for the
2377/// result. Returns null if the conversion cannot be performed, otherwise
2378/// returns the Constant value resulting from the conversion.
2379Constant *ConstantFoldSSEConvertToInt(const APFloat &Val, bool roundTowardZero,
2380 Type *Ty, bool IsSigned) {
2381 // All of these conversion intrinsics form an integer of at most 64bits.
2382 unsigned ResultWidth = Ty->getIntegerBitWidth();
2383 assert(ResultWidth <= 64 &&
2384 "Can only constant fold conversions to 64 and 32 bit ints");
2385
2386 uint64_t UIntVal;
2387 bool isExact = false;
2391 Val.convertToInteger(MutableArrayRef(UIntVal), ResultWidth,
2392 IsSigned, mode, &isExact);
2393 if (status != APFloat::opOK &&
2394 (!roundTowardZero || status != APFloat::opInexact))
2395 return nullptr;
2396 return ConstantInt::get(Ty, UIntVal, IsSigned);
2397}
2398
2399double getValueAsDouble(ConstantFP *Op) {
2400 Type *Ty = Op->getType();
2401
2402 if (Ty->isBFloatTy() || Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())
2403 return Op->getValueAPF().convertToDouble();
2404
2405 bool unused;
2406 APFloat APF = Op->getValueAPF();
2408 return APF.convertToDouble();
2409}
2410
2411static bool getConstIntOrUndef(Value *Op, const APInt *&C) {
2412 if (auto *CI = dyn_cast<ConstantInt>(Op)) {
2413 C = &CI->getValue();
2414 return true;
2415 }
2416 if (isa<UndefValue>(Op)) {
2417 C = nullptr;
2418 return true;
2419 }
2420 return false;
2421}
2422
2423/// Checks if the given intrinsic call, which evaluates to constant, is allowed
2424/// to be folded.
2425///
2426/// \param CI Constrained intrinsic call.
2427/// \param St Exception flags raised during constant evaluation.
2428static bool mayFoldConstrained(ConstrainedFPIntrinsic *CI,
2429 APFloat::opStatus St) {
2430 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2431 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2432
2433 // If the operation does not change exception status flags, it is safe
2434 // to fold.
2435 if (St == APFloat::opStatus::opOK)
2436 return true;
2437
2438 // If evaluation raised FP exception, the result can depend on rounding
2439 // mode. If the latter is unknown, folding is not possible.
2440 if (ORM == RoundingMode::Dynamic)
2441 return false;
2442
2443 // If FP exceptions are ignored, fold the call, even if such exception is
2444 // raised.
2445 if (EB && *EB != fp::ExceptionBehavior::ebStrict)
2446 return true;
2447
2448 // Leave the calculation for runtime so that exception flags be correctly set
2449 // in hardware.
2450 return false;
2451}
2452
2453/// Returns the rounding mode that should be used for constant evaluation.
2454static RoundingMode
2455getEvaluationRoundingMode(const ConstrainedFPIntrinsic *CI) {
2456 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2457 if (!ORM || *ORM == RoundingMode::Dynamic)
2458 // Even if the rounding mode is unknown, try evaluating the operation.
2459 // If it does not raise inexact exception, rounding was not applied,
2460 // so the result is exact and does not depend on rounding mode. Whether
2461 // other FP exceptions are raised, it does not depend on rounding mode.
2463 return *ORM;
2464}
2465
2466/// Try to constant fold llvm.canonicalize for the given caller and value.
2467static Constant *constantFoldCanonicalize(const Type *Ty, const CallBase *CI,
2468 const APFloat &Src) {
2469 // Zero, positive and negative, is always OK to fold.
2470 if (Src.isZero()) {
2471 // Get a fresh 0, since ppc_fp128 does have non-canonical zeros.
2472 return ConstantFP::get(
2473 CI->getContext(),
2474 APFloat::getZero(Src.getSemantics(), Src.isNegative()));
2475 }
2476
2477 if (!Ty->isIEEELikeFPTy())
2478 return nullptr;
2479
2480 // Zero is always canonical and the sign must be preserved.
2481 //
2482 // Denorms and nans may have special encodings, but it should be OK to fold a
2483 // totally average number.
2484 if (Src.isNormal() || Src.isInfinity())
2485 return ConstantFP::get(CI->getContext(), Src);
2486
2487 if (Src.isDenormal() && CI->getParent() && CI->getFunction()) {
2488 DenormalMode DenormMode =
2489 CI->getFunction()->getDenormalMode(Src.getSemantics());
2490
2491 if (DenormMode == DenormalMode::getIEEE())
2492 return ConstantFP::get(CI->getContext(), Src);
2493
2494 if (DenormMode.Input == DenormalMode::Dynamic)
2495 return nullptr;
2496
2497 // If we know if either input or output is flushed, we can fold.
2498 if ((DenormMode.Input == DenormalMode::Dynamic &&
2499 DenormMode.Output == DenormalMode::IEEE) ||
2500 (DenormMode.Input == DenormalMode::IEEE &&
2501 DenormMode.Output == DenormalMode::Dynamic))
2502 return nullptr;
2503
2504 bool IsPositive =
2505 (!Src.isNegative() || DenormMode.Input == DenormalMode::PositiveZero ||
2506 (DenormMode.Output == DenormalMode::PositiveZero &&
2507 DenormMode.Input == DenormalMode::IEEE));
2508
2509 return ConstantFP::get(CI->getContext(),
2510 APFloat::getZero(Src.getSemantics(), !IsPositive));
2511 }
2512
2513 return nullptr;
2514}
2515
2516static Constant *ConstantFoldScalarCall1(StringRef Name,
2517 Intrinsic::ID IntrinsicID,
2518 Type *Ty,
2519 ArrayRef<Constant *> Operands,
2520 const TargetLibraryInfo *TLI,
2521 const CallBase *Call) {
2522 assert(Operands.size() == 1 && "Wrong number of operands.");
2523
2524 if (IntrinsicID == Intrinsic::is_constant) {
2525 // We know we have a "Constant" argument. But we want to only
2526 // return true for manifest constants, not those that depend on
2527 // constants with unknowable values, e.g. GlobalValue or BlockAddress.
2528 if (Operands[0]->isManifestConstant())
2529 return ConstantInt::getTrue(Ty->getContext());
2530 return nullptr;
2531 }
2532
2533 if (isa<UndefValue>(Operands[0])) {
2534 // cosine(arg) is between -1 and 1. cosine(invalid arg) is NaN.
2535 // ctpop() is between 0 and bitwidth, pick 0 for undef.
2536 // fptoui.sat and fptosi.sat can always fold to zero (for a zero input).
2537 if (IntrinsicID == Intrinsic::cos ||
2538 IntrinsicID == Intrinsic::ctpop ||
2539 IntrinsicID == Intrinsic::fptoui_sat ||
2540 IntrinsicID == Intrinsic::fptosi_sat ||
2541 IntrinsicID == Intrinsic::canonicalize)
2542 return Constant::getNullValue(Ty);
2543 if (IntrinsicID == Intrinsic::bswap ||
2544 IntrinsicID == Intrinsic::bitreverse ||
2545 IntrinsicID == Intrinsic::launder_invariant_group ||
2546 IntrinsicID == Intrinsic::strip_invariant_group)
2547 return Operands[0];
2548 }
2549
2550 if (isa<ConstantPointerNull>(Operands[0])) {
2551 // launder(null) == null == strip(null) iff in addrspace 0
2552 if (IntrinsicID == Intrinsic::launder_invariant_group ||
2553 IntrinsicID == Intrinsic::strip_invariant_group) {
2554 // If instruction is not yet put in a basic block (e.g. when cloning
2555 // a function during inlining), Call's caller may not be available.
2556 // So check Call's BB first before querying Call->getCaller.
2557 const Function *Caller =
2558 Call->getParent() ? Call->getCaller() : nullptr;
2559 if (Caller &&
2561 Caller, Operands[0]->getType()->getPointerAddressSpace())) {
2562 return Operands[0];
2563 }
2564 return nullptr;
2565 }
2566 }
2567
2568 if (auto *Op = dyn_cast<ConstantFP>(Operands[0])) {
2569 APFloat U = Op->getValueAPF();
2570
2571 if (IntrinsicID == Intrinsic::wasm_trunc_signed ||
2572 IntrinsicID == Intrinsic::wasm_trunc_unsigned) {
2573 bool Signed = IntrinsicID == Intrinsic::wasm_trunc_signed;
2574
2575 if (U.isNaN())
2576 return nullptr;
2577
2578 unsigned Width = Ty->getIntegerBitWidth();
2579 APSInt Int(Width, !Signed);
2580 bool IsExact = false;
2582 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2583
2585 return ConstantInt::get(Ty, Int);
2586
2587 return nullptr;
2588 }
2589
2590 if (IntrinsicID == Intrinsic::fptoui_sat ||
2591 IntrinsicID == Intrinsic::fptosi_sat) {
2592 // convertToInteger() already has the desired saturation semantics.
2593 APSInt Int(Ty->getIntegerBitWidth(),
2594 IntrinsicID == Intrinsic::fptoui_sat);
2595 bool IsExact;
2596 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2597 return ConstantInt::get(Ty, Int);
2598 }
2599
2600 if (IntrinsicID == Intrinsic::canonicalize)
2601 return constantFoldCanonicalize(Ty, Call, U);
2602
2603#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2604 if (Ty->isFP128Ty()) {
2605 if (IntrinsicID == Intrinsic::log) {
2606 float128 Result = logf128(Op->getValueAPF().convertToQuad());
2607 return GetConstantFoldFPValue128(Result, Ty);
2608 }
2609
2610 LibFunc Fp128Func = NotLibFunc;
2611 if (TLI && TLI->getLibFunc(Name, Fp128Func) && TLI->has(Fp128Func) &&
2612 Fp128Func == LibFunc_logl)
2613 return ConstantFoldFP128(logf128, Op->getValueAPF(), Ty);
2614 }
2615#endif
2616
2617 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy() &&
2618 !Ty->isIntegerTy())
2619 return nullptr;
2620
2621 // Use internal versions of these intrinsics.
2622
2623 if (IntrinsicID == Intrinsic::nearbyint || IntrinsicID == Intrinsic::rint ||
2624 IntrinsicID == Intrinsic::roundeven) {
2625 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2626 return ConstantFP::get(Ty, U);
2627 }
2628
2629 if (IntrinsicID == Intrinsic::round) {
2630 U.roundToIntegral(APFloat::rmNearestTiesToAway);
2631 return ConstantFP::get(Ty, U);
2632 }
2633
2634 if (IntrinsicID == Intrinsic::roundeven) {
2635 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2636 return ConstantFP::get(Ty, U);
2637 }
2638
2639 if (IntrinsicID == Intrinsic::ceil) {
2640 U.roundToIntegral(APFloat::rmTowardPositive);
2641 return ConstantFP::get(Ty, U);
2642 }
2643
2644 if (IntrinsicID == Intrinsic::floor) {
2645 U.roundToIntegral(APFloat::rmTowardNegative);
2646 return ConstantFP::get(Ty, U);
2647 }
2648
2649 if (IntrinsicID == Intrinsic::trunc) {
2650 U.roundToIntegral(APFloat::rmTowardZero);
2651 return ConstantFP::get(Ty, U);
2652 }
2653
2654 if (IntrinsicID == Intrinsic::fabs) {
2655 U.clearSign();
2656 return ConstantFP::get(Ty, U);
2657 }
2658
2659 if (IntrinsicID == Intrinsic::amdgcn_fract) {
2660 // The v_fract instruction behaves like the OpenCL spec, which defines
2661 // fract(x) as fmin(x - floor(x), 0x1.fffffep-1f): "The min() operator is
2662 // there to prevent fract(-small) from returning 1.0. It returns the
2663 // largest positive floating-point number less than 1.0."
2664 APFloat FloorU(U);
2665 FloorU.roundToIntegral(APFloat::rmTowardNegative);
2666 APFloat FractU(U - FloorU);
2667 APFloat AlmostOne(U.getSemantics(), 1);
2668 AlmostOne.next(/*nextDown*/ true);
2669 return ConstantFP::get(Ty, minimum(FractU, AlmostOne));
2670 }
2671
2672 // Rounding operations (floor, trunc, ceil, round and nearbyint) do not
2673 // raise FP exceptions, unless the argument is signaling NaN.
2674
2675 std::optional<APFloat::roundingMode> RM;
2676 switch (IntrinsicID) {
2677 default:
2678 break;
2679 case Intrinsic::experimental_constrained_nearbyint:
2680 case Intrinsic::experimental_constrained_rint: {
2682 RM = CI->getRoundingMode();
2683 if (!RM || *RM == RoundingMode::Dynamic)
2684 return nullptr;
2685 break;
2686 }
2687 case Intrinsic::experimental_constrained_round:
2689 break;
2690 case Intrinsic::experimental_constrained_ceil:
2692 break;
2693 case Intrinsic::experimental_constrained_floor:
2695 break;
2696 case Intrinsic::experimental_constrained_trunc:
2698 break;
2699 }
2700 if (RM) {
2702 if (U.isFinite()) {
2703 APFloat::opStatus St = U.roundToIntegral(*RM);
2704 if (IntrinsicID == Intrinsic::experimental_constrained_rint &&
2705 St == APFloat::opInexact) {
2706 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2707 if (EB == fp::ebStrict)
2708 return nullptr;
2709 }
2710 } else if (U.isSignaling()) {
2711 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2712 if (EB && *EB != fp::ebIgnore)
2713 return nullptr;
2714 U = APFloat::getQNaN(U.getSemantics());
2715 }
2716 return ConstantFP::get(Ty, U);
2717 }
2718
2719 // NVVM float/double to signed/unsigned int32/int64 conversions:
2720 switch (IntrinsicID) {
2721 // f2i
2722 case Intrinsic::nvvm_f2i_rm:
2723 case Intrinsic::nvvm_f2i_rn:
2724 case Intrinsic::nvvm_f2i_rp:
2725 case Intrinsic::nvvm_f2i_rz:
2726 case Intrinsic::nvvm_f2i_rm_ftz:
2727 case Intrinsic::nvvm_f2i_rn_ftz:
2728 case Intrinsic::nvvm_f2i_rp_ftz:
2729 case Intrinsic::nvvm_f2i_rz_ftz:
2730 // f2ui
2731 case Intrinsic::nvvm_f2ui_rm:
2732 case Intrinsic::nvvm_f2ui_rn:
2733 case Intrinsic::nvvm_f2ui_rp:
2734 case Intrinsic::nvvm_f2ui_rz:
2735 case Intrinsic::nvvm_f2ui_rm_ftz:
2736 case Intrinsic::nvvm_f2ui_rn_ftz:
2737 case Intrinsic::nvvm_f2ui_rp_ftz:
2738 case Intrinsic::nvvm_f2ui_rz_ftz:
2739 // d2i
2740 case Intrinsic::nvvm_d2i_rm:
2741 case Intrinsic::nvvm_d2i_rn:
2742 case Intrinsic::nvvm_d2i_rp:
2743 case Intrinsic::nvvm_d2i_rz:
2744 // d2ui
2745 case Intrinsic::nvvm_d2ui_rm:
2746 case Intrinsic::nvvm_d2ui_rn:
2747 case Intrinsic::nvvm_d2ui_rp:
2748 case Intrinsic::nvvm_d2ui_rz:
2749 // f2ll
2750 case Intrinsic::nvvm_f2ll_rm:
2751 case Intrinsic::nvvm_f2ll_rn:
2752 case Intrinsic::nvvm_f2ll_rp:
2753 case Intrinsic::nvvm_f2ll_rz:
2754 case Intrinsic::nvvm_f2ll_rm_ftz:
2755 case Intrinsic::nvvm_f2ll_rn_ftz:
2756 case Intrinsic::nvvm_f2ll_rp_ftz:
2757 case Intrinsic::nvvm_f2ll_rz_ftz:
2758 // f2ull
2759 case Intrinsic::nvvm_f2ull_rm:
2760 case Intrinsic::nvvm_f2ull_rn:
2761 case Intrinsic::nvvm_f2ull_rp:
2762 case Intrinsic::nvvm_f2ull_rz:
2763 case Intrinsic::nvvm_f2ull_rm_ftz:
2764 case Intrinsic::nvvm_f2ull_rn_ftz:
2765 case Intrinsic::nvvm_f2ull_rp_ftz:
2766 case Intrinsic::nvvm_f2ull_rz_ftz:
2767 // d2ll
2768 case Intrinsic::nvvm_d2ll_rm:
2769 case Intrinsic::nvvm_d2ll_rn:
2770 case Intrinsic::nvvm_d2ll_rp:
2771 case Intrinsic::nvvm_d2ll_rz:
2772 // d2ull
2773 case Intrinsic::nvvm_d2ull_rm:
2774 case Intrinsic::nvvm_d2ull_rn:
2775 case Intrinsic::nvvm_d2ull_rp:
2776 case Intrinsic::nvvm_d2ull_rz: {
2777 // In float-to-integer conversion, NaN inputs are converted to 0.
2778 if (U.isNaN()) {
2779 // In float-to-integer conversion, NaN inputs are converted to 0
2780 // when the source and destination bitwidths are both less than 64.
2781 if (nvvm::FPToIntegerIntrinsicNaNZero(IntrinsicID))
2782 return ConstantInt::get(Ty, 0);
2783
2784 // Otherwise, the most significant bit is set.
2785 unsigned BitWidth = Ty->getIntegerBitWidth();
2786 uint64_t Val = 1ULL << (BitWidth - 1);
2787 return ConstantInt::get(Ty, APInt(BitWidth, Val, /*IsSigned=*/false));
2788 }
2789
2790 APFloat::roundingMode RMode =
2792 bool IsFTZ = nvvm::FPToIntegerIntrinsicShouldFTZ(IntrinsicID);
2793 bool IsSigned = nvvm::FPToIntegerIntrinsicResultIsSigned(IntrinsicID);
2794
2795 APSInt ResInt(Ty->getIntegerBitWidth(), !IsSigned);
2796 auto FloatToRound = IsFTZ ? FTZPreserveSign(U) : U;
2797
2798 // Return max/min value for integers if the result is +/-inf or
2799 // is too large to fit in the result's integer bitwidth.
2800 bool IsExact = false;
2801 FloatToRound.convertToInteger(ResInt, RMode, &IsExact);
2802 return ConstantInt::get(Ty, ResInt);
2803 }
2804 }
2805
2806 /// We only fold functions with finite arguments. Folding NaN and inf is
2807 /// likely to be aborted with an exception anyway, and some host libms
2808 /// have known errors raising exceptions.
2809 if (!U.isFinite())
2810 return nullptr;
2811
2812 /// Currently APFloat versions of these functions do not exist, so we use
2813 /// the host native double versions. Float versions are not called
2814 /// directly but for all these it is true (float)(f((double)arg)) ==
2815 /// f(arg). Long double not supported yet.
2816 const APFloat &APF = Op->getValueAPF();
2817
2818 switch (IntrinsicID) {
2819 default: break;
2820 case Intrinsic::log:
2821 if (U.isZero())
2822 return ConstantFP::getInfinity(Ty, true);
2823 if (U.isNegative())
2824 return ConstantFP::getNaN(Ty);
2825 if (U.isExactlyValue(1.0))
2826 return ConstantFP::getZero(Ty);
2827 return ConstantFoldFP(log, APF, Ty);
2828 case Intrinsic::log2:
2829 if (U.isZero())
2830 return ConstantFP::getInfinity(Ty, true);
2831 if (U.isNegative())
2832 return ConstantFP::getNaN(Ty);
2833 if (U.isExactlyValue(1.0))
2834 return ConstantFP::getZero(Ty);
2835 // TODO: What about hosts that lack a C99 library?
2836 return ConstantFoldFP(log2, APF, Ty);
2837 case Intrinsic::log10:
2838 if (U.isZero())
2839 return ConstantFP::getInfinity(Ty, true);
2840 if (U.isNegative())
2841 return ConstantFP::getNaN(Ty);
2842 if (U.isExactlyValue(1.0))
2843 return ConstantFP::getZero(Ty);
2844 // TODO: What about hosts that lack a C99 library?
2845 return ConstantFoldFP(log10, APF, Ty);
2846 case Intrinsic::exp:
2847 return ConstantFoldFP(exp, APF, Ty);
2848 case Intrinsic::exp2:
2849 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2850 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2851 case Intrinsic::exp10:
2852 // Fold exp10(x) as pow(10, x), in case the host lacks a C99 library.
2853 return ConstantFoldBinaryFP(pow, APFloat(10.0), APF, Ty);
2854 case Intrinsic::sin:
2855 return ConstantFoldFP(sin, APF, Ty);
2856 case Intrinsic::cos:
2857 return ConstantFoldFP(cos, APF, Ty);
2858 case Intrinsic::sinh:
2859 return ConstantFoldFP(sinh, APF, Ty);
2860 case Intrinsic::cosh:
2861 return ConstantFoldFP(cosh, APF, Ty);
2862 case Intrinsic::atan:
2863 // Implement optional behavior from C's Annex F for +/-0.0.
2864 if (U.isZero())
2865 return ConstantFP::get(Ty, U);
2866 return ConstantFoldFP(atan, APF, Ty);
2867 case Intrinsic::sqrt:
2868 return ConstantFoldFP(sqrt, APF, Ty);
2869
2870 // NVVM Intrinsics:
2871 case Intrinsic::nvvm_ceil_ftz_f:
2872 case Intrinsic::nvvm_ceil_f:
2873 case Intrinsic::nvvm_ceil_d:
2874 return ConstantFoldFP(
2875 ceil, APF, Ty,
2877 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2878
2879 case Intrinsic::nvvm_fabs_ftz:
2880 case Intrinsic::nvvm_fabs:
2881 return ConstantFoldFP(
2882 fabs, APF, Ty,
2884 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2885
2886 case Intrinsic::nvvm_floor_ftz_f:
2887 case Intrinsic::nvvm_floor_f:
2888 case Intrinsic::nvvm_floor_d:
2889 return ConstantFoldFP(
2890 floor, APF, Ty,
2892 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2893
2894 case Intrinsic::nvvm_rcp_rm_ftz_f:
2895 case Intrinsic::nvvm_rcp_rn_ftz_f:
2896 case Intrinsic::nvvm_rcp_rp_ftz_f:
2897 case Intrinsic::nvvm_rcp_rz_ftz_f:
2898 case Intrinsic::nvvm_rcp_rm_d:
2899 case Intrinsic::nvvm_rcp_rm_f:
2900 case Intrinsic::nvvm_rcp_rn_d:
2901 case Intrinsic::nvvm_rcp_rn_f:
2902 case Intrinsic::nvvm_rcp_rp_d:
2903 case Intrinsic::nvvm_rcp_rp_f:
2904 case Intrinsic::nvvm_rcp_rz_d:
2905 case Intrinsic::nvvm_rcp_rz_f: {
2906 APFloat::roundingMode RoundMode = nvvm::GetRCPRoundingMode(IntrinsicID);
2907 bool IsFTZ = nvvm::RCPShouldFTZ(IntrinsicID);
2908
2909 auto Denominator = IsFTZ ? FTZPreserveSign(APF) : APF;
2911 APFloat::opStatus Status = Res.divide(Denominator, RoundMode);
2912
2914 if (IsFTZ)
2915 Res = FTZPreserveSign(Res);
2916 return ConstantFP::get(Ty, Res);
2917 }
2918 return nullptr;
2919 }
2920
2921 case Intrinsic::nvvm_round_ftz_f:
2922 case Intrinsic::nvvm_round_f:
2923 case Intrinsic::nvvm_round_d: {
2924 // nvvm_round is lowered to PTX cvt.rni, which will round to nearest
2925 // integer, choosing even integer if source is equidistant between two
2926 // integers, so the semantics are closer to "rint" rather than "round".
2927 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2928 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2930 return ConstantFP::get(Ty, V);
2931 }
2932
2933 case Intrinsic::nvvm_saturate_ftz_f:
2934 case Intrinsic::nvvm_saturate_d:
2935 case Intrinsic::nvvm_saturate_f: {
2936 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2937 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2938 if (V.isNegative() || V.isZero() || V.isNaN())
2939 return ConstantFP::getZero(Ty);
2941 if (V > One)
2942 return ConstantFP::get(Ty, One);
2943 return ConstantFP::get(Ty, APF);
2944 }
2945
2946 case Intrinsic::nvvm_sqrt_rn_ftz_f:
2947 case Intrinsic::nvvm_sqrt_f:
2948 case Intrinsic::nvvm_sqrt_rn_d:
2949 case Intrinsic::nvvm_sqrt_rn_f:
2950 if (APF.isNegative())
2951 return nullptr;
2952 return ConstantFoldFP(
2953 sqrt, APF, Ty,
2955 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2956
2957 // AMDGCN Intrinsics:
2958 case Intrinsic::amdgcn_cos:
2959 case Intrinsic::amdgcn_sin: {
2960 double V = getValueAsDouble(Op);
2961 if (V < -256.0 || V > 256.0)
2962 // The gfx8 and gfx9 architectures handle arguments outside the range
2963 // [-256, 256] differently. This should be a rare case so bail out
2964 // rather than trying to handle the difference.
2965 return nullptr;
2966 bool IsCos = IntrinsicID == Intrinsic::amdgcn_cos;
2967 double V4 = V * 4.0;
2968 if (V4 == floor(V4)) {
2969 // Force exact results for quarter-integer inputs.
2970 const double SinVals[4] = { 0.0, 1.0, 0.0, -1.0 };
2971 V = SinVals[((int)V4 + (IsCos ? 1 : 0)) & 3];
2972 } else {
2973 if (IsCos)
2974 V = cos(V * 2.0 * numbers::pi);
2975 else
2976 V = sin(V * 2.0 * numbers::pi);
2977 }
2978 return GetConstantFoldFPValue(V, Ty);
2979 }
2980 }
2981
2982 if (!TLI)
2983 return nullptr;
2984
2985 LibFunc Func = NotLibFunc;
2986 if (!TLI->getLibFunc(Name, Func))
2987 return nullptr;
2988
2989 switch (Func) {
2990 default:
2991 break;
2992 case LibFunc_acos:
2993 case LibFunc_acosf:
2994 case LibFunc_acos_finite:
2995 case LibFunc_acosf_finite:
2996 if (TLI->has(Func))
2997 return ConstantFoldFP(acos, APF, Ty);
2998 break;
2999 case LibFunc_asin:
3000 case LibFunc_asinf:
3001 case LibFunc_asin_finite:
3002 case LibFunc_asinf_finite:
3003 if (TLI->has(Func))
3004 return ConstantFoldFP(asin, APF, Ty);
3005 break;
3006 case LibFunc_atan:
3007 case LibFunc_atanf:
3008 // Implement optional behavior from C's Annex F for +/-0.0.
3009 if (U.isZero())
3010 return ConstantFP::get(Ty, U);
3011 if (TLI->has(Func))
3012 return ConstantFoldFP(atan, APF, Ty);
3013 break;
3014 case LibFunc_ceil:
3015 case LibFunc_ceilf:
3016 if (TLI->has(Func)) {
3017 U.roundToIntegral(APFloat::rmTowardPositive);
3018 return ConstantFP::get(Ty, U);
3019 }
3020 break;
3021 case LibFunc_cos:
3022 case LibFunc_cosf:
3023 if (TLI->has(Func))
3024 return ConstantFoldFP(cos, APF, Ty);
3025 break;
3026 case LibFunc_cosh:
3027 case LibFunc_coshf:
3028 case LibFunc_cosh_finite:
3029 case LibFunc_coshf_finite:
3030 if (TLI->has(Func))
3031 return ConstantFoldFP(cosh, APF, Ty);
3032 break;
3033 case LibFunc_exp:
3034 case LibFunc_expf:
3035 case LibFunc_exp_finite:
3036 case LibFunc_expf_finite:
3037 if (TLI->has(Func))
3038 return ConstantFoldFP(exp, APF, Ty);
3039 break;
3040 case LibFunc_exp2:
3041 case LibFunc_exp2f:
3042 case LibFunc_exp2_finite:
3043 case LibFunc_exp2f_finite:
3044 if (TLI->has(Func))
3045 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
3046 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
3047 break;
3048 case LibFunc_fabs:
3049 case LibFunc_fabsf:
3050 if (TLI->has(Func)) {
3051 U.clearSign();
3052 return ConstantFP::get(Ty, U);
3053 }
3054 break;
3055 case LibFunc_floor:
3056 case LibFunc_floorf:
3057 if (TLI->has(Func)) {
3058 U.roundToIntegral(APFloat::rmTowardNegative);
3059 return ConstantFP::get(Ty, U);
3060 }
3061 break;
3062 case LibFunc_log:
3063 case LibFunc_logf:
3064 case LibFunc_log_finite:
3065 case LibFunc_logf_finite:
3066 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3067 return ConstantFoldFP(log, APF, Ty);
3068 break;
3069 case LibFunc_log2:
3070 case LibFunc_log2f:
3071 case LibFunc_log2_finite:
3072 case LibFunc_log2f_finite:
3073 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3074 // TODO: What about hosts that lack a C99 library?
3075 return ConstantFoldFP(log2, APF, Ty);
3076 break;
3077 case LibFunc_log10:
3078 case LibFunc_log10f:
3079 case LibFunc_log10_finite:
3080 case LibFunc_log10f_finite:
3081 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3082 // TODO: What about hosts that lack a C99 library?
3083 return ConstantFoldFP(log10, APF, Ty);
3084 break;
3085 case LibFunc_ilogb:
3086 case LibFunc_ilogbf:
3087 if (!APF.isZero() && TLI->has(Func))
3088 return ConstantInt::get(Ty, ilogb(APF), true);
3089 break;
3090 case LibFunc_logb:
3091 case LibFunc_logbf:
3092 if (!APF.isZero() && TLI->has(Func))
3093 return ConstantFoldFP(logb, APF, Ty);
3094 break;
3095 case LibFunc_log1p:
3096 case LibFunc_log1pf:
3097 // Implement optional behavior from C's Annex F for +/-0.0.
3098 if (U.isZero())
3099 return ConstantFP::get(Ty, U);
3100 if (APF > APFloat::getOne(APF.getSemantics(), true) && TLI->has(Func))
3101 return ConstantFoldFP(log1p, APF, Ty);
3102 break;
3103 case LibFunc_logl:
3104 return nullptr;
3105 case LibFunc_erf:
3106 case LibFunc_erff:
3107 if (TLI->has(Func))
3108 return ConstantFoldFP(erf, APF, Ty);
3109 break;
3110 case LibFunc_nearbyint:
3111 case LibFunc_nearbyintf:
3112 case LibFunc_rint:
3113 case LibFunc_rintf:
3114 case LibFunc_roundeven:
3115 case LibFunc_roundevenf:
3116 if (TLI->has(Func)) {
3117 U.roundToIntegral(APFloat::rmNearestTiesToEven);
3118 return ConstantFP::get(Ty, U);
3119 }
3120 break;
3121 case LibFunc_round:
3122 case LibFunc_roundf:
3123 if (TLI->has(Func)) {
3124 U.roundToIntegral(APFloat::rmNearestTiesToAway);
3125 return ConstantFP::get(Ty, U);
3126 }
3127 break;
3128 case LibFunc_sin:
3129 case LibFunc_sinf:
3130 if (TLI->has(Func))
3131 return ConstantFoldFP(sin, APF, Ty);
3132 break;
3133 case LibFunc_sinh:
3134 case LibFunc_sinhf:
3135 case LibFunc_sinh_finite:
3136 case LibFunc_sinhf_finite:
3137 if (TLI->has(Func))
3138 return ConstantFoldFP(sinh, APF, Ty);
3139 break;
3140 case LibFunc_sqrt:
3141 case LibFunc_sqrtf:
3142 if (!APF.isNegative() && TLI->has(Func))
3143 return ConstantFoldFP(sqrt, APF, Ty);
3144 break;
3145 case LibFunc_tan:
3146 case LibFunc_tanf:
3147 if (TLI->has(Func))
3148 return ConstantFoldFP(tan, APF, Ty);
3149 break;
3150 case LibFunc_tanh:
3151 case LibFunc_tanhf:
3152 if (TLI->has(Func))
3153 return ConstantFoldFP(tanh, APF, Ty);
3154 break;
3155 case LibFunc_trunc:
3156 case LibFunc_truncf:
3157 if (TLI->has(Func)) {
3158 U.roundToIntegral(APFloat::rmTowardZero);
3159 return ConstantFP::get(Ty, U);
3160 }
3161 break;
3162 }
3163 return nullptr;
3164 }
3165
3166 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
3167 switch (IntrinsicID) {
3168 case Intrinsic::bswap:
3169 return ConstantInt::get(Ty->getContext(), Op->getValue().byteSwap());
3170 case Intrinsic::ctpop:
3171 return ConstantInt::get(Ty, Op->getValue().popcount());
3172 case Intrinsic::bitreverse:
3173 return ConstantInt::get(Ty->getContext(), Op->getValue().reverseBits());
3174 case Intrinsic::amdgcn_s_wqm: {
3175 uint64_t Val = Op->getZExtValue();
3176 Val |= (Val & 0x5555555555555555ULL) << 1 |
3177 ((Val >> 1) & 0x5555555555555555ULL);
3178 Val |= (Val & 0x3333333333333333ULL) << 2 |
3179 ((Val >> 2) & 0x3333333333333333ULL);
3180 return ConstantInt::get(Ty, Val);
3181 }
3182
3183 case Intrinsic::amdgcn_s_quadmask: {
3184 uint64_t Val = Op->getZExtValue();
3185 uint64_t QuadMask = 0;
3186 for (unsigned I = 0; I < Op->getBitWidth() / 4; ++I, Val >>= 4) {
3187 if (!(Val & 0xF))
3188 continue;
3189
3190 QuadMask |= (1ULL << I);
3191 }
3192 return ConstantInt::get(Ty, QuadMask);
3193 }
3194
3195 case Intrinsic::amdgcn_s_bitreplicate: {
3196 uint64_t Val = Op->getZExtValue();
3197 Val = (Val & 0x000000000000FFFFULL) | (Val & 0x00000000FFFF0000ULL) << 16;
3198 Val = (Val & 0x000000FF000000FFULL) | (Val & 0x0000FF000000FF00ULL) << 8;
3199 Val = (Val & 0x000F000F000F000FULL) | (Val & 0x00F000F000F000F0ULL) << 4;
3200 Val = (Val & 0x0303030303030303ULL) | (Val & 0x0C0C0C0C0C0C0C0CULL) << 2;
3201 Val = (Val & 0x1111111111111111ULL) | (Val & 0x2222222222222222ULL) << 1;
3202 Val = Val | Val << 1;
3203 return ConstantInt::get(Ty, Val);
3204 }
3205 }
3206 }
3207
3208 if (Operands[0]->getType()->isVectorTy()) {
3209 auto *Op = cast<Constant>(Operands[0]);
3210 switch (IntrinsicID) {
3211 default: break;
3212 case Intrinsic::vector_reduce_add:
3213 case Intrinsic::vector_reduce_mul:
3214 case Intrinsic::vector_reduce_and:
3215 case Intrinsic::vector_reduce_or:
3216 case Intrinsic::vector_reduce_xor:
3217 case Intrinsic::vector_reduce_smin:
3218 case Intrinsic::vector_reduce_smax:
3219 case Intrinsic::vector_reduce_umin:
3220 case Intrinsic::vector_reduce_umax:
3221 if (Constant *C = constantFoldVectorReduce(IntrinsicID, Operands[0]))
3222 return C;
3223 break;
3224 case Intrinsic::x86_sse_cvtss2si:
3225 case Intrinsic::x86_sse_cvtss2si64:
3226 case Intrinsic::x86_sse2_cvtsd2si:
3227 case Intrinsic::x86_sse2_cvtsd2si64:
3228 if (ConstantFP *FPOp =
3229 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3230 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3231 /*roundTowardZero=*/false, Ty,
3232 /*IsSigned*/true);
3233 break;
3234 case Intrinsic::x86_sse_cvttss2si:
3235 case Intrinsic::x86_sse_cvttss2si64:
3236 case Intrinsic::x86_sse2_cvttsd2si:
3237 case Intrinsic::x86_sse2_cvttsd2si64:
3238 if (ConstantFP *FPOp =
3239 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3240 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3241 /*roundTowardZero=*/true, Ty,
3242 /*IsSigned*/true);
3243 break;
3244
3245 case Intrinsic::wasm_anytrue:
3246 return Op->isNullValue() ? ConstantInt::get(Ty, 0)
3247 : ConstantInt::get(Ty, 1);
3248
3249 case Intrinsic::wasm_alltrue:
3250 // Check each element individually
3251 unsigned E = cast<FixedVectorType>(Op->getType())->getNumElements();
3252 for (unsigned I = 0; I != E; ++I) {
3253 Constant *Elt = Op->getAggregateElement(I);
3254 // Return false as soon as we find a non-true element.
3255 if (Elt && Elt->isNullValue())
3256 return ConstantInt::get(Ty, 0);
3257 // Bail as soon as we find an element we cannot prove to be true.
3258 if (!Elt || !isa<ConstantInt>(Elt))
3259 return nullptr;
3260 }
3261
3262 return ConstantInt::get(Ty, 1);
3263 }
3264 }
3265
3266 return nullptr;
3267}
3268
3269static Constant *evaluateCompare(const APFloat &Op1, const APFloat &Op2,
3273 FCmpInst::Predicate Cond = FCmp->getPredicate();
3274 if (FCmp->isSignaling()) {
3275 if (Op1.isNaN() || Op2.isNaN())
3277 } else {
3278 if (Op1.isSignaling() || Op2.isSignaling())
3280 }
3281 bool Result = FCmpInst::compare(Op1, Op2, Cond);
3282 if (mayFoldConstrained(const_cast<ConstrainedFPCmpIntrinsic *>(FCmp), St))
3283 return ConstantInt::get(Call->getType()->getScalarType(), Result);
3284 return nullptr;
3285}
3286
3287static Constant *ConstantFoldLibCall2(StringRef Name, Type *Ty,
3288 ArrayRef<Constant *> Operands,
3289 const TargetLibraryInfo *TLI) {
3290 if (!TLI)
3291 return nullptr;
3292
3293 LibFunc Func = NotLibFunc;
3294 if (!TLI->getLibFunc(Name, Func))
3295 return nullptr;
3296
3297 const auto *Op1 = dyn_cast<ConstantFP>(Operands[0]);
3298 if (!Op1)
3299 return nullptr;
3300
3301 const auto *Op2 = dyn_cast<ConstantFP>(Operands[1]);
3302 if (!Op2)
3303 return nullptr;
3304
3305 const APFloat &Op1V = Op1->getValueAPF();
3306 const APFloat &Op2V = Op2->getValueAPF();
3307
3308 switch (Func) {
3309 default:
3310 break;
3311 case LibFunc_pow:
3312 case LibFunc_powf:
3313 case LibFunc_pow_finite:
3314 case LibFunc_powf_finite:
3315 if (TLI->has(Func))
3316 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3317 break;
3318 case LibFunc_fmod:
3319 case LibFunc_fmodf:
3320 if (TLI->has(Func)) {
3321 APFloat V = Op1->getValueAPF();
3322 if (APFloat::opStatus::opOK == V.mod(Op2->getValueAPF()))
3323 return ConstantFP::get(Ty, V);
3324 }
3325 break;
3326 case LibFunc_remainder:
3327 case LibFunc_remainderf:
3328 if (TLI->has(Func)) {
3329 APFloat V = Op1->getValueAPF();
3330 if (APFloat::opStatus::opOK == V.remainder(Op2->getValueAPF()))
3331 return ConstantFP::get(Ty, V);
3332 }
3333 break;
3334 case LibFunc_atan2:
3335 case LibFunc_atan2f:
3336 // atan2(+/-0.0, +/-0.0) is known to raise an exception on some libm
3337 // (Solaris), so we do not assume a known result for that.
3338 if (Op1V.isZero() && Op2V.isZero())
3339 return nullptr;
3340 [[fallthrough]];
3341 case LibFunc_atan2_finite:
3342 case LibFunc_atan2f_finite:
3343 if (TLI->has(Func))
3344 return ConstantFoldBinaryFP(atan2, Op1V, Op2V, Ty);
3345 break;
3346 }
3347
3348 return nullptr;
3349}
3350
3351static Constant *ConstantFoldIntrinsicCall2(Intrinsic::ID IntrinsicID, Type *Ty,
3352 ArrayRef<Constant *> Operands,
3353 const CallBase *Call) {
3354 assert(Operands.size() == 2 && "Wrong number of operands.");
3355
3356 if (Ty->isFloatingPointTy()) {
3357 // TODO: We should have undef handling for all of the FP intrinsics that
3358 // are attempted to be folded in this function.
3359 bool IsOp0Undef = isa<UndefValue>(Operands[0]);
3360 bool IsOp1Undef = isa<UndefValue>(Operands[1]);
3361 switch (IntrinsicID) {
3362 case Intrinsic::maxnum:
3363 case Intrinsic::minnum:
3364 case Intrinsic::maximum:
3365 case Intrinsic::minimum:
3366 case Intrinsic::maximumnum:
3367 case Intrinsic::minimumnum:
3368 case Intrinsic::nvvm_fmax_d:
3369 case Intrinsic::nvvm_fmin_d:
3370 // If one argument is undef, return the other argument.
3371 if (IsOp0Undef)
3372 return Operands[1];
3373 if (IsOp1Undef)
3374 return Operands[0];
3375 break;
3376
3377 case Intrinsic::nvvm_fmax_f:
3378 case Intrinsic::nvvm_fmax_ftz_f:
3379 case Intrinsic::nvvm_fmax_ftz_nan_f:
3380 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3381 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3382 case Intrinsic::nvvm_fmax_nan_f:
3383 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3384 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3385
3386 case Intrinsic::nvvm_fmin_f:
3387 case Intrinsic::nvvm_fmin_ftz_f:
3388 case Intrinsic::nvvm_fmin_ftz_nan_f:
3389 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3390 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3391 case Intrinsic::nvvm_fmin_nan_f:
3392 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3393 case Intrinsic::nvvm_fmin_xorsign_abs_f:
3394 // If one arg is undef, the other arg can be returned only if it is
3395 // constant, as we may need to flush it to sign-preserving zero or
3396 // canonicalize the NaN.
3397 if (!IsOp0Undef && !IsOp1Undef)
3398 break;
3399 if (auto *Op = dyn_cast<ConstantFP>(Operands[IsOp0Undef ? 1 : 0])) {
3400 if (Op->isNaN()) {
3401 APInt NVCanonicalNaN(32, 0x7fffffff);
3402 return ConstantFP::get(
3403 Ty, APFloat(Ty->getFltSemantics(), NVCanonicalNaN));
3404 }
3405 if (nvvm::FMinFMaxShouldFTZ(IntrinsicID))
3406 return ConstantFP::get(Ty, FTZPreserveSign(Op->getValueAPF()));
3407 else
3408 return Op;
3409 }
3410 break;
3411 }
3412 }
3413
3414 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3415 const APFloat &Op1V = Op1->getValueAPF();
3416
3417 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3418 if (Op2->getType() != Op1->getType())
3419 return nullptr;
3420 const APFloat &Op2V = Op2->getValueAPF();
3421
3422 if (const auto *ConstrIntr =
3424 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3425 APFloat Res = Op1V;
3427 switch (IntrinsicID) {
3428 default:
3429 return nullptr;
3430 case Intrinsic::experimental_constrained_fadd:
3431 St = Res.add(Op2V, RM);
3432 break;
3433 case Intrinsic::experimental_constrained_fsub:
3434 St = Res.subtract(Op2V, RM);
3435 break;
3436 case Intrinsic::experimental_constrained_fmul:
3437 St = Res.multiply(Op2V, RM);
3438 break;
3439 case Intrinsic::experimental_constrained_fdiv:
3440 St = Res.divide(Op2V, RM);
3441 break;
3442 case Intrinsic::experimental_constrained_frem:
3443 St = Res.mod(Op2V);
3444 break;
3445 case Intrinsic::experimental_constrained_fcmp:
3446 case Intrinsic::experimental_constrained_fcmps:
3447 return evaluateCompare(Op1V, Op2V, ConstrIntr);
3448 }
3449 if (mayFoldConstrained(const_cast<ConstrainedFPIntrinsic *>(ConstrIntr),
3450 St))
3451 return ConstantFP::get(Ty, Res);
3452 return nullptr;
3453 }
3454
3455 switch (IntrinsicID) {
3456 default:
3457 break;
3458 case Intrinsic::copysign:
3459 return ConstantFP::get(Ty, APFloat::copySign(Op1V, Op2V));
3460 case Intrinsic::minnum:
3461 return ConstantFP::get(Ty, minnum(Op1V, Op2V));
3462 case Intrinsic::maxnum:
3463 return ConstantFP::get(Ty, maxnum(Op1V, Op2V));
3464 case Intrinsic::minimum:
3465 return ConstantFP::get(Ty, minimum(Op1V, Op2V));
3466 case Intrinsic::maximum:
3467 return ConstantFP::get(Ty, maximum(Op1V, Op2V));
3468 case Intrinsic::minimumnum:
3469 return ConstantFP::get(Ty, minimumnum(Op1V, Op2V));
3470 case Intrinsic::maximumnum:
3471 return ConstantFP::get(Ty, maximumnum(Op1V, Op2V));
3472
3473 case Intrinsic::nvvm_fmax_d:
3474 case Intrinsic::nvvm_fmax_f:
3475 case Intrinsic::nvvm_fmax_ftz_f:
3476 case Intrinsic::nvvm_fmax_ftz_nan_f:
3477 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3478 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3479 case Intrinsic::nvvm_fmax_nan_f:
3480 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3481 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3482
3483 case Intrinsic::nvvm_fmin_d:
3484 case Intrinsic::nvvm_fmin_f:
3485 case Intrinsic::nvvm_fmin_ftz_f:
3486 case Intrinsic::nvvm_fmin_ftz_nan_f:
3487 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3488 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3489 case Intrinsic::nvvm_fmin_nan_f:
3490 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3491 case Intrinsic::nvvm_fmin_xorsign_abs_f: {
3492
3493 bool ShouldCanonicalizeNaNs = !(IntrinsicID == Intrinsic::nvvm_fmax_d ||
3494 IntrinsicID == Intrinsic::nvvm_fmin_d);
3495 bool IsFTZ = nvvm::FMinFMaxShouldFTZ(IntrinsicID);
3496 bool IsNaNPropagating = nvvm::FMinFMaxPropagatesNaNs(IntrinsicID);
3497 bool IsXorSignAbs = nvvm::FMinFMaxIsXorSignAbs(IntrinsicID);
3498
3499 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3500 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3501
3502 bool XorSign = false;
3503 if (IsXorSignAbs) {
3504 XorSign = A.isNegative() ^ B.isNegative();
3505 A = abs(A);
3506 B = abs(B);
3507 }
3508
3509 bool IsFMax = false;
3510 switch (IntrinsicID) {
3511 case Intrinsic::nvvm_fmax_d:
3512 case Intrinsic::nvvm_fmax_f:
3513 case Intrinsic::nvvm_fmax_ftz_f:
3514 case Intrinsic::nvvm_fmax_ftz_nan_f:
3515 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3516 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3517 case Intrinsic::nvvm_fmax_nan_f:
3518 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3519 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3520 IsFMax = true;
3521 break;
3522 }
3523 APFloat Res =
3524 IsFMax ? (IsNaNPropagating ? maximum(A, B) : maximumnum(A, B))
3525 : (IsNaNPropagating ? minimum(A, B) : minimumnum(A, B));
3526
3527 if (ShouldCanonicalizeNaNs && Res.isNaN()) {
3528 APFloat NVCanonicalNaN(Res.getSemantics(), APInt(32, 0x7fffffff));
3529 return ConstantFP::get(Ty, NVCanonicalNaN);
3530 }
3531
3532 if (IsXorSignAbs && XorSign != Res.isNegative())
3533 Res.changeSign();
3534
3535 return ConstantFP::get(Ty, Res);
3536 }
3537
3538 case Intrinsic::nvvm_add_rm_f:
3539 case Intrinsic::nvvm_add_rn_f:
3540 case Intrinsic::nvvm_add_rp_f:
3541 case Intrinsic::nvvm_add_rz_f:
3542 case Intrinsic::nvvm_add_rm_d:
3543 case Intrinsic::nvvm_add_rn_d:
3544 case Intrinsic::nvvm_add_rp_d:
3545 case Intrinsic::nvvm_add_rz_d:
3546 case Intrinsic::nvvm_add_rm_ftz_f:
3547 case Intrinsic::nvvm_add_rn_ftz_f:
3548 case Intrinsic::nvvm_add_rp_ftz_f:
3549 case Intrinsic::nvvm_add_rz_ftz_f: {
3550
3551 bool IsFTZ = nvvm::FAddShouldFTZ(IntrinsicID);
3552 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3553 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3554
3555 APFloat::roundingMode RoundMode =
3556 nvvm::GetFAddRoundingMode(IntrinsicID);
3557
3558 APFloat Res = A;
3559 APFloat::opStatus Status = Res.add(B, RoundMode);
3560
3561 if (!Res.isNaN() &&
3563 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3564 return ConstantFP::get(Ty, Res);
3565 }
3566 return nullptr;
3567 }
3568
3569 case Intrinsic::nvvm_mul_rm_f:
3570 case Intrinsic::nvvm_mul_rn_f:
3571 case Intrinsic::nvvm_mul_rp_f:
3572 case Intrinsic::nvvm_mul_rz_f:
3573 case Intrinsic::nvvm_mul_rm_d:
3574 case Intrinsic::nvvm_mul_rn_d:
3575 case Intrinsic::nvvm_mul_rp_d:
3576 case Intrinsic::nvvm_mul_rz_d:
3577 case Intrinsic::nvvm_mul_rm_ftz_f:
3578 case Intrinsic::nvvm_mul_rn_ftz_f:
3579 case Intrinsic::nvvm_mul_rp_ftz_f:
3580 case Intrinsic::nvvm_mul_rz_ftz_f: {
3581
3582 bool IsFTZ = nvvm::FMulShouldFTZ(IntrinsicID);
3583 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3584 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3585
3586 APFloat::roundingMode RoundMode =
3587 nvvm::GetFMulRoundingMode(IntrinsicID);
3588
3589 APFloat Res = A;
3590 APFloat::opStatus Status = Res.multiply(B, RoundMode);
3591
3592 if (!Res.isNaN() &&
3594 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3595 return ConstantFP::get(Ty, Res);
3596 }
3597 return nullptr;
3598 }
3599
3600 case Intrinsic::nvvm_div_rm_f:
3601 case Intrinsic::nvvm_div_rn_f:
3602 case Intrinsic::nvvm_div_rp_f:
3603 case Intrinsic::nvvm_div_rz_f:
3604 case Intrinsic::nvvm_div_rm_d:
3605 case Intrinsic::nvvm_div_rn_d:
3606 case Intrinsic::nvvm_div_rp_d:
3607 case Intrinsic::nvvm_div_rz_d:
3608 case Intrinsic::nvvm_div_rm_ftz_f:
3609 case Intrinsic::nvvm_div_rn_ftz_f:
3610 case Intrinsic::nvvm_div_rp_ftz_f:
3611 case Intrinsic::nvvm_div_rz_ftz_f: {
3612 bool IsFTZ = nvvm::FDivShouldFTZ(IntrinsicID);
3613 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3614 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3615 APFloat::roundingMode RoundMode =
3616 nvvm::GetFDivRoundingMode(IntrinsicID);
3617
3618 APFloat Res = A;
3619 APFloat::opStatus Status = Res.divide(B, RoundMode);
3620 if (!Res.isNaN() &&
3622 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3623 return ConstantFP::get(Ty, Res);
3624 }
3625 return nullptr;
3626 }
3627 }
3628
3629 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy())
3630 return nullptr;
3631
3632 switch (IntrinsicID) {
3633 default:
3634 break;
3635 case Intrinsic::pow:
3636 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3637 case Intrinsic::amdgcn_fmul_legacy:
3638 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3639 // NaN or infinity, gives +0.0.
3640 if (Op1V.isZero() || Op2V.isZero())
3641 return ConstantFP::getZero(Ty);
3642 return ConstantFP::get(Ty, Op1V * Op2V);
3643 }
3644
3645 } else if (auto *Op2C = dyn_cast<ConstantInt>(Operands[1])) {
3646 switch (IntrinsicID) {
3647 case Intrinsic::ldexp: {
3648 return ConstantFP::get(
3649 Ty->getContext(),
3650 scalbn(Op1V, Op2C->getSExtValue(), APFloat::rmNearestTiesToEven));
3651 }
3652 case Intrinsic::is_fpclass: {
3653 FPClassTest Mask = static_cast<FPClassTest>(Op2C->getZExtValue());
3654 bool Result =
3655 ((Mask & fcSNan) && Op1V.isNaN() && Op1V.isSignaling()) ||
3656 ((Mask & fcQNan) && Op1V.isNaN() && !Op1V.isSignaling()) ||
3657 ((Mask & fcNegInf) && Op1V.isNegInfinity()) ||
3658 ((Mask & fcNegNormal) && Op1V.isNormal() && Op1V.isNegative()) ||
3659 ((Mask & fcNegSubnormal) && Op1V.isDenormal() && Op1V.isNegative()) ||
3660 ((Mask & fcNegZero) && Op1V.isZero() && Op1V.isNegative()) ||
3661 ((Mask & fcPosZero) && Op1V.isZero() && !Op1V.isNegative()) ||
3662 ((Mask & fcPosSubnormal) && Op1V.isDenormal() && !Op1V.isNegative()) ||
3663 ((Mask & fcPosNormal) && Op1V.isNormal() && !Op1V.isNegative()) ||
3664 ((Mask & fcPosInf) && Op1V.isPosInfinity());
3665 return ConstantInt::get(Ty, Result);
3666 }
3667 case Intrinsic::powi: {
3668 int Exp = static_cast<int>(Op2C->getSExtValue());
3669 switch (Ty->getTypeID()) {
3670 case Type::HalfTyID:
3671 case Type::FloatTyID: {
3672 APFloat Res(static_cast<float>(std::pow(Op1V.convertToFloat(), Exp)));
3673 if (Ty->isHalfTy()) {
3674 bool Unused;
3676 &Unused);
3677 }
3678 return ConstantFP::get(Ty, Res);
3679 }
3680 case Type::DoubleTyID:
3681 return ConstantFP::get(Ty, std::pow(Op1V.convertToDouble(), Exp));
3682 default:
3683 return nullptr;
3684 }
3685 }
3686 default:
3687 break;
3688 }
3689 }
3690 return nullptr;
3691 }
3692
3693 if (Operands[0]->getType()->isIntegerTy() &&
3694 Operands[1]->getType()->isIntegerTy()) {
3695 const APInt *C0, *C1;
3696 if (!getConstIntOrUndef(Operands[0], C0) ||
3697 !getConstIntOrUndef(Operands[1], C1))
3698 return nullptr;
3699
3700 switch (IntrinsicID) {
3701 default: break;
3702 case Intrinsic::smax:
3703 case Intrinsic::smin:
3704 case Intrinsic::umax:
3705 case Intrinsic::umin:
3706 if (!C0 && !C1)
3707 return UndefValue::get(Ty);
3708 if (!C0 || !C1)
3709 return MinMaxIntrinsic::getSaturationPoint(IntrinsicID, Ty);
3710 return ConstantInt::get(
3711 Ty, ICmpInst::compare(*C0, *C1,
3712 MinMaxIntrinsic::getPredicate(IntrinsicID))
3713 ? *C0
3714 : *C1);
3715
3716 case Intrinsic::scmp:
3717 case Intrinsic::ucmp:
3718 if (!C0 || !C1)
3719 return ConstantInt::get(Ty, 0);
3720
3721 int Res;
3722 if (IntrinsicID == Intrinsic::scmp)
3723 Res = C0->sgt(*C1) ? 1 : C0->slt(*C1) ? -1 : 0;
3724 else
3725 Res = C0->ugt(*C1) ? 1 : C0->ult(*C1) ? -1 : 0;
3726 return ConstantInt::get(Ty, Res, /*IsSigned=*/true);
3727
3728 case Intrinsic::usub_with_overflow:
3729 case Intrinsic::ssub_with_overflow:
3730 // X - undef -> { 0, false }
3731 // undef - X -> { 0, false }
3732 if (!C0 || !C1)
3733 return Constant::getNullValue(Ty);
3734 [[fallthrough]];
3735 case Intrinsic::uadd_with_overflow:
3736 case Intrinsic::sadd_with_overflow:
3737 // X + undef -> { -1, false }
3738 // undef + x -> { -1, false }
3739 if (!C0 || !C1) {
3740 return ConstantStruct::get(
3741 cast<StructType>(Ty),
3742 {Constant::getAllOnesValue(Ty->getStructElementType(0)),
3743 Constant::getNullValue(Ty->getStructElementType(1))});
3744 }
3745 [[fallthrough]];
3746 case Intrinsic::smul_with_overflow:
3747 case Intrinsic::umul_with_overflow: {
3748 // undef * X -> { 0, false }
3749 // X * undef -> { 0, false }
3750 if (!C0 || !C1)
3751 return Constant::getNullValue(Ty);
3752
3753 APInt Res;
3754 bool Overflow;
3755 switch (IntrinsicID) {
3756 default: llvm_unreachable("Invalid case");
3757 case Intrinsic::sadd_with_overflow:
3758 Res = C0->sadd_ov(*C1, Overflow);
3759 break;
3760 case Intrinsic::uadd_with_overflow:
3761 Res = C0->uadd_ov(*C1, Overflow);
3762 break;
3763 case Intrinsic::ssub_with_overflow:
3764 Res = C0->ssub_ov(*C1, Overflow);
3765 break;
3766 case Intrinsic::usub_with_overflow:
3767 Res = C0->usub_ov(*C1, Overflow);
3768 break;
3769 case Intrinsic::smul_with_overflow:
3770 Res = C0->smul_ov(*C1, Overflow);
3771 break;
3772 case Intrinsic::umul_with_overflow:
3773 Res = C0->umul_ov(*C1, Overflow);
3774 break;
3775 }
3776 Constant *Ops[] = {
3777 ConstantInt::get(Ty->getContext(), Res),
3778 ConstantInt::get(Type::getInt1Ty(Ty->getContext()), Overflow)
3779 };
3781 }
3782 case Intrinsic::uadd_sat:
3783 case Intrinsic::sadd_sat:
3784 if (!C0 && !C1)
3785 return UndefValue::get(Ty);
3786 if (!C0 || !C1)
3787 return Constant::getAllOnesValue(Ty);
3788 if (IntrinsicID == Intrinsic::uadd_sat)
3789 return ConstantInt::get(Ty, C0->uadd_sat(*C1));
3790 else
3791 return ConstantInt::get(Ty, C0->sadd_sat(*C1));
3792 case Intrinsic::usub_sat:
3793 case Intrinsic::ssub_sat:
3794 if (!C0 && !C1)
3795 return UndefValue::get(Ty);
3796 if (!C0 || !C1)
3797 return Constant::getNullValue(Ty);
3798 if (IntrinsicID == Intrinsic::usub_sat)
3799 return ConstantInt::get(Ty, C0->usub_sat(*C1));
3800 else
3801 return ConstantInt::get(Ty, C0->ssub_sat(*C1));
3802 case Intrinsic::cttz:
3803 case Intrinsic::ctlz:
3804 assert(C1 && "Must be constant int");
3805
3806 // cttz(0, 1) and ctlz(0, 1) are poison.
3807 if (C1->isOne() && (!C0 || C0->isZero()))
3808 return PoisonValue::get(Ty);
3809 if (!C0)
3810 return Constant::getNullValue(Ty);
3811 if (IntrinsicID == Intrinsic::cttz)
3812 return ConstantInt::get(Ty, C0->countr_zero());
3813 else
3814 return ConstantInt::get(Ty, C0->countl_zero());
3815
3816 case Intrinsic::abs:
3817 assert(C1 && "Must be constant int");
3818 assert((C1->isOne() || C1->isZero()) && "Must be 0 or 1");
3819
3820 // Undef or minimum val operand with poison min --> poison
3821 if (C1->isOne() && (!C0 || C0->isMinSignedValue()))
3822 return PoisonValue::get(Ty);
3823
3824 // Undef operand with no poison min --> 0 (sign bit must be clear)
3825 if (!C0)
3826 return Constant::getNullValue(Ty);
3827
3828 return ConstantInt::get(Ty, C0->abs());
3829 case Intrinsic::amdgcn_wave_reduce_umin:
3830 case Intrinsic::amdgcn_wave_reduce_umax:
3831 case Intrinsic::amdgcn_wave_reduce_max:
3832 case Intrinsic::amdgcn_wave_reduce_min:
3833 case Intrinsic::amdgcn_wave_reduce_and:
3834 case Intrinsic::amdgcn_wave_reduce_or:
3835 return Operands[0];
3836 }
3837
3838 return nullptr;
3839 }
3840
3841 // Support ConstantVector in case we have an Undef in the top.
3842 if ((isa<ConstantVector>(Operands[0]) ||
3843 isa<ConstantDataVector>(Operands[0])) &&
3844 // Check for default rounding mode.
3845 // FIXME: Support other rounding modes?
3846 isa<ConstantInt>(Operands[1]) &&
3847 cast<ConstantInt>(Operands[1])->getValue() == 4) {
3848 auto *Op = cast<Constant>(Operands[0]);
3849 switch (IntrinsicID) {
3850 default: break;
3851 case Intrinsic::x86_avx512_vcvtss2si32:
3852 case Intrinsic::x86_avx512_vcvtss2si64:
3853 case Intrinsic::x86_avx512_vcvtsd2si32:
3854 case Intrinsic::x86_avx512_vcvtsd2si64:
3855 if (ConstantFP *FPOp =
3856 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3857 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3858 /*roundTowardZero=*/false, Ty,
3859 /*IsSigned*/true);
3860 break;
3861 case Intrinsic::x86_avx512_vcvtss2usi32:
3862 case Intrinsic::x86_avx512_vcvtss2usi64:
3863 case Intrinsic::x86_avx512_vcvtsd2usi32:
3864 case Intrinsic::x86_avx512_vcvtsd2usi64:
3865 if (ConstantFP *FPOp =
3866 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3867 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3868 /*roundTowardZero=*/false, Ty,
3869 /*IsSigned*/false);
3870 break;
3871 case Intrinsic::x86_avx512_cvttss2si:
3872 case Intrinsic::x86_avx512_cvttss2si64:
3873 case Intrinsic::x86_avx512_cvttsd2si:
3874 case Intrinsic::x86_avx512_cvttsd2si64:
3875 if (ConstantFP *FPOp =
3876 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3877 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3878 /*roundTowardZero=*/true, Ty,
3879 /*IsSigned*/true);
3880 break;
3881 case Intrinsic::x86_avx512_cvttss2usi:
3882 case Intrinsic::x86_avx512_cvttss2usi64:
3883 case Intrinsic::x86_avx512_cvttsd2usi:
3884 case Intrinsic::x86_avx512_cvttsd2usi64:
3885 if (ConstantFP *FPOp =
3886 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3887 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3888 /*roundTowardZero=*/true, Ty,
3889 /*IsSigned*/false);
3890 break;
3891 }
3892 }
3893
3894 if (IntrinsicID == Intrinsic::experimental_cttz_elts) {
3895 auto *FVTy = dyn_cast<FixedVectorType>(Operands[0]->getType());
3896 bool ZeroIsPoison = cast<ConstantInt>(Operands[1])->isOne();
3897 if (!FVTy)
3898 return nullptr;
3899 unsigned Width = Ty->getIntegerBitWidth();
3900 if (APInt::getMaxValue(Width).ult(FVTy->getNumElements()))
3901 return PoisonValue::get(Ty);
3902 for (unsigned I = 0; I < FVTy->getNumElements(); ++I) {
3903 Constant *Elt = Operands[0]->getAggregateElement(I);
3904 if (!Elt)
3905 return nullptr;
3906 if (isa<UndefValue>(Elt) || Elt->isNullValue())
3907 continue;
3908 return ConstantInt::get(Ty, I);
3909 }
3910 if (ZeroIsPoison)
3911 return PoisonValue::get(Ty);
3912 return ConstantInt::get(Ty, FVTy->getNumElements());
3913 }
3914 return nullptr;
3915}
3916
3917static APFloat ConstantFoldAMDGCNCubeIntrinsic(Intrinsic::ID IntrinsicID,
3918 const APFloat &S0,
3919 const APFloat &S1,
3920 const APFloat &S2) {
3921 unsigned ID;
3922 const fltSemantics &Sem = S0.getSemantics();
3923 APFloat MA(Sem), SC(Sem), TC(Sem);
3924 if (abs(S2) >= abs(S0) && abs(S2) >= abs(S1)) {
3925 if (S2.isNegative() && S2.isNonZero() && !S2.isNaN()) {
3926 // S2 < 0
3927 ID = 5;
3928 SC = -S0;
3929 } else {
3930 ID = 4;
3931 SC = S0;
3932 }
3933 MA = S2;
3934 TC = -S1;
3935 } else if (abs(S1) >= abs(S0)) {
3936 if (S1.isNegative() && S1.isNonZero() && !S1.isNaN()) {
3937 // S1 < 0
3938 ID = 3;
3939 TC = -S2;
3940 } else {
3941 ID = 2;
3942 TC = S2;
3943 }
3944 MA = S1;
3945 SC = S0;
3946 } else {
3947 if (S0.isNegative() && S0.isNonZero() && !S0.isNaN()) {
3948 // S0 < 0
3949 ID = 1;
3950 SC = S2;
3951 } else {
3952 ID = 0;
3953 SC = -S2;
3954 }
3955 MA = S0;
3956 TC = -S1;
3957 }
3958 switch (IntrinsicID) {
3959 default:
3960 llvm_unreachable("unhandled amdgcn cube intrinsic");
3961 case Intrinsic::amdgcn_cubeid:
3962 return APFloat(Sem, ID);
3963 case Intrinsic::amdgcn_cubema:
3964 return MA + MA;
3965 case Intrinsic::amdgcn_cubesc:
3966 return SC;
3967 case Intrinsic::amdgcn_cubetc:
3968 return TC;
3969 }
3970}
3971
3972static Constant *ConstantFoldAMDGCNPermIntrinsic(ArrayRef<Constant *> Operands,
3973 Type *Ty) {
3974 const APInt *C0, *C1, *C2;
3975 if (!getConstIntOrUndef(Operands[0], C0) ||
3976 !getConstIntOrUndef(Operands[1], C1) ||
3977 !getConstIntOrUndef(Operands[2], C2))
3978 return nullptr;
3979
3980 if (!C2)
3981 return UndefValue::get(Ty);
3982
3983 APInt Val(32, 0);
3984 unsigned NumUndefBytes = 0;
3985 for (unsigned I = 0; I < 32; I += 8) {
3986 unsigned Sel = C2->extractBitsAsZExtValue(8, I);
3987 unsigned B = 0;
3988
3989 if (Sel >= 13)
3990 B = 0xff;
3991 else if (Sel == 12)
3992 B = 0x00;
3993 else {
3994 const APInt *Src = ((Sel & 10) == 10 || (Sel & 12) == 4) ? C0 : C1;
3995 if (!Src)
3996 ++NumUndefBytes;
3997 else if (Sel < 8)
3998 B = Src->extractBitsAsZExtValue(8, (Sel & 3) * 8);
3999 else
4000 B = Src->extractBitsAsZExtValue(1, (Sel & 1) ? 31 : 15) * 0xff;
4001 }
4002
4003 Val.insertBits(B, I, 8);
4004 }
4005
4006 if (NumUndefBytes == 4)
4007 return UndefValue::get(Ty);
4008
4009 return ConstantInt::get(Ty, Val);
4010}
4011
4012static Constant *ConstantFoldScalarCall3(StringRef Name,
4013 Intrinsic::ID IntrinsicID,
4014 Type *Ty,
4015 ArrayRef<Constant *> Operands,
4016 const TargetLibraryInfo *TLI,
4017 const CallBase *Call) {
4018 assert(Operands.size() == 3 && "Wrong number of operands.");
4019
4020 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
4021 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
4022 if (const auto *Op3 = dyn_cast<ConstantFP>(Operands[2])) {
4023 const APFloat &C1 = Op1->getValueAPF();
4024 const APFloat &C2 = Op2->getValueAPF();
4025 const APFloat &C3 = Op3->getValueAPF();
4026
4027 if (const auto *ConstrIntr = dyn_cast<ConstrainedFPIntrinsic>(Call)) {
4028 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
4029 APFloat Res = C1;
4031 switch (IntrinsicID) {
4032 default:
4033 return nullptr;
4034 case Intrinsic::experimental_constrained_fma:
4035 case Intrinsic::experimental_constrained_fmuladd:
4036 St = Res.fusedMultiplyAdd(C2, C3, RM);
4037 break;
4038 }
4039 if (mayFoldConstrained(
4040 const_cast<ConstrainedFPIntrinsic *>(ConstrIntr), St))
4041 return ConstantFP::get(Ty, Res);
4042 return nullptr;
4043 }
4044
4045 switch (IntrinsicID) {
4046 default: break;
4047 case Intrinsic::amdgcn_fma_legacy: {
4048 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
4049 // NaN or infinity, gives +0.0.
4050 if (C1.isZero() || C2.isZero()) {
4051 // It's tempting to just return C3 here, but that would give the
4052 // wrong result if C3 was -0.0.
4053 return ConstantFP::get(Ty, APFloat(0.0f) + C3);
4054 }
4055 [[fallthrough]];
4056 }
4057 case Intrinsic::fma:
4058 case Intrinsic::fmuladd: {
4059 APFloat V = C1;
4061 return ConstantFP::get(Ty, V);
4062 }
4063
4064 case Intrinsic::nvvm_fma_rm_f:
4065 case Intrinsic::nvvm_fma_rn_f:
4066 case Intrinsic::nvvm_fma_rp_f:
4067 case Intrinsic::nvvm_fma_rz_f:
4068 case Intrinsic::nvvm_fma_rm_d:
4069 case Intrinsic::nvvm_fma_rn_d:
4070 case Intrinsic::nvvm_fma_rp_d:
4071 case Intrinsic::nvvm_fma_rz_d:
4072 case Intrinsic::nvvm_fma_rm_ftz_f:
4073 case Intrinsic::nvvm_fma_rn_ftz_f:
4074 case Intrinsic::nvvm_fma_rp_ftz_f:
4075 case Intrinsic::nvvm_fma_rz_ftz_f: {
4076 bool IsFTZ = nvvm::FMAShouldFTZ(IntrinsicID);
4077 APFloat A = IsFTZ ? FTZPreserveSign(C1) : C1;
4078 APFloat B = IsFTZ ? FTZPreserveSign(C2) : C2;
4079 APFloat C = IsFTZ ? FTZPreserveSign(C3) : C3;
4080
4081 APFloat::roundingMode RoundMode =
4082 nvvm::GetFMARoundingMode(IntrinsicID);
4083
4084 APFloat Res = A;
4085 APFloat::opStatus Status = Res.fusedMultiplyAdd(B, C, RoundMode);
4086
4087 if (!Res.isNaN() &&
4089 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
4090 return ConstantFP::get(Ty, Res);
4091 }
4092 return nullptr;
4093 }
4094
4095 case Intrinsic::amdgcn_cubeid:
4096 case Intrinsic::amdgcn_cubema:
4097 case Intrinsic::amdgcn_cubesc:
4098 case Intrinsic::amdgcn_cubetc: {
4099 APFloat V = ConstantFoldAMDGCNCubeIntrinsic(IntrinsicID, C1, C2, C3);
4100 return ConstantFP::get(Ty, V);
4101 }
4102 }
4103 }
4104 }
4105 }
4106
4107 if (IntrinsicID == Intrinsic::smul_fix ||
4108 IntrinsicID == Intrinsic::smul_fix_sat) {
4109 const APInt *C0, *C1;
4110 if (!getConstIntOrUndef(Operands[0], C0) ||
4111 !getConstIntOrUndef(Operands[1], C1))
4112 return nullptr;
4113
4114 // undef * C -> 0
4115 // C * undef -> 0
4116 if (!C0 || !C1)
4117 return Constant::getNullValue(Ty);
4118
4119 // This code performs rounding towards negative infinity in case the result
4120 // cannot be represented exactly for the given scale. Targets that do care
4121 // about rounding should use a target hook for specifying how rounding
4122 // should be done, and provide their own folding to be consistent with
4123 // rounding. This is the same approach as used by
4124 // DAGTypeLegalizer::ExpandIntRes_MULFIX.
4125 unsigned Scale = cast<ConstantInt>(Operands[2])->getZExtValue();
4126 unsigned Width = C0->getBitWidth();
4127 assert(Scale < Width && "Illegal scale.");
4128 unsigned ExtendedWidth = Width * 2;
4129 APInt Product =
4130 (C0->sext(ExtendedWidth) * C1->sext(ExtendedWidth)).ashr(Scale);
4131 if (IntrinsicID == Intrinsic::smul_fix_sat) {
4132 APInt Max = APInt::getSignedMaxValue(Width).sext(ExtendedWidth);
4133 APInt Min = APInt::getSignedMinValue(Width).sext(ExtendedWidth);
4134 Product = APIntOps::smin(Product, Max);
4135 Product = APIntOps::smax(Product, Min);
4136 }
4137 return ConstantInt::get(Ty->getContext(), Product.sextOrTrunc(Width));
4138 }
4139
4140 if (IntrinsicID == Intrinsic::fshl || IntrinsicID == Intrinsic::fshr) {
4141 const APInt *C0, *C1, *C2;
4142 if (!getConstIntOrUndef(Operands[0], C0) ||
4143 !getConstIntOrUndef(Operands[1], C1) ||
4144 !getConstIntOrUndef(Operands[2], C2))
4145 return nullptr;
4146
4147 bool IsRight = IntrinsicID == Intrinsic::fshr;
4148 if (!C2)
4149 return Operands[IsRight ? 1 : 0];
4150 if (!C0 && !C1)
4151 return UndefValue::get(Ty);
4152
4153 // The shift amount is interpreted as modulo the bitwidth. If the shift
4154 // amount is effectively 0, avoid UB due to oversized inverse shift below.
4155 unsigned BitWidth = C2->getBitWidth();
4156 unsigned ShAmt = C2->urem(BitWidth);
4157 if (!ShAmt)
4158 return Operands[IsRight ? 1 : 0];
4159
4160 // (C0 << ShlAmt) | (C1 >> LshrAmt)
4161 unsigned LshrAmt = IsRight ? ShAmt : BitWidth - ShAmt;
4162 unsigned ShlAmt = !IsRight ? ShAmt : BitWidth - ShAmt;
4163 if (!C0)
4164 return ConstantInt::get(Ty, C1->lshr(LshrAmt));
4165 if (!C1)
4166 return ConstantInt::get(Ty, C0->shl(ShlAmt));
4167 return ConstantInt::get(Ty, C0->shl(ShlAmt) | C1->lshr(LshrAmt));
4168 }
4169
4170 if (IntrinsicID == Intrinsic::amdgcn_perm)
4171 return ConstantFoldAMDGCNPermIntrinsic(Operands, Ty);
4172
4173 return nullptr;
4174}
4175
4176static Constant *ConstantFoldScalarCall(StringRef Name,
4177 Intrinsic::ID IntrinsicID,
4178 Type *Ty,
4179 ArrayRef<Constant *> Operands,
4180 const TargetLibraryInfo *TLI,
4181 const CallBase *Call) {
4182 if (IntrinsicID != Intrinsic::not_intrinsic &&
4183 any_of(Operands, IsaPred<PoisonValue>) &&
4184 intrinsicPropagatesPoison(IntrinsicID))
4185 return PoisonValue::get(Ty);
4186
4187 if (Operands.size() == 1)
4188 return ConstantFoldScalarCall1(Name, IntrinsicID, Ty, Operands, TLI, Call);
4189
4190 if (Operands.size() == 2) {
4191 if (Constant *FoldedLibCall =
4192 ConstantFoldLibCall2(Name, Ty, Operands, TLI)) {
4193 return FoldedLibCall;
4194 }
4195 return ConstantFoldIntrinsicCall2(IntrinsicID, Ty, Operands, Call);
4196 }
4197
4198 if (Operands.size() == 3)
4199 return ConstantFoldScalarCall3(Name, IntrinsicID, Ty, Operands, TLI, Call);
4200
4201 return nullptr;
4202}
4203
4204static Constant *ConstantFoldFixedVectorCall(
4205 StringRef Name, Intrinsic::ID IntrinsicID, FixedVectorType *FVTy,
4206 ArrayRef<Constant *> Operands, const DataLayout &DL,
4207 const TargetLibraryInfo *TLI, const CallBase *Call) {
4209 SmallVector<Constant *, 4> Lane(Operands.size());
4210 Type *Ty = FVTy->getElementType();
4211
4212 switch (IntrinsicID) {
4213 case Intrinsic::masked_load: {
4214 auto *SrcPtr = Operands[0];
4215 auto *Mask = Operands[1];
4216 auto *Passthru = Operands[2];
4217
4218 Constant *VecData = ConstantFoldLoadFromConstPtr(SrcPtr, FVTy, DL);
4219
4220 SmallVector<Constant *, 32> NewElements;
4221 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4222 auto *MaskElt = Mask->getAggregateElement(I);
4223 if (!MaskElt)
4224 break;
4225 auto *PassthruElt = Passthru->getAggregateElement(I);
4226 auto *VecElt = VecData ? VecData->getAggregateElement(I) : nullptr;
4227 if (isa<UndefValue>(MaskElt)) {
4228 if (PassthruElt)
4229 NewElements.push_back(PassthruElt);
4230 else if (VecElt)
4231 NewElements.push_back(VecElt);
4232 else
4233 return nullptr;
4234 }
4235 if (MaskElt->isNullValue()) {
4236 if (!PassthruElt)
4237 return nullptr;
4238 NewElements.push_back(PassthruElt);
4239 } else if (MaskElt->isOneValue()) {
4240 if (!VecElt)
4241 return nullptr;
4242 NewElements.push_back(VecElt);
4243 } else {
4244 return nullptr;
4245 }
4246 }
4247 if (NewElements.size() != FVTy->getNumElements())
4248 return nullptr;
4249 return ConstantVector::get(NewElements);
4250 }
4251 case Intrinsic::arm_mve_vctp8:
4252 case Intrinsic::arm_mve_vctp16:
4253 case Intrinsic::arm_mve_vctp32:
4254 case Intrinsic::arm_mve_vctp64: {
4255 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
4256 unsigned Lanes = FVTy->getNumElements();
4257 uint64_t Limit = Op->getZExtValue();
4258
4260 for (unsigned i = 0; i < Lanes; i++) {
4261 if (i < Limit)
4263 else
4265 }
4266 return ConstantVector::get(NCs);
4267 }
4268 return nullptr;
4269 }
4270 case Intrinsic::get_active_lane_mask: {
4271 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4272 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4273 if (Op0 && Op1) {
4274 unsigned Lanes = FVTy->getNumElements();
4275 uint64_t Base = Op0->getZExtValue();
4276 uint64_t Limit = Op1->getZExtValue();
4277
4279 for (unsigned i = 0; i < Lanes; i++) {
4280 if (Base + i < Limit)
4282 else
4284 }
4285 return ConstantVector::get(NCs);
4286 }
4287 return nullptr;
4288 }
4289 case Intrinsic::vector_extract: {
4290 auto *Idx = dyn_cast<ConstantInt>(Operands[1]);
4291 Constant *Vec = Operands[0];
4292 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4293 return nullptr;
4294
4295 unsigned NumElements = FVTy->getNumElements();
4296 unsigned VecNumElements =
4297 cast<FixedVectorType>(Vec->getType())->getNumElements();
4298 unsigned StartingIndex = Idx->getZExtValue();
4299
4300 // Extracting entire vector is nop
4301 if (NumElements == VecNumElements && StartingIndex == 0)
4302 return Vec;
4303
4304 for (unsigned I = StartingIndex, E = StartingIndex + NumElements; I < E;
4305 ++I) {
4306 Constant *Elt = Vec->getAggregateElement(I);
4307 if (!Elt)
4308 return nullptr;
4309 Result[I - StartingIndex] = Elt;
4310 }
4311
4312 return ConstantVector::get(Result);
4313 }
4314 case Intrinsic::vector_insert: {
4315 Constant *Vec = Operands[0];
4316 Constant *SubVec = Operands[1];
4317 auto *Idx = dyn_cast<ConstantInt>(Operands[2]);
4318 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4319 return nullptr;
4320
4321 unsigned SubVecNumElements =
4322 cast<FixedVectorType>(SubVec->getType())->getNumElements();
4323 unsigned VecNumElements =
4324 cast<FixedVectorType>(Vec->getType())->getNumElements();
4325 unsigned IdxN = Idx->getZExtValue();
4326 // Replacing entire vector with a subvec is nop
4327 if (SubVecNumElements == VecNumElements && IdxN == 0)
4328 return SubVec;
4329
4330 for (unsigned I = 0; I < VecNumElements; ++I) {
4331 Constant *Elt;
4332 if (I < IdxN + SubVecNumElements)
4333 Elt = SubVec->getAggregateElement(I - IdxN);
4334 else
4335 Elt = Vec->getAggregateElement(I);
4336 if (!Elt)
4337 return nullptr;
4338 Result[I] = Elt;
4339 }
4340 return ConstantVector::get(Result);
4341 }
4342 case Intrinsic::vector_interleave2:
4343 case Intrinsic::vector_interleave3:
4344 case Intrinsic::vector_interleave4:
4345 case Intrinsic::vector_interleave5:
4346 case Intrinsic::vector_interleave6:
4347 case Intrinsic::vector_interleave7:
4348 case Intrinsic::vector_interleave8: {
4349 unsigned NumElements =
4350 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4351 unsigned NumOperands = Operands.size();
4352 for (unsigned I = 0; I < NumElements; ++I) {
4353 for (unsigned J = 0; J < NumOperands; ++J) {
4354 Constant *Elt = Operands[J]->getAggregateElement(I);
4355 if (!Elt)
4356 return nullptr;
4357 Result[NumOperands * I + J] = Elt;
4358 }
4359 }
4360 return ConstantVector::get(Result);
4361 }
4362 case Intrinsic::wasm_dot: {
4363 unsigned NumElements =
4364 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4365
4366 assert(NumElements == 8 && Result.size() == 4 &&
4367 "wasm dot takes i16x8 and produces i32x4");
4368 assert(Ty->isIntegerTy());
4369 int32_t MulVector[8];
4370
4371 for (unsigned I = 0; I < NumElements; ++I) {
4372 ConstantInt *Elt0 =
4373 cast<ConstantInt>(Operands[0]->getAggregateElement(I));
4374 ConstantInt *Elt1 =
4375 cast<ConstantInt>(Operands[1]->getAggregateElement(I));
4376
4377 MulVector[I] = Elt0->getSExtValue() * Elt1->getSExtValue();
4378 }
4379 for (unsigned I = 0; I < Result.size(); I++) {
4380 int64_t IAdd = (int64_t)MulVector[I * 2] + (int64_t)MulVector[I * 2 + 1];
4381 Result[I] = ConstantInt::getSigned(Ty, IAdd, /*ImplicitTrunc=*/true);
4382 }
4383
4384 return ConstantVector::get(Result);
4385 }
4386 default:
4387 break;
4388 }
4389
4390 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4391 // Gather a column of constants.
4392 for (unsigned J = 0, JE = Operands.size(); J != JE; ++J) {
4393 // Some intrinsics use a scalar type for certain arguments.
4394 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, J, /*TTI=*/nullptr)) {
4395 Lane[J] = Operands[J];
4396 continue;
4397 }
4398
4399 Constant *Agg = Operands[J]->getAggregateElement(I);
4400 if (!Agg)
4401 return nullptr;
4402
4403 Lane[J] = Agg;
4404 }
4405
4406 // Use the regular scalar folding to simplify this column.
4407 Constant *Folded =
4408 ConstantFoldScalarCall(Name, IntrinsicID, Ty, Lane, TLI, Call);
4409 if (!Folded)
4410 return nullptr;
4411 Result[I] = Folded;
4412 }
4413
4414 return ConstantVector::get(Result);
4415}
4416
4417static Constant *ConstantFoldScalableVectorCall(
4418 StringRef Name, Intrinsic::ID IntrinsicID, ScalableVectorType *SVTy,
4419 ArrayRef<Constant *> Operands, const DataLayout &DL,
4420 const TargetLibraryInfo *TLI, const CallBase *Call) {
4421 switch (IntrinsicID) {
4422 case Intrinsic::aarch64_sve_convert_from_svbool: {
4423 Constant *Src = Operands[0];
4424 if (!Src->isNullValue())
4425 break;
4426
4427 return ConstantInt::getFalse(SVTy);
4428 }
4429 case Intrinsic::get_active_lane_mask: {
4430 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4431 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4432 if (Op0 && Op1 && Op0->getValue().uge(Op1->getValue()))
4433 return ConstantVector::getNullValue(SVTy);
4434 break;
4435 }
4436 case Intrinsic::vector_interleave2:
4437 case Intrinsic::vector_interleave3:
4438 case Intrinsic::vector_interleave4:
4439 case Intrinsic::vector_interleave5:
4440 case Intrinsic::vector_interleave6:
4441 case Intrinsic::vector_interleave7:
4442 case Intrinsic::vector_interleave8: {
4443 Constant *SplatVal = Operands[0]->getSplatValue();
4444 if (!SplatVal)
4445 return nullptr;
4446
4447 if (!llvm::all_equal(Operands))
4448 return nullptr;
4449
4450 return ConstantVector::getSplat(SVTy->getElementCount(), SplatVal);
4451 }
4452 default:
4453 break;
4454 }
4455
4456 // If trivially vectorizable, try folding it via the scalar call if all
4457 // operands are splats.
4458
4459 // TODO: ConstantFoldFixedVectorCall should probably check this too?
4460 if (!isTriviallyVectorizable(IntrinsicID))
4461 return nullptr;
4462
4464 for (auto [I, Op] : enumerate(Operands)) {
4465 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, I, /*TTI=*/nullptr)) {
4466 SplatOps.push_back(Op);
4467 continue;
4468 }
4469 Constant *Splat = Op->getSplatValue();
4470 if (!Splat)
4471 return nullptr;
4472 SplatOps.push_back(Splat);
4473 }
4474 Constant *Folded = ConstantFoldScalarCall(
4475 Name, IntrinsicID, SVTy->getElementType(), SplatOps, TLI, Call);
4476 if (!Folded)
4477 return nullptr;
4478 return ConstantVector::getSplat(SVTy->getElementCount(), Folded);
4479}
4480
4481static std::pair<Constant *, Constant *>
4482ConstantFoldScalarFrexpCall(Constant *Op, Type *IntTy) {
4483 if (isa<PoisonValue>(Op))
4484 return {Op, PoisonValue::get(IntTy)};
4485
4486 auto *ConstFP = dyn_cast<ConstantFP>(Op);
4487 if (!ConstFP)
4488 return {};
4489
4490 const APFloat &U = ConstFP->getValueAPF();
4491 int FrexpExp;
4492 APFloat FrexpMant = frexp(U, FrexpExp, APFloat::rmNearestTiesToEven);
4493 Constant *Result0 = ConstantFP::get(ConstFP->getType(), FrexpMant);
4494
4495 // The exponent is an "unspecified value" for inf/nan. We use zero to avoid
4496 // using undef.
4497 Constant *Result1 = FrexpMant.isFinite()
4498 ? ConstantInt::getSigned(IntTy, FrexpExp)
4499 : ConstantInt::getNullValue(IntTy);
4500 return {Result0, Result1};
4501}
4502
4503/// Handle intrinsics that return tuples, which may be tuples of vectors.
4504static Constant *
4505ConstantFoldStructCall(StringRef Name, Intrinsic::ID IntrinsicID,
4506 StructType *StTy, ArrayRef<Constant *> Operands,
4507 const DataLayout &DL, const TargetLibraryInfo *TLI,
4508 const CallBase *Call) {
4509
4510 switch (IntrinsicID) {
4511 case Intrinsic::frexp: {
4512 Type *Ty0 = StTy->getContainedType(0);
4513 Type *Ty1 = StTy->getContainedType(1)->getScalarType();
4514
4515 if (auto *FVTy0 = dyn_cast<FixedVectorType>(Ty0)) {
4516 SmallVector<Constant *, 4> Results0(FVTy0->getNumElements());
4517 SmallVector<Constant *, 4> Results1(FVTy0->getNumElements());
4518
4519 for (unsigned I = 0, E = FVTy0->getNumElements(); I != E; ++I) {
4520 Constant *Lane = Operands[0]->getAggregateElement(I);
4521 std::tie(Results0[I], Results1[I]) =
4522 ConstantFoldScalarFrexpCall(Lane, Ty1);
4523 if (!Results0[I])
4524 return nullptr;
4525 }
4526
4527 return ConstantStruct::get(StTy, ConstantVector::get(Results0),
4528 ConstantVector::get(Results1));
4529 }
4530
4531 auto [Result0, Result1] = ConstantFoldScalarFrexpCall(Operands[0], Ty1);
4532 if (!Result0)
4533 return nullptr;
4534 return ConstantStruct::get(StTy, Result0, Result1);
4535 }
4536 case Intrinsic::sincos: {
4537 Type *Ty = StTy->getContainedType(0);
4538 Type *TyScalar = Ty->getScalarType();
4539
4540 auto ConstantFoldScalarSincosCall =
4541 [&](Constant *Op) -> std::pair<Constant *, Constant *> {
4542 Constant *SinResult =
4543 ConstantFoldScalarCall(Name, Intrinsic::sin, TyScalar, Op, TLI, Call);
4544 Constant *CosResult =
4545 ConstantFoldScalarCall(Name, Intrinsic::cos, TyScalar, Op, TLI, Call);
4546 return std::make_pair(SinResult, CosResult);
4547 };
4548
4549 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty)) {
4550 SmallVector<Constant *> SinResults(FVTy->getNumElements());
4551 SmallVector<Constant *> CosResults(FVTy->getNumElements());
4552
4553 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4554 Constant *Lane = Operands[0]->getAggregateElement(I);
4555 std::tie(SinResults[I], CosResults[I]) =
4556 ConstantFoldScalarSincosCall(Lane);
4557 if (!SinResults[I] || !CosResults[I])
4558 return nullptr;
4559 }
4560
4561 return ConstantStruct::get(StTy, ConstantVector::get(SinResults),
4562 ConstantVector::get(CosResults));
4563 }
4564
4565 auto [SinResult, CosResult] = ConstantFoldScalarSincosCall(Operands[0]);
4566 if (!SinResult || !CosResult)
4567 return nullptr;
4568 return ConstantStruct::get(StTy, SinResult, CosResult);
4569 }
4570 case Intrinsic::vector_deinterleave2:
4571 case Intrinsic::vector_deinterleave3:
4572 case Intrinsic::vector_deinterleave4:
4573 case Intrinsic::vector_deinterleave5:
4574 case Intrinsic::vector_deinterleave6:
4575 case Intrinsic::vector_deinterleave7:
4576 case Intrinsic::vector_deinterleave8: {
4577 unsigned NumResults = StTy->getNumElements();
4578 auto *Vec = Operands[0];
4579 auto *VecTy = cast<VectorType>(Vec->getType());
4580
4581 ElementCount ResultEC =
4582 VecTy->getElementCount().divideCoefficientBy(NumResults);
4583
4584 if (auto *EltC = Vec->getSplatValue()) {
4585 auto *ResultVec = ConstantVector::getSplat(ResultEC, EltC);
4586 SmallVector<Constant *, 8> Results(NumResults, ResultVec);
4587 return ConstantStruct::get(StTy, Results);
4588 }
4589
4590 if (!ResultEC.isFixed())
4591 return nullptr;
4592
4593 unsigned NumElements = ResultEC.getFixedValue();
4595 SmallVector<Constant *> Elements(NumElements);
4596 for (unsigned I = 0; I != NumResults; ++I) {
4597 for (unsigned J = 0; J != NumElements; ++J) {
4598 Constant *Elt = Vec->getAggregateElement(J * NumResults + I);
4599 if (!Elt)
4600 return nullptr;
4601 Elements[J] = Elt;
4602 }
4603 Results[I] = ConstantVector::get(Elements);
4604 }
4605 return ConstantStruct::get(StTy, Results);
4606 }
4607 default:
4608 // TODO: Constant folding of vector intrinsics that fall through here does
4609 // not work (e.g. overflow intrinsics)
4610 return ConstantFoldScalarCall(Name, IntrinsicID, StTy, Operands, TLI, Call);
4611 }
4612
4613 return nullptr;
4614}
4615
4616} // end anonymous namespace
4617
4619 Constant *RHS, Type *Ty,
4622 // Ensure we check flags like StrictFP that might prevent this from getting
4623 // folded before generating a result.
4624 if (Call && !canConstantFoldCallTo(Call, Call->getCalledFunction()))
4625 return nullptr;
4626 return ConstantFoldIntrinsicCall2(ID, Ty, {LHS, RHS}, Call);
4627}
4628
4630 ArrayRef<Constant *> Operands,
4631 const TargetLibraryInfo *TLI,
4632 bool AllowNonDeterministic) {
4633 if (Call->isNoBuiltin())
4634 return nullptr;
4635 if (!F->hasName())
4636 return nullptr;
4637
4638 // If this is not an intrinsic and not recognized as a library call, bail out.
4639 Intrinsic::ID IID = F->getIntrinsicID();
4640 if (IID == Intrinsic::not_intrinsic) {
4641 if (!TLI)
4642 return nullptr;
4643 LibFunc LibF;
4644 if (!TLI->getLibFunc(*F, LibF))
4645 return nullptr;
4646 }
4647
4648 // Conservatively assume that floating-point libcalls may be
4649 // non-deterministic.
4650 Type *Ty = F->getReturnType();
4651 if (!AllowNonDeterministic && Ty->isFPOrFPVectorTy())
4652 return nullptr;
4653
4654 StringRef Name = F->getName();
4655 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty))
4656 return ConstantFoldFixedVectorCall(
4657 Name, IID, FVTy, Operands, F->getDataLayout(), TLI, Call);
4658
4659 if (auto *SVTy = dyn_cast<ScalableVectorType>(Ty))
4660 return ConstantFoldScalableVectorCall(
4661 Name, IID, SVTy, Operands, F->getDataLayout(), TLI, Call);
4662
4663 if (auto *StTy = dyn_cast<StructType>(Ty))
4664 return ConstantFoldStructCall(Name, IID, StTy, Operands,
4665 F->getDataLayout(), TLI, Call);
4666
4667 // TODO: If this is a library function, we already discovered that above,
4668 // so we should pass the LibFunc, not the name (and it might be better
4669 // still to separate intrinsic handling from libcalls).
4670 return ConstantFoldScalarCall(Name, IID, Ty, Operands, TLI, Call);
4671}
4672
4674 const TargetLibraryInfo *TLI) {
4675 // FIXME: Refactor this code; this duplicates logic in LibCallsShrinkWrap
4676 // (and to some extent ConstantFoldScalarCall).
4677 if (Call->isNoBuiltin() || Call->isStrictFP())
4678 return false;
4679 Function *F = Call->getCalledFunction();
4680 if (!F)
4681 return false;
4682
4683 LibFunc Func;
4684 if (!TLI || !TLI->getLibFunc(*F, Func))
4685 return false;
4686
4687 if (Call->arg_size() == 1) {
4688 if (ConstantFP *OpC = dyn_cast<ConstantFP>(Call->getArgOperand(0))) {
4689 const APFloat &Op = OpC->getValueAPF();
4690 switch (Func) {
4691 case LibFunc_logl:
4692 case LibFunc_log:
4693 case LibFunc_logf:
4694 case LibFunc_log2l:
4695 case LibFunc_log2:
4696 case LibFunc_log2f:
4697 case LibFunc_log10l:
4698 case LibFunc_log10:
4699 case LibFunc_log10f:
4700 return Op.isNaN() || (!Op.isZero() && !Op.isNegative());
4701
4702 case LibFunc_ilogb:
4703 return !Op.isNaN() && !Op.isZero() && !Op.isInfinity();
4704
4705 case LibFunc_expl:
4706 case LibFunc_exp:
4707 case LibFunc_expf:
4708 // FIXME: These boundaries are slightly conservative.
4709 if (OpC->getType()->isDoubleTy())
4710 return !(Op < APFloat(-745.0) || Op > APFloat(709.0));
4711 if (OpC->getType()->isFloatTy())
4712 return !(Op < APFloat(-103.0f) || Op > APFloat(88.0f));
4713 break;
4714
4715 case LibFunc_exp2l:
4716 case LibFunc_exp2:
4717 case LibFunc_exp2f:
4718 // FIXME: These boundaries are slightly conservative.
4719 if (OpC->getType()->isDoubleTy())
4720 return !(Op < APFloat(-1074.0) || Op > APFloat(1023.0));
4721 if (OpC->getType()->isFloatTy())
4722 return !(Op < APFloat(-149.0f) || Op > APFloat(127.0f));
4723 break;
4724
4725 case LibFunc_sinl:
4726 case LibFunc_sin:
4727 case LibFunc_sinf:
4728 case LibFunc_cosl:
4729 case LibFunc_cos:
4730 case LibFunc_cosf:
4731 return !Op.isInfinity();
4732
4733 case LibFunc_tanl:
4734 case LibFunc_tan:
4735 case LibFunc_tanf: {
4736 // FIXME: Stop using the host math library.
4737 // FIXME: The computation isn't done in the right precision.
4738 Type *Ty = OpC->getType();
4739 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy())
4740 return ConstantFoldFP(tan, OpC->getValueAPF(), Ty) != nullptr;
4741 break;
4742 }
4743
4744 case LibFunc_atan:
4745 case LibFunc_atanf:
4746 case LibFunc_atanl:
4747 // Per POSIX, this MAY fail if Op is denormal. We choose not failing.
4748 return true;
4749
4750 case LibFunc_asinl:
4751 case LibFunc_asin:
4752 case LibFunc_asinf:
4753 case LibFunc_acosl:
4754 case LibFunc_acos:
4755 case LibFunc_acosf:
4756 return !(Op < APFloat::getOne(Op.getSemantics(), true) ||
4757 Op > APFloat::getOne(Op.getSemantics()));
4758
4759 case LibFunc_sinh:
4760 case LibFunc_cosh:
4761 case LibFunc_sinhf:
4762 case LibFunc_coshf:
4763 case LibFunc_sinhl:
4764 case LibFunc_coshl:
4765 // FIXME: These boundaries are slightly conservative.
4766 if (OpC->getType()->isDoubleTy())
4767 return !(Op < APFloat(-710.0) || Op > APFloat(710.0));
4768 if (OpC->getType()->isFloatTy())
4769 return !(Op < APFloat(-89.0f) || Op > APFloat(89.0f));
4770 break;
4771
4772 case LibFunc_sqrtl:
4773 case LibFunc_sqrt:
4774 case LibFunc_sqrtf:
4775 return Op.isNaN() || Op.isZero() || !Op.isNegative();
4776
4777 // FIXME: Add more functions: sqrt_finite, atanh, expm1, log1p,
4778 // maybe others?
4779 default:
4780 break;
4781 }
4782 }
4783 }
4784
4785 if (Call->arg_size() == 2) {
4786 ConstantFP *Op0C = dyn_cast<ConstantFP>(Call->getArgOperand(0));
4787 ConstantFP *Op1C = dyn_cast<ConstantFP>(Call->getArgOperand(1));
4788 if (Op0C && Op1C) {
4789 const APFloat &Op0 = Op0C->getValueAPF();
4790 const APFloat &Op1 = Op1C->getValueAPF();
4791
4792 switch (Func) {
4793 case LibFunc_powl:
4794 case LibFunc_pow:
4795 case LibFunc_powf: {
4796 // FIXME: Stop using the host math library.
4797 // FIXME: The computation isn't done in the right precision.
4798 Type *Ty = Op0C->getType();
4799 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy()) {
4800 if (Ty == Op1C->getType())
4801 return ConstantFoldBinaryFP(pow, Op0, Op1, Ty) != nullptr;
4802 }
4803 break;
4804 }
4805
4806 case LibFunc_fmodl:
4807 case LibFunc_fmod:
4808 case LibFunc_fmodf:
4809 case LibFunc_remainderl:
4810 case LibFunc_remainder:
4811 case LibFunc_remainderf:
4812 return Op0.isNaN() || Op1.isNaN() ||
4813 (!Op0.isInfinity() && !Op1.isZero());
4814
4815 case LibFunc_atan2:
4816 case LibFunc_atan2f:
4817 case LibFunc_atan2l:
4818 // Although IEEE-754 says atan2(+/-0.0, +/-0.0) are well-defined, and
4819 // GLIBC and MSVC do not appear to raise an error on those, we
4820 // cannot rely on that behavior. POSIX and C11 say that a domain error
4821 // may occur, so allow for that possibility.
4822 return !Op0.isZero() || !Op1.isZero();
4823
4824 default:
4825 break;
4826 }
4827 }
4828 }
4829
4830 return false;
4831}
4832
4834 unsigned CastOp, const DataLayout &DL,
4835 PreservedCastFlags *Flags) {
4836 switch (CastOp) {
4837 case Instruction::BitCast:
4838 // Bitcast is always lossless.
4839 return ConstantFoldCastOperand(Instruction::BitCast, C, InvCastTo, DL);
4840 case Instruction::Trunc: {
4841 auto *ZExtC = ConstantFoldCastOperand(Instruction::ZExt, C, InvCastTo, DL);
4842 if (Flags) {
4843 // Truncation back on ZExt value is always NUW.
4844 Flags->NUW = true;
4845 // Test positivity of C.
4846 auto *SExtC =
4847 ConstantFoldCastOperand(Instruction::SExt, C, InvCastTo, DL);
4848 Flags->NSW = ZExtC == SExtC;
4849 }
4850 return ZExtC;
4851 }
4852 case Instruction::SExt:
4853 case Instruction::ZExt: {
4854 auto *InvC = ConstantExpr::getTrunc(C, InvCastTo);
4855 auto *CastInvC = ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4856 // Must satisfy CastOp(InvC) == C.
4857 if (!CastInvC || CastInvC != C)
4858 return nullptr;
4859 if (Flags && CastOp == Instruction::ZExt) {
4860 auto *SExtInvC =
4861 ConstantFoldCastOperand(Instruction::SExt, InvC, C->getType(), DL);
4862 // Test positivity of InvC.
4863 Flags->NNeg = CastInvC == SExtInvC;
4864 }
4865 return InvC;
4866 }
4867 case Instruction::FPExt: {
4868 Constant *InvC =
4869 ConstantFoldCastOperand(Instruction::FPTrunc, C, InvCastTo, DL);
4870 if (InvC) {
4871 Constant *CastInvC =
4872 ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4873 if (CastInvC == C)
4874 return InvC;
4875 }
4876 return nullptr;
4877 }
4878 default:
4879 return nullptr;
4880 }
4881}
4882
4884 const DataLayout &DL,
4885 PreservedCastFlags *Flags) {
4886 return getLosslessInvCast(C, DestTy, Instruction::ZExt, DL, Flags);
4887}
4888
4890 const DataLayout &DL,
4891 PreservedCastFlags *Flags) {
4892 return getLosslessInvCast(C, DestTy, Instruction::SExt, DL, Flags);
4893}
4894
4895void TargetFolder::anchor() {}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
#define X(NUM, ENUM, NAME)
Definition ELF.h:851
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static Constant * FoldBitCast(Constant *V, Type *DestTy)
static ConstantFP * flushDenormalConstant(Type *Ty, const APFloat &APF, DenormalMode::DenormalModeKind Mode)
Constant * getConstantAtOffset(Constant *Base, APInt Offset, const DataLayout &DL)
If this Offset points exactly to the start of an aggregate element, return that element,...
static cl::opt< bool > DisableFPCallFolding("disable-fp-call-folding", cl::desc("Disable constant-folding of FP intrinsics and libcalls."), cl::init(false), cl::Hidden)
static ConstantFP * flushDenormalConstantFP(ConstantFP *CFP, const Instruction *Inst, bool IsOutput)
static DenormalMode getInstrDenormalMode(const Instruction *CtxI, Type *Ty)
Return the denormal mode that can be assumed when executing a floating point operation at CtxI.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
This file defines the DenseMap class.
Hexagon Common GEP
amode Optimize addressing mode
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
static bool InRange(int64_t Value, unsigned short Shift, int LBound, int HBound)
This file contains the definitions of the enumerations and flags associated with NVVM Intrinsics,...
if(PassOpts->AAPipeline)
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
This file contains some templates that are useful if you are working with the STL at all.
This file implements the SmallBitVector class.
This file defines the SmallVector class.
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39
The Input class is used to parse a yaml document into in-memory structs and vectors.
static constexpr roundingMode rmTowardZero
Definition APFloat.h:348
llvm::RoundingMode roundingMode
IEEE-754R 4.3: Rounding-direction attributes.
Definition APFloat.h:342
static const fltSemantics & IEEEdouble()
Definition APFloat.h:297
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:347
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:344
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:346
static const fltSemantics & IEEEhalf()
Definition APFloat.h:294
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:349
opStatus
IEEE-754R 7: Default exception handling.
Definition APFloat.h:360
static APFloat getQNaN(const fltSemantics &Sem, bool Negative=false, const APInt *payload=nullptr)
Factory for QNaN values.
Definition APFloat.h:1175
opStatus divide(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1263
void copySign(const APFloat &RHS)
Definition APFloat.h:1357
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:5890
opStatus subtract(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1245
bool isNegative() const
Definition APFloat.h:1516
LLVM_ABI double convertToDouble() const
Converts this APFloat to host double value.
Definition APFloat.cpp:5949
bool isPosInfinity() const
Definition APFloat.h:1529
bool isNormal() const
Definition APFloat.h:1520
bool isDenormal() const
Definition APFloat.h:1517
opStatus add(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1236
const fltSemantics & getSemantics() const
Definition APFloat.h:1524
bool isNonZero() const
Definition APFloat.h:1525
bool isFinite() const
Definition APFloat.h:1521
bool isNaN() const
Definition APFloat.h:1514
static APFloat getOne(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative One.
Definition APFloat.h:1143
opStatus multiply(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1254
LLVM_ABI float convertToFloat() const
Converts this APFloat to host float value.
Definition APFloat.cpp:5977
bool isSignaling() const
Definition APFloat.h:1518
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
Definition APFloat.h:1290
bool isZero() const
Definition APFloat.h:1512
opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.h:1387
opStatus mod(const APFloat &RHS)
Definition APFloat.h:1281
bool isNegInfinity() const
Definition APFloat.h:1530
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1303
void changeSign()
Definition APFloat.h:1352
static APFloat getZero(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Zero.
Definition APFloat.h:1134
bool isInfinity() const
Definition APFloat.h:1513
Class for arbitrary precision integers.
Definition APInt.h:78
LLVM_ABI APInt umul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2022
LLVM_ABI APInt usub_sat(const APInt &RHS) const
Definition APInt.cpp:2106
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition APInt.h:424
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1563
LLVM_ABI uint64_t extractBitsAsZExtValue(unsigned numBits, unsigned bitPosition) const
Definition APInt.cpp:520
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1075
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:207
APInt abs() const
Get the absolute value.
Definition APInt.h:1818
LLVM_ABI APInt sadd_sat(const APInt &RHS) const
Definition APInt.cpp:2077
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1208
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1999
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1189
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
Definition APInt.cpp:1708
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1511
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1118
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1979
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1986
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1662
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition APInt.h:1621
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:220
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition APInt.cpp:1083
LLVM_ABI APInt uadd_sat(const APInt &RHS) const
Definition APInt.cpp:2087
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition APInt.h:834
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2011
LLVM_ABI APInt sext(unsigned width) const
Sign extend to a new width.
Definition APInt.cpp:1027
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
bool slt(const APInt &RHS) const
Signed less than comparison.
Definition APInt.h:1137
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201
LLVM_ABI APInt extractBits(unsigned numBits, unsigned bitPosition) const
Return an APInt with the extracted bits [bitPosition,bitPosition+numBits).
Definition APInt.cpp:482
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1992
bool isOne() const
Determine if this is a value of 1.
Definition APInt.h:390
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:858
LLVM_ABI APInt ssub_sat(const APInt &RHS) const
Definition APInt.cpp:2096
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
ArrayRef - Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
size_t size() const
size - Get the array size.
Definition ArrayRef.h:142
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
static LLVM_ABI unsigned isEliminableCastPair(Instruction::CastOps firstOpcode, Instruction::CastOps secondOpcode, Type *SrcTy, Type *MidTy, Type *DstTy, const DataLayout *DL)
Determine how a pair of casts can be eliminated, if they can be at all.
static LLVM_ABI bool castIsValid(Instruction::CastOps op, Type *SrcTy, Type *DstTy)
This method can be used to determine if a cast from SrcTy to DstTy using Opcode op is valid or not.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:676
bool isSigned() const
Definition InstrTypes.h:930
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:827
static bool isFPPredicate(Predicate P)
Definition InstrTypes.h:770
static Constant * get(LLVMContext &Context, ArrayRef< ElementTy > Elts)
get() constructor - Return a constant with array type with an element count and element type matching...
Definition Constants.h:859
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getExtractElement(Constant *Vec, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI bool isDesirableCastOp(unsigned Opcode)
Whether creating a constant expression for this cast is desirable.
static LLVM_ABI Constant * getCast(unsigned ops, Constant *C, Type *Ty, bool OnlyIfReduced=false)
Convenience function for getting a Cast operation.
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
static Constant * getPtrAdd(Constant *Ptr, Constant *Offset, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReduced=nullptr)
Create a getelementptr i8, ptr, offset constant expression.
Definition Constants.h:1472
static LLVM_ABI Constant * getInsertElement(Constant *Vec, Constant *Elt, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI Constant * getShuffleVector(Constant *V1, Constant *V2, ArrayRef< int > Mask, Type *OnlyIfReducedTy=nullptr)
static bool isSupportedGetElementPtr(const Type *SrcElemTy)
Whether creating a constant expression for this getelementptr type is supported.
Definition Constants.h:1573
static LLVM_ABI Constant * get(unsigned Opcode, Constant *C1, Constant *C2, unsigned Flags=0, Type *OnlyIfReducedTy=nullptr)
get - Return a binary or shift operator constant expression, folding if possible.
static LLVM_ABI bool isDesirableBinOp(unsigned Opcode)
Whether creating a constant expression for this binary operator is desirable.
static Constant * getGetElementPtr(Type *Ty, Constant *C, ArrayRef< Constant * > IdxList, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReducedTy=nullptr)
Getelementptr form.
Definition Constants.h:1445
static LLVM_ABI Constant * getBitCast(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getTrunc(Constant *C, Type *Ty, bool OnlyIfReduced=false)
ConstantFP - Floating Point Values [float, double].
Definition Constants.h:420
const APFloat & getValueAPF() const
Definition Constants.h:463
static LLVM_ABI Constant * getInfinity(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getZero(Type *Ty, bool Negative=false)
static LLVM_ABI Constant * getNaN(Type *Ty, bool Negative=false, uint64_t Payload=0)
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=false)
Return a ConstantInt with the specified value for the specified type.
Definition Constants.h:135
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
Definition Constants.h:174
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
static LLVM_ABI Constant * get(ArrayRef< Constant * > V)
This is an important base class in LLVM.
Definition Constant.h:43
LLVM_ABI Constant * getSplatValue(bool AllowPoison=false) const
If all elements of the vector constant have the same value, return that value.
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI Constant * getAggregateElement(unsigned Elt) const
For aggregates (struct/array/vector) return the constant that corresponds to the specified element if...
LLVM_ABI bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition Constants.cpp:74
Constrained floating point compare intrinsics.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI std::optional< RoundingMode > getRoundingMode() const
Wrapper for a function that represents a value that functionally represents the original function.
Definition Constants.h:1118
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:178
iterator end()
Definition DenseMap.h:81
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:241
static LLVM_ABI bool compare(const APFloat &LHS, const APFloat &RHS, FCmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
This provides a helper for copying FMF from an instruction or setting specified flags.
Definition IRBuilder.h:93
Class to represent fixed width SIMD vectors.
unsigned getNumElements() const
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:873
DenormalMode getDenormalMode(const fltSemantics &FPType) const
Returns the denormal handling type for the default rounding mode of the function.
Definition Function.cpp:804
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags inBounds()
GEPNoWrapFlags withoutNoUnsignedSignedWrap() const
static GEPNoWrapFlags noUnsignedWrap()
bool hasNoUnsignedSignedWrap() const
bool isInBounds() const
static LLVM_ABI Type * getIndexedType(Type *Ty, ArrayRef< Value * > IdxList)
Returns the result type of a getelementptr with the given source element type and indexes.
PointerType * getType() const
Global values are always pointers.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this global belongs to.
Definition Globals.cpp:141
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
bool isEquality() const
Return true if this predicate is either EQ or NE.
bool isCast() const
bool isBinaryOp() const
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
bool isUnaryOp() const
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:354
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
static APInt getSaturationPoint(Intrinsic::ID ID, unsigned numBits)
Min/max intrinsics are monotonic, they operate on a fixed-bitwidth values, so there is a certain thre...
static ICmpInst::Predicate getPredicate(Intrinsic::ID ID)
Returns the comparison predicate underlying the intrinsic.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Class to represent scalable SIMD vectors.
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
SmallBitVector & set()
iterator_range< const_set_bits_iterator > set_bits() const
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
StringRef - Represent a constant reference to a string, i.e.
Definition StringRef.h:55
Used to lazily calculate structure layout information for a target machine, based on the DataLayout s...
Definition DataLayout.h:736
LLVM_ABI unsigned getElementContainingOffset(uint64_t FixedOffset) const
Given a valid byte offset into the structure, returns the structure index that contains it.
TypeSize getElementOffset(unsigned Idx) const
Definition DataLayout.h:767
Class to represent struct types.
unsigned getNumElements() const
Random access to the elements.
Provides information about what library functions are available for the current target.
bool has(LibFunc F) const
Tests whether a library function is available.
bool getLibFunc(StringRef funcName, LibFunc &F) const
Searches for a particular function name.
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI IntegerType * getInt64Ty(LLVMContext &C)
Definition Type.cpp:314
bool isByteTy() const
True if this is an instance of ByteType.
Definition Type.h:242
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:290
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:313
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:284
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
Definition Type.h:57
@ FloatTyID
32-bit floating point type
Definition Type.h:59
@ DoubleTyID
64-bit floating point type
Definition Type.h:60
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:370
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:201
static LLVM_ABI IntegerType * getInt16Ty(LLVMContext &C)
Definition Type.cpp:312
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:328
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:130
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:236
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
Definition Type.cpp:310
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition Type.h:186
bool isPtrOrPtrVectorTy() const
Return true if this is a pointer type or a vector of pointer types.
Definition Type.h:287
bool isX86_AMXTy() const
Return true if this is X86 AMX.
Definition Type.h:202
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:317
Type * getContainedType(unsigned i) const
This method is used to implement the type iterator (defined at the end of the file).
Definition Type.h:399
LLVM_ABI const fltSemantics & getFltSemantics() const
Definition Type.cpp:110
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
A Use represents the edge between a Value definition and its users.
Definition Use.h:35
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
LLVM_ABI uint64_t getPointerDereferenceableBytes(const DataLayout &DL, bool &CanBeNull, bool &CanBeFreed) const
Returns the number of bytes known to be dereferenceable for the pointer value.
Definition Value.cpp:890
Base class of all SIMD vector types.
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Type * getElementType() const
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition TypeSize.h:171
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
Definition TypeSize.h:252
static constexpr bool isKnownGE(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:237
const ParentTy * getParent() const
Definition ilist_node.h:34
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
const APInt & smin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be signed.
Definition APInt.h:2277
const APInt & smax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be signed.
Definition APInt.h:2282
const APInt & umin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be unsigned.
Definition APInt.h:2287
const APInt & umax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be unsigned.
Definition APInt.h:2292
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:48
initializer< Ty > init(const Ty &Val)
@ ebStrict
This corresponds to "fpexcept.strict".
Definition FPEnv.h:42
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
constexpr double pi
APFloat::roundingMode GetFMARoundingMode(Intrinsic::ID IntrinsicID)
DenormalMode GetNVVMDenormMode(bool ShouldFTZ)
bool FPToIntegerIntrinsicNaNZero(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFDivRoundingMode(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicResultIsSigned(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFPToIntegerRoundingMode(Intrinsic::ID IntrinsicID)
bool RCPShouldFTZ(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FDivShouldFTZ(Intrinsic::ID IntrinsicID)
bool FAddShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxIsXorSignAbs(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFMulRoundingMode(Intrinsic::ID IntrinsicID)
bool UnaryMathIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFAddRoundingMode(Intrinsic::ID IntrinsicID)
bool FMAShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMulShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetRCPRoundingMode(Intrinsic::ID IntrinsicID)
bool FMinFMaxPropagatesNaNs(Intrinsic::ID IntrinsicID)
NodeAddr< FuncNode * > Func
Definition RDFGraph.h:393
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:316
@ Offset
Definition DWP.cpp:532
LLVM_ABI Constant * ConstantFoldBinaryIntrinsic(Intrinsic::ID ID, Constant *LHS, Constant *RHS, Type *Ty, Instruction *FMFSource)
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1739
LLVM_ABI Constant * ConstantFoldLoadThroughBitcast(Constant *C, Type *DestTy, const DataLayout &DL)
ConstantFoldLoadThroughBitcast - try to cast constant to destination type returning null if unsuccess...
static double log2(double V)
LLVM_ABI Constant * ConstantFoldSelectInstruction(Constant *Cond, Constant *V1, Constant *V2)
Attempt to constant fold a select instruction with the specified operands.
LLVM_ABI Constant * ConstantFoldFPInstOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL, const Instruction *I, bool AllowNonDeterministic=true)
Attempt to constant fold a floating point binary operation with the specified operands,...
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2554
LLVM_ABI bool canConstantFoldCallTo(const CallBase *Call, const Function *F)
canConstantFoldCallTo - Return true if its even possible to fold a call to the specified function.
unsigned getPointerAddressSpace(const Type *T)
Definition SPIRVUtils.h:375
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
LLVM_ABI Constant * ConstantFoldInstruction(const Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
APFloat abs(APFloat X)
Returns the absolute value of the argument.
Definition APFloat.h:1630
LLVM_ABI Constant * ConstantFoldCompareInstruction(CmpInst::Predicate Predicate, Constant *C1, Constant *C2)
LLVM_ABI Constant * ConstantFoldUnaryInstruction(unsigned Opcode, Constant *V)
LLVM_ABI bool IsConstantOffsetFromGlobal(Constant *C, GlobalValue *&GV, APInt &Offset, const DataLayout &DL, DSOLocalEquivalent **DSOEquiv=nullptr)
If this constant is a constant offset from a global, return the global and the constant.
LLVM_ABI bool isMathLibCallNoop(const CallBase *Call, const TargetLibraryInfo *TLI)
Check whether the given call has no side-effects.
LLVM_ABI Constant * ReadByteArrayFromGlobal(const GlobalVariable *GV, uint64_t Offset)
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition APFloat.h:1710
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1601
bool isa_and_nonnull(const Y &Val)
Definition Casting.h:676
LLVM_ABI Constant * ConstantFoldCall(const CallBase *Call, Function *F, ArrayRef< Constant * > Operands, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldCall - Attempt to constant fold a call to the specified function with the specified argum...
APFloat frexp(const APFloat &X, int &Exp, APFloat::roundingMode RM)
Equivalent of C standard library function.
Definition APFloat.h:1622
LLVM_ABI Constant * ConstantFoldExtractValueInstruction(Constant *Agg, ArrayRef< unsigned > Idxs)
Attempt to constant fold an extractvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1746
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 maxNum semantics.
Definition APFloat.h:1665
LLVM_ABI Constant * ConstantFoldLoadFromUniformValue(Constant *C, Type *Ty, const DataLayout &DL)
If C is a uniform value where all bits are the same (either all zero, all ones, all undef or all pois...
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
LLVM_ABI Constant * FlushFPConstant(Constant *Operand, const Instruction *I, bool IsOutput)
Attempt to flush float point constant according to denormal mode set in the instruction's parent func...
LLVM_ABI Constant * getLosslessUnsignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_READONLY APFloat minimumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimumNumber semantics.
Definition APFloat.h:1696
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1610
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI Constant * getLosslessSignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
LLVM_ABI bool intrinsicPropagatesPoison(Intrinsic::ID IID)
Return whether this intrinsic propagates poison for all operands.
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 minNum semantics.
Definition APFloat.h:1646
@ Sub
Subtraction of integers.
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
DWARFExpression::Operation Op
RoundingMode
Rounding mode.
@ NearestTiesToEven
roundTiesToEven.
@ Dynamic
Denotes mode unknown at compile time.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
constexpr unsigned BitWidth
LLVM_ABI Constant * getLosslessInvCast(Constant *C, Type *InvCastTo, unsigned CastOp, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Try to cast C to InvC losslessly, satisfying CastOp(InvC) equals C, or CastOp(InvC) is a refined valu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list.
Definition STLExtras.h:2166
LLVM_ABI Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
LLVM_ABI Constant * ConstantFoldInsertValueInstruction(Constant *Agg, Constant *Val, ArrayRef< unsigned > Idxs)
Attempt to constant fold an insertvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty, APInt Offset, const DataLayout &DL)
Return the value that a load from C with offset Offset would produce if it is constant and determinab...
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition APFloat.h:1683
LLVM_READONLY APFloat maximumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximumNumber semantics.
Definition APFloat.h:1723
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
LLVM_ABI bool isTriviallyVectorizable(Intrinsic::ID ID)
Identify if the intrinsic is trivially vectorizable.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
Definition Casting.h:866
LLVM_ABI Constant * ConstantFoldBinaryInstruction(unsigned Opcode, Constant *V1, Constant *V2)
Represent subnormal handling kind for floating point instruction inputs and outputs.
DenormalModeKind Input
Denormal treatment kind for floating point instruction inputs in the default floating-point environme...
DenormalModeKind
Represent handled modes for denormal (aka subnormal) modes in the floating point environment.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
@ PositiveZero
Denormals are flushed to positive zero.
@ Dynamic
Denormals have unknown treatment.
@ IEEE
IEEE-754 denormal numbers preserved.
DenormalModeKind Output
Denormal flushing mode for floating point instruction results in the default floating point environme...
static constexpr DenormalMode getDynamic()
static constexpr DenormalMode getIEEE()
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:58