LLVM 23.0.0git
ConstantFolding.cpp
Go to the documentation of this file.
1//===-- ConstantFolding.cpp - Fold instructions into constants ------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines routines for folding instructions into constants.
10//
11// Also, to supplement the basic IR ConstantExpr simplifications,
12// this file defines some additional folding routines that can make use of
13// DataLayout information. These functions cannot go in IR due to library
14// dependency issues.
15//
16//===----------------------------------------------------------------------===//
17
19#include "llvm/ADT/APFloat.h"
20#include "llvm/ADT/APInt.h"
21#include "llvm/ADT/APSInt.h"
22#include "llvm/ADT/ArrayRef.h"
23#include "llvm/ADT/DenseMap.h"
24#include "llvm/ADT/STLExtras.h"
27#include "llvm/ADT/StringRef.h"
32#include "llvm/Config/config.h"
33#include "llvm/IR/Constant.h"
35#include "llvm/IR/Constants.h"
36#include "llvm/IR/DataLayout.h"
38#include "llvm/IR/Function.h"
39#include "llvm/IR/GlobalValue.h"
41#include "llvm/IR/InstrTypes.h"
42#include "llvm/IR/Instruction.h"
45#include "llvm/IR/Intrinsics.h"
46#include "llvm/IR/IntrinsicsAArch64.h"
47#include "llvm/IR/IntrinsicsAMDGPU.h"
48#include "llvm/IR/IntrinsicsARM.h"
49#include "llvm/IR/IntrinsicsNVPTX.h"
50#include "llvm/IR/IntrinsicsWebAssembly.h"
51#include "llvm/IR/IntrinsicsX86.h"
53#include "llvm/IR/Operator.h"
54#include "llvm/IR/Type.h"
55#include "llvm/IR/Value.h"
60#include <cassert>
61#include <cerrno>
62#include <cfenv>
63#include <cmath>
64#include <cstdint>
65
66using namespace llvm;
67
69 "disable-fp-call-folding",
70 cl::desc("Disable constant-folding of FP intrinsics and libcalls."),
71 cl::init(false), cl::Hidden);
72
73namespace {
74
75//===----------------------------------------------------------------------===//
76// Constant Folding internal helper functions
77//===----------------------------------------------------------------------===//
78
79static Constant *foldConstVectorToAPInt(APInt &Result, Type *DestTy,
80 Constant *C, Type *SrcEltTy,
81 unsigned NumSrcElts,
82 const DataLayout &DL) {
83 // Now that we know that the input value is a vector of integers, just shift
84 // and insert them into our result.
85 unsigned BitShift = DL.getTypeSizeInBits(SrcEltTy);
86 for (unsigned i = 0; i != NumSrcElts; ++i) {
87 Constant *Element;
88 if (DL.isLittleEndian())
89 Element = C->getAggregateElement(NumSrcElts - i - 1);
90 else
91 Element = C->getAggregateElement(i);
92
93 if (isa_and_nonnull<UndefValue>(Element)) {
94 Result <<= BitShift;
95 continue;
96 }
97
98 auto *ElementCI = dyn_cast_or_null<ConstantInt>(Element);
99 if (!ElementCI)
100 return ConstantExpr::getBitCast(C, DestTy);
101
102 Result <<= BitShift;
103 Result |= ElementCI->getValue().zext(Result.getBitWidth());
104 }
105
106 return nullptr;
107}
108
109/// Check whether folding this bitcast into a byte vector would mix poison and
110/// non-poison bits in the same output lane. While integer types track poison on
111/// a per-value basis, byte types track it on a per-bit basis. However,
112/// `ConstantByte` cannot represent values with both poison and non-poison bits.
113///
114/// Source elements are grouped by the output lane they map to. Returns true if
115/// any group contains both poison and non-poison elements.
116static bool foldMixesPoisonBits(Constant *C, unsigned NumSrcElt,
117 unsigned NumDstElt) {
118 // If element counts don't divide evenly, bail out if a poison source element
119 // might span multiple destination lanes.
120 if (NumSrcElt % NumDstElt != 0)
121 return C->containsPoisonElement();
122 unsigned Ratio = NumSrcElt / NumDstElt;
123 for (unsigned i = 0; i != NumSrcElt; i += Ratio) {
124 bool HasPoison = false;
125 bool HasNonPoison = false;
126 for (unsigned j = 0; j != Ratio; ++j) {
127 Constant *Src = C->getAggregateElement(i + j);
128 // Conservatively bail out.
129 if (!Src)
130 return true;
131 if (isa<PoisonValue>(Src))
132 HasPoison = true;
133 else
134 HasNonPoison = true;
135 }
136 if (HasPoison && HasNonPoison)
137 return true;
138 }
139 return false;
140}
141
142/// Track which destination lanes of a bitcast are produced from poison bytes.
143/// A destination lane is marked if any source element mapped to it is poison.
144/// Returns false if an aggregate element cannot be inspected. The caller should
145/// bail out of folding.
146static bool computePoisonDstLanes(Constant *C, unsigned NumSrcElt,
147 unsigned NumDstElt,
148 SmallBitVector &PoisonDstElts) {
149 // If element counts don't divide evenly, bail out if a poison source element
150 // might span multiple destination lanes.
151 if ((NumDstElt < NumSrcElt ? NumSrcElt % NumDstElt : NumDstElt % NumSrcElt))
152 return !C->containsPoisonElement();
153 if (NumDstElt < NumSrcElt) {
154 unsigned Ratio = NumSrcElt / NumDstElt;
155 for (unsigned i = 0; i != NumDstElt; ++i) {
156 for (unsigned j = 0; j != Ratio; ++j) {
157 Constant *Src = C->getAggregateElement(i * Ratio + j);
158 if (!Src)
159 return false;
160 if (isa<PoisonValue>(Src)) {
161 PoisonDstElts[i] = true;
162 break;
163 }
164 }
165 }
166 } else {
167 unsigned Ratio = NumDstElt / NumSrcElt;
168 for (unsigned i = 0; i != NumSrcElt; ++i) {
169 Constant *Src = C->getAggregateElement(i);
170 if (!Src)
171 return false;
172 if (isa<PoisonValue>(Src))
173 PoisonDstElts.set(i * Ratio, (i + 1) * Ratio);
174 }
175 }
176 return true;
177}
178
179/// Constant fold bitcast, symbolically evaluating it with DataLayout.
180/// This always returns a non-null constant, but it may be a
181/// ConstantExpr if unfoldable.
182Constant *FoldBitCast(Constant *C, Type *DestTy, const DataLayout &DL) {
183 assert(CastInst::castIsValid(Instruction::BitCast, C, DestTy) &&
184 "Invalid constantexpr bitcast!");
185
186 // Catch the obvious splat cases.
187 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
188 return Res;
189
190 if (auto *VTy = dyn_cast<VectorType>(C->getType())) {
191 // Handle a vector->scalar integer/fp cast.
192 if (isa<IntegerType>(DestTy) || DestTy->isFloatingPointTy()) {
193 unsigned NumSrcElts = cast<FixedVectorType>(VTy)->getNumElements();
194 Type *SrcEltTy = VTy->getElementType();
195
196 // Bitcasting a byte containing any poison bit to an integer or fp type
197 // yields poison.
198 if (SrcEltTy->isByteTy() && C->containsPoisonElement())
199 return PoisonValue::get(DestTy);
200
201 // If the vector is a vector of floating point or bytes, convert it to a
202 // vector of int to simplify things.
203 if (SrcEltTy->isFloatingPointTy() || SrcEltTy->isByteTy()) {
204 unsigned Width = SrcEltTy->getPrimitiveSizeInBits();
205 auto *SrcIVTy = FixedVectorType::get(
206 IntegerType::get(C->getContext(), Width), NumSrcElts);
207 // Ask IR to do the conversion now that #elts line up.
208 C = ConstantExpr::getBitCast(C, SrcIVTy);
209 }
210
211 APInt Result(DL.getTypeSizeInBits(DestTy), 0);
212 if (Constant *CE = foldConstVectorToAPInt(Result, DestTy, C,
213 SrcEltTy, NumSrcElts, DL))
214 return CE;
215
216 if (isa<IntegerType>(DestTy))
217 return ConstantInt::get(DestTy, Result);
218
219 APFloat FP(DestTy->getFltSemantics(), Result);
220 return ConstantFP::get(DestTy->getContext(), FP);
221 }
222 }
223
224 // The code below only handles casts to vectors currently.
225 auto *DestVTy = dyn_cast<VectorType>(DestTy);
226 if (!DestVTy)
227 return ConstantExpr::getBitCast(C, DestTy);
228
229 // If this is a scalar -> vector cast, convert the input into a <1 x scalar>
230 // vector so the code below can handle it uniformly.
231 if (!isa<VectorType>(C->getType()) &&
233 Constant *Ops = C; // don't take the address of C!
234 return FoldBitCast(ConstantVector::get(Ops), DestTy, DL);
235 }
236
237 // Some of what follows may extend to cover scalable vectors but the current
238 // implementation is fixed length specific.
239 if (!isa<FixedVectorType>(C->getType()))
240 return ConstantExpr::getBitCast(C, DestTy);
241
242 // If this is a bitcast from constant vector -> vector, fold it.
245 return ConstantExpr::getBitCast(C, DestTy);
246
247 // If the element types match, IR can fold it.
248 unsigned NumDstElt = cast<FixedVectorType>(DestVTy)->getNumElements();
249 unsigned NumSrcElt = cast<FixedVectorType>(C->getType())->getNumElements();
250 if (NumDstElt == NumSrcElt)
251 return ConstantExpr::getBitCast(C, DestTy);
252
253 Type *SrcEltTy = cast<VectorType>(C->getType())->getElementType();
254 Type *DstEltTy = DestVTy->getElementType();
255
256 // Otherwise, we're changing the number of elements in a vector, which
257 // requires endianness information to do the right thing. For example,
258 // bitcast (<2 x i64> <i64 0, i64 1> to <4 x i32>)
259 // folds to (little endian):
260 // <4 x i32> <i32 0, i32 0, i32 1, i32 0>
261 // and to (big endian):
262 // <4 x i32> <i32 0, i32 0, i32 0, i32 1>
263
264 // First thing is first. We only want to think about integer here, so if
265 // we have something in FP form, recast it as integer.
266 if (DstEltTy->isFloatingPointTy()) {
267 // Fold to an vector of integers with same size as our FP type.
268 unsigned FPWidth = DstEltTy->getPrimitiveSizeInBits();
269 auto *DestIVTy = FixedVectorType::get(
270 IntegerType::get(C->getContext(), FPWidth), NumDstElt);
271 // Recursively handle this integer conversion, if possible.
272 C = FoldBitCast(C, DestIVTy, DL);
273
274 // Finally, IR can handle this now that #elts line up.
275 return ConstantExpr::getBitCast(C, DestTy);
276 }
277
278 // Handle byte destination type by folding through integers.
279 if (DstEltTy->isByteTy()) {
280 // When combining elements into larger byte values, bail out if the fold
281 // mixes poison and non-poison bits in the same destination element. Byte
282 // types track poison per bit, and no constant value can represent that.
283 if (NumDstElt < NumSrcElt && foldMixesPoisonBits(C, NumSrcElt, NumDstElt))
284 return ConstantExpr::getBitCast(C, DestTy);
285
286 // Fold to a vector of integers with same size as the byte type.
287 unsigned ByteWidth = DstEltTy->getPrimitiveSizeInBits();
288 auto *DestIVTy = FixedVectorType::get(
289 IntegerType::get(C->getContext(), ByteWidth), NumDstElt);
290 C = FoldBitCast(C, DestIVTy, DL);
291 return ConstantExpr::getBitCast(C, DestTy);
292 }
293
294 // Okay, we know the destination is integer, if the input is FP, convert
295 // it to integer first.
296 if (SrcEltTy->isFloatingPointTy()) {
297 unsigned FPWidth = SrcEltTy->getPrimitiveSizeInBits();
298 auto *SrcIVTy = FixedVectorType::get(
299 IntegerType::get(C->getContext(), FPWidth), NumSrcElt);
300 // Ask IR to do the conversion now that #elts line up.
301 C = ConstantExpr::getBitCast(C, SrcIVTy);
302 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
304 "Constant folding cannot fail for plain fp->int bitcast!");
305 }
306
307 // Handle byte source type by folding through integers. Byte types track
308 // poison per bit, so any poison bit makes the destination lane poison.
309 // Record which destination lanes contain poison bits, before the generic
310 // fold below refines them to undef/zero, so they can be restored.
311 SmallBitVector PoisonDstElts(NumDstElt);
312 if (SrcEltTy->isByteTy()) {
313 if (!computePoisonDstLanes(C, NumSrcElt, NumDstElt, PoisonDstElts))
314 return ConstantExpr::getBitCast(C, DestTy);
315
316 unsigned ByteWidth = SrcEltTy->getPrimitiveSizeInBits();
317 auto *SrcIVTy = FixedVectorType::get(
318 IntegerType::get(C->getContext(), ByteWidth), NumSrcElt);
319 // Ask IR to do the conversion now that #elts line up.
320 C = ConstantExpr::getBitCast(C, SrcIVTy);
321 assert((isa<ConstantVector>(C) || // FIXME: Remove ConstantVector.
323 "Constant folding cannot fail for plain byte->int bitcast!");
324 }
325
326 // Now we know that the input and output vectors are both integer vectors
327 // of the same size, and that their #elements is not the same.
328 // Use data buffer for easy non-integer element ratio vectors handling,
329 // For example: <4 x i24> to <3 x i32>.
330 bool isLittleEndian = DL.isLittleEndian();
331 unsigned SrcBitSize = SrcEltTy->getPrimitiveSizeInBits();
332 unsigned DstBitSize = DstEltTy->getPrimitiveSizeInBits();
334 unsigned SrcElt = 0;
335
336 APInt Buffer(2 * std::max(SrcBitSize, DstBitSize), 0);
337 APInt UndefMask(Buffer.getBitWidth(), 0);
338 APInt PoisonMask(Buffer.getBitWidth(), 0);
339 unsigned BufferBitSize = 0;
340
341 while (Result.size() != NumDstElt) {
342 // Load SrcElts into Buffer.
343 while (BufferBitSize < DstBitSize) {
344 Constant *Element = C->getAggregateElement(SrcElt++);
345 if (!Element) // Reject constantexpr elements
346 return ConstantExpr::getBitCast(C, DestTy);
347
348 // Shift Buffer & Masks to fit next SrcElt.
349 if (!isLittleEndian) {
350 Buffer <<= SrcBitSize;
351 UndefMask <<= SrcBitSize;
352 PoisonMask <<= SrcBitSize;
353 }
354
355 APInt SrcValue;
356 unsigned BitPosition = isLittleEndian ? BufferBitSize : 0;
357 if (isa<UndefValue>(Element)) {
358 // Set masks fragments bits.
359 UndefMask.setBits(BitPosition, BitPosition + SrcBitSize);
360 if (isa<PoisonValue>(Element))
361 PoisonMask.setBits(BitPosition, BitPosition + SrcBitSize);
362 SrcValue = APInt::getZero(SrcBitSize);
363 } else {
364 auto *Src = dyn_cast<ConstantInt>(Element);
365 if (!Src)
366 return ConstantExpr::getBitCast(C, DestTy);
367 SrcValue = Src->getValue();
368 }
369
370 // Insert src element bits into Buffer on correct position.
371 Buffer.insertBits(SrcValue, BitPosition);
372 BufferBitSize += SrcBitSize;
373 }
374
375 // Create DstElts from Buffer.
376 while (BufferBitSize >= DstBitSize) {
377 unsigned ShiftAmt = isLittleEndian ? 0 : BufferBitSize - DstBitSize;
378 // Emit undef/poison, if all undef mask fragment bits are set.
379 if (UndefMask.extractBits(DstBitSize, ShiftAmt).isAllOnes()) {
380 // Push poison, if any bit in poison mask fragment is set.
381 if (!PoisonMask.extractBits(DstBitSize, ShiftAmt).isZero()) {
382 Result.push_back(PoisonValue::get(DstEltTy));
383 } else {
384 Result.push_back(UndefValue::get(DstEltTy));
385 }
386 } else {
387 // Create and push DstElt.
388 APInt Elt = Buffer.extractBits(DstBitSize, ShiftAmt);
389 Result.push_back(ConstantInt::get(DstEltTy, Elt));
390 }
391
392 // Shift unused Buffer fragment to lower bits.
393 if (isLittleEndian) {
394 Buffer.lshrInPlace(DstBitSize);
395 UndefMask.lshrInPlace(DstBitSize);
396 PoisonMask.lshrInPlace(DstBitSize);
397 }
398 BufferBitSize -= DstBitSize;
399 }
400 }
401
402 // Restore destination lanes whose source bytes contained poison bits.
403 for (unsigned I : PoisonDstElts.set_bits())
404 Result[I] = PoisonValue::get(DstEltTy);
405
406 return ConstantVector::get(Result);
407}
408
409} // end anonymous namespace
410
411/// If this constant is a constant offset from a global, return the global and
412/// the constant. Because of constantexprs, this function is recursive.
414 APInt &Offset, const DataLayout &DL,
415 DSOLocalEquivalent **DSOEquiv) {
416 if (DSOEquiv)
417 *DSOEquiv = nullptr;
418
419 // Trivial case, constant is the global.
420 if ((GV = dyn_cast<GlobalValue>(C))) {
421 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
422 Offset = APInt(BitWidth, 0);
423 return true;
424 }
425
426 if (auto *FoundDSOEquiv = dyn_cast<DSOLocalEquivalent>(C)) {
427 if (DSOEquiv)
428 *DSOEquiv = FoundDSOEquiv;
429 GV = FoundDSOEquiv->getGlobalValue();
430 unsigned BitWidth = DL.getIndexTypeSizeInBits(GV->getType());
431 Offset = APInt(BitWidth, 0);
432 return true;
433 }
434
435 // Otherwise, if this isn't a constant expr, bail out.
436 auto *CE = dyn_cast<ConstantExpr>(C);
437 if (!CE) return false;
438
439 // Look through ptr->int and ptr->ptr casts.
440 if (CE->getOpcode() == Instruction::PtrToInt ||
441 CE->getOpcode() == Instruction::PtrToAddr)
442 return IsConstantOffsetFromGlobal(CE->getOperand(0), GV, Offset, DL,
443 DSOEquiv);
444
445 // i32* getelementptr ([5 x i32]* @a, i32 0, i32 5)
446 auto *GEP = dyn_cast<GEPOperator>(CE);
447 if (!GEP)
448 return false;
449
450 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
451 APInt TmpOffset(BitWidth, 0);
452
453 // If the base isn't a global+constant, we aren't either.
454 if (!IsConstantOffsetFromGlobal(CE->getOperand(0), GV, TmpOffset, DL,
455 DSOEquiv))
456 return false;
457
458 // Otherwise, add any offset that our operands provide.
459 if (!GEP->accumulateConstantOffset(DL, TmpOffset))
460 return false;
461
462 Offset = TmpOffset;
463 return true;
464}
465
467 const DataLayout &DL) {
468 do {
469 Type *SrcTy = C->getType();
470 if (SrcTy == DestTy)
471 return C;
472
473 TypeSize DestSize = DL.getTypeSizeInBits(DestTy);
474 TypeSize SrcSize = DL.getTypeSizeInBits(SrcTy);
475 if (!TypeSize::isKnownGE(SrcSize, DestSize))
476 return nullptr;
477
478 // Catch the obvious splat cases (since all-zeros can coerce non-integral
479 // pointers legally).
480 if (Constant *Res = ConstantFoldLoadFromUniformValue(C, DestTy, DL))
481 return Res;
482
483 // If the type sizes are the same and a cast is legal, just directly
484 // cast the constant.
485 // But be careful not to coerce non-integral pointers illegally.
486 if (SrcSize == DestSize &&
487 DL.isNonIntegralPointerType(SrcTy->getScalarType()) ==
488 DL.isNonIntegralPointerType(DestTy->getScalarType())) {
489 Instruction::CastOps Cast = Instruction::BitCast;
490 // If we are going from a pointer to int or vice versa, we spell the cast
491 // differently.
492 if (SrcTy->isIntegerTy() && DestTy->isPointerTy())
493 Cast = Instruction::IntToPtr;
494 else if (SrcTy->isPointerTy() && DestTy->isIntegerTy())
495 Cast = Instruction::PtrToInt;
496
497 if (CastInst::castIsValid(Cast, C, DestTy))
498 return ConstantFoldCastOperand(Cast, C, DestTy, DL);
499 }
500
501 // If this isn't an aggregate type, there is nothing we can do to drill down
502 // and find a bitcastable constant.
503 if (!SrcTy->isAggregateType() && !SrcTy->isVectorTy())
504 return nullptr;
505
506 // We're simulating a load through a pointer that was bitcast to point to
507 // a different type, so we can try to walk down through the initial
508 // elements of an aggregate to see if some part of the aggregate is
509 // castable to implement the "load" semantic model.
510 if (SrcTy->isStructTy()) {
511 // Struct types might have leading zero-length elements like [0 x i32],
512 // which are certainly not what we are looking for, so skip them.
513 unsigned Elem = 0;
514 Constant *ElemC;
515 do {
516 ElemC = C->getAggregateElement(Elem++);
517 } while (ElemC && DL.getTypeSizeInBits(ElemC->getType()).isZero());
518 C = ElemC;
519 } else {
520 // For non-byte-sized vector elements, the first element is not
521 // necessarily located at the vector base address.
522 if (auto *VT = dyn_cast<VectorType>(SrcTy))
523 if (!DL.typeSizeEqualsStoreSize(VT->getElementType()))
524 return nullptr;
525
526 C = C->getAggregateElement(0u);
527 }
528 } while (C);
529
530 return nullptr;
531}
532
533namespace {
534
535/// Recursive helper to read bits out of global. C is the constant being copied
536/// out of. ByteOffset is an offset into C. CurPtr is the pointer to copy
537/// results into and BytesLeft is the number of bytes left in
538/// the CurPtr buffer. DL is the DataLayout. When IsByteLoad is true, do not
539/// unwrap inttoptr constant expressions. The caller would reconstruct those
540/// bits as a ConstantByte, dropping the pointer's provenance.
541bool ReadDataFromGlobal(Constant *C, uint64_t ByteOffset, unsigned char *CurPtr,
542 unsigned BytesLeft, const DataLayout &DL,
543 bool IsByteLoad = false) {
544 assert(ByteOffset <= DL.getTypeAllocSize(C->getType()) &&
545 "Out of range access");
546
547 // Reading type padding, return zero.
548 if (ByteOffset >= DL.getTypeStoreSize(C->getType()))
549 return true;
550
551 // If this element is zero or undefined, we can just return since *CurPtr is
552 // zero initialized.
554 return true;
555
556 auto *CI = dyn_cast<ConstantInt>(C);
557 if (CI && CI->getType()->isIntegerTy()) {
558 if ((CI->getBitWidth() & 7) != 0)
559 return false;
560 const APInt &Val = CI->getValue();
561 unsigned IntBytes = unsigned(CI->getBitWidth()/8);
562
563 for (unsigned i = 0; i != BytesLeft && ByteOffset != IntBytes; ++i) {
564 unsigned n = ByteOffset;
565 if (!DL.isLittleEndian())
566 n = IntBytes - n - 1;
567 CurPtr[i] = Val.extractBits(8, n * 8).getZExtValue();
568 ++ByteOffset;
569 }
570 return true;
571 }
572
573 auto *CFP = dyn_cast<ConstantFP>(C);
574 if (CFP && CFP->getType()->isFloatingPointTy()) {
575 if (CFP->getType()->isDoubleTy()) {
576 C = FoldBitCast(C, Type::getInt64Ty(C->getContext()), DL);
577 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL,
578 IsByteLoad);
579 }
580 if (CFP->getType()->isFloatTy()){
581 C = FoldBitCast(C, Type::getInt32Ty(C->getContext()), DL);
582 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL,
583 IsByteLoad);
584 }
585 if (CFP->getType()->isHalfTy()){
586 C = FoldBitCast(C, Type::getInt16Ty(C->getContext()), DL);
587 return ReadDataFromGlobal(C, ByteOffset, CurPtr, BytesLeft, DL,
588 IsByteLoad);
589 }
590 return false;
591 }
592
593 if (auto *CS = dyn_cast<ConstantStruct>(C)) {
594 const StructLayout *SL = DL.getStructLayout(CS->getType());
595 unsigned Index = SL->getElementContainingOffset(ByteOffset);
596 uint64_t CurEltOffset = SL->getElementOffset(Index);
597 ByteOffset -= CurEltOffset;
598
599 while (true) {
600 // If the element access is to the element itself and not to tail padding,
601 // read the bytes from the element.
602 uint64_t EltSize = DL.getTypeAllocSize(CS->getOperand(Index)->getType());
603
604 if (ByteOffset < EltSize &&
605 !ReadDataFromGlobal(CS->getOperand(Index), ByteOffset, CurPtr,
606 BytesLeft, DL, IsByteLoad))
607 return false;
608
609 ++Index;
610
611 // Check to see if we read from the last struct element, if so we're done.
612 if (Index == CS->getType()->getNumElements())
613 return true;
614
615 // If we read all of the bytes we needed from this element we're done.
616 uint64_t NextEltOffset = SL->getElementOffset(Index);
617
618 if (BytesLeft <= NextEltOffset - CurEltOffset - ByteOffset)
619 return true;
620
621 // Move to the next element of the struct.
622 CurPtr += NextEltOffset - CurEltOffset - ByteOffset;
623 BytesLeft -= NextEltOffset - CurEltOffset - ByteOffset;
624 ByteOffset = 0;
625 CurEltOffset = NextEltOffset;
626 }
627 // not reached.
628 }
629
633 uint64_t NumElts, EltSize;
634 Type *EltTy;
635 if (auto *AT = dyn_cast<ArrayType>(C->getType())) {
636 NumElts = AT->getNumElements();
637 EltTy = AT->getElementType();
638 EltSize = DL.getTypeAllocSize(EltTy);
639 } else {
640 NumElts = cast<FixedVectorType>(C->getType())->getNumElements();
641 EltTy = cast<FixedVectorType>(C->getType())->getElementType();
642 // TODO: For non-byte-sized vectors, current implementation assumes there is
643 // padding to the next byte boundary between elements.
644 if (!DL.typeSizeEqualsStoreSize(EltTy))
645 return false;
646
647 EltSize = DL.getTypeStoreSize(EltTy);
648 }
649 uint64_t Index = ByteOffset / EltSize;
650 uint64_t Offset = ByteOffset - Index * EltSize;
651
652 for (; Index != NumElts; ++Index) {
653 if (!ReadDataFromGlobal(C->getAggregateElement(Index), Offset, CurPtr,
654 BytesLeft, DL, IsByteLoad))
655 return false;
656
657 uint64_t BytesWritten = EltSize - Offset;
658 assert(BytesWritten <= EltSize && "Not indexing into this element?");
659 if (BytesWritten >= BytesLeft)
660 return true;
661
662 Offset = 0;
663 BytesLeft -= BytesWritten;
664 CurPtr += BytesWritten;
665 }
666 return true;
667 }
668
669 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
670 if (CE->getOpcode() == Instruction::IntToPtr &&
671 CE->getOperand(0)->getType() == DL.getIntPtrType(CE->getType())) {
672 // Folding byte loads through the integer operand would rebuild the result
673 // as a `ConstantByte`, dropping the pointer's provenance.
674 if (IsByteLoad)
675 return false;
676 return ReadDataFromGlobal(CE->getOperand(0), ByteOffset, CurPtr,
677 BytesLeft, DL, IsByteLoad);
678 }
679 }
680
681 // Otherwise, unknown initializer type.
682 return false;
683}
684
685/// OrigLoadTy is the original type being loaded, while LoadTy is the type
686/// currently being folded (which may be integer type mapped from OrigLoadTy).
687Constant *FoldReinterpretLoadFromConst(Constant *C, Type *LoadTy,
688 Type *OrigLoadTy, int64_t Offset,
689 const DataLayout &DL) {
690 // Bail out early. Not expect to load from scalable global variable.
691 if (isa<ScalableVectorType>(LoadTy))
692 return nullptr;
693
694 auto *IntType = dyn_cast<IntegerType>(LoadTy);
695
696 // If this isn't an integer load we can't fold it directly.
697 if (!IntType) {
698 // If this is a non-integer load, we can try folding it as an int load and
699 // then bitcast the result. This can be useful for union cases. Note
700 // that address spaces don't matter here since we're not going to result in
701 // an actual new load.
702 if (!LoadTy->isFloatingPointTy() && !LoadTy->isPointerTy() &&
703 !LoadTy->isByteTy() && !LoadTy->isVectorTy())
704 return nullptr;
705
706 Type *MapTy = Type::getIntNTy(C->getContext(),
707 DL.getTypeSizeInBits(LoadTy).getFixedValue());
708 if (Constant *Res =
709 FoldReinterpretLoadFromConst(C, MapTy, OrigLoadTy, Offset, DL)) {
710 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
711 // Materializing a zero can be done trivially without a bitcast
712 return Constant::getNullValue(LoadTy);
713 Type *CastTy = LoadTy->isPtrOrPtrVectorTy() ? DL.getIntPtrType(LoadTy) : LoadTy;
714 Res = FoldBitCast(Res, CastTy, DL);
715 if (LoadTy->isPtrOrPtrVectorTy()) {
716 // For vector of pointer, we needed to first convert to a vector of integer, then do vector inttoptr
717 if (Res->isNullValue() && !LoadTy->isX86_AMXTy())
718 return Constant::getNullValue(LoadTy);
719 if (DL.isNonIntegralPointerType(LoadTy->getScalarType()))
720 // Be careful not to replace a load of an addrspace value with an inttoptr here
721 return nullptr;
722 Res = ConstantExpr::getIntToPtr(Res, LoadTy);
723 }
724 return Res;
725 }
726 return nullptr;
727 }
728
729 unsigned BytesLoaded = (IntType->getBitWidth() + 7) / 8;
730 // Allow folding of large type loads (e.g. <16 x double>).
731 if (BytesLoaded > 128 || BytesLoaded == 0)
732 return nullptr;
733
734 // For scalar integer load, use smaller limit to avoid regression during
735 // memcmp expansion. Codegen may generate inefficient string operations.
736 if (BytesLoaded > 32 && OrigLoadTy->isIntegerTy())
737 return nullptr;
738
739 // If we're not accessing anything in this constant, the result is undefined.
740 if (Offset <= -1 * static_cast<int64_t>(BytesLoaded))
741 return PoisonValue::get(IntType);
742
743 // TODO: We should be able to support scalable types.
744 TypeSize InitializerSize = DL.getTypeAllocSize(C->getType());
745 if (InitializerSize.isScalable())
746 return nullptr;
747
748 // If we're not accessing anything in this constant, the result is undefined.
749 if (Offset >= (int64_t)InitializerSize.getFixedValue())
750 return PoisonValue::get(IntType);
751
752 SmallVector<unsigned char, 64> RawBytes(BytesLoaded);
753 unsigned char *CurPtr = RawBytes.data();
754 unsigned BytesLeft = BytesLoaded;
755
756 // If we're loading off the beginning of the global, some bytes may be valid.
757 if (Offset < 0) {
758 CurPtr += -Offset;
759 BytesLeft += Offset;
760 Offset = 0;
761 }
762
763 if (!ReadDataFromGlobal(C, Offset, CurPtr, BytesLeft, DL,
764 /*IsByteLoad=*/OrigLoadTy->isByteOrByteVectorTy()))
765 return nullptr;
766
767 APInt ResultVal = APInt(IntType->getBitWidth(), 0);
768 if (DL.isLittleEndian()) {
769 ResultVal = RawBytes[BytesLoaded - 1];
770 for (unsigned i = 1; i != BytesLoaded; ++i) {
771 ResultVal <<= 8;
772 ResultVal |= RawBytes[BytesLoaded - 1 - i];
773 }
774 } else {
775 ResultVal = RawBytes[0];
776 for (unsigned i = 1; i != BytesLoaded; ++i) {
777 ResultVal <<= 8;
778 ResultVal |= RawBytes[i];
779 }
780 }
781
782 return ConstantInt::get(IntType->getContext(), ResultVal);
783}
784
785} // anonymous namespace
786
787// If GV is a constant with an initializer read its representation starting
788// at Offset and return it as a constant array of unsigned char. Otherwise
789// return null.
792 if (!GV->isConstant() || !GV->hasDefinitiveInitializer())
793 return nullptr;
794
795 const DataLayout &DL = GV->getDataLayout();
796 Constant *Init = const_cast<Constant *>(GV->getInitializer());
797 TypeSize InitSize = DL.getTypeAllocSize(Init->getType());
798 if (InitSize < Offset)
799 return nullptr;
800
801 uint64_t NBytes = InitSize - Offset;
802 if (NBytes > UINT16_MAX)
803 // Bail for large initializers in excess of 64K to avoid allocating
804 // too much memory.
805 // Offset is assumed to be less than or equal than InitSize (this
806 // is enforced in ReadDataFromGlobal).
807 return nullptr;
808
809 SmallVector<unsigned char, 256> RawBytes(static_cast<size_t>(NBytes));
810 unsigned char *CurPtr = RawBytes.data();
811
812 if (!ReadDataFromGlobal(Init, Offset, CurPtr, NBytes, DL))
813 return nullptr;
814
815 return ConstantDataArray::get(GV->getContext(), RawBytes);
816}
817
818/// If this Offset points exactly to the start of an aggregate element, return
819/// that element, otherwise return nullptr.
821 const DataLayout &DL) {
822 if (Offset.isZero())
823 return Base;
824
826 return nullptr;
827
828 Type *ElemTy = Base->getType();
829 SmallVector<APInt> Indices = DL.getGEPIndicesForOffset(ElemTy, Offset);
830 if (!Offset.isZero() || !Indices[0].isZero())
831 return nullptr;
832
833 Constant *C = Base;
834 for (const APInt &Index : drop_begin(Indices)) {
835 if (Index.isNegative() || Index.getActiveBits() >= 32)
836 return nullptr;
837
838 C = C->getAggregateElement(Index.getZExtValue());
839 if (!C)
840 return nullptr;
841 }
842
843 return C;
844}
845
847 const APInt &Offset,
848 const DataLayout &DL) {
849 if (Constant *AtOffset = getConstantAtOffset(C, Offset, DL))
850 if (Constant *Result = ConstantFoldLoadThroughBitcast(AtOffset, Ty, DL))
851 return Result;
852
853 // Explicitly check for out-of-bounds access, so we return poison even if the
854 // constant is a uniform value.
855 TypeSize Size = DL.getTypeAllocSize(C->getType());
856 if (!Size.isScalable() && Offset.sge(Size.getFixedValue()))
857 return PoisonValue::get(Ty);
858
859 // Try an offset-independent fold of a uniform value.
860 if (Constant *Result = ConstantFoldLoadFromUniformValue(C, Ty, DL))
861 return Result;
862
863 // Try hard to fold loads from bitcasted strange and non-type-safe things.
864 if (Offset.getSignificantBits() <= 64)
865 if (Constant *Result =
866 FoldReinterpretLoadFromConst(C, Ty, Ty, Offset.getSExtValue(), DL))
867 return Result;
868
869 return nullptr;
870}
871
876
879 const DataLayout &DL) {
880 // We can only fold loads from constant globals with a definitive initializer.
881 // Check this upfront, to skip expensive offset calculations.
883 if (!GV || !GV->isConstant() || !GV->hasDefinitiveInitializer())
884 return nullptr;
885
886 C = cast<Constant>(C->stripAndAccumulateConstantOffsets(
887 DL, Offset, /* AllowNonInbounds */ true));
888
889 if (C == GV)
890 if (Constant *Result = ConstantFoldLoadFromConst(GV->getInitializer(), Ty,
891 Offset, DL))
892 return Result;
893
894 // If this load comes from anywhere in a uniform constant global, the value
895 // is always the same, regardless of the loaded offset.
896 return ConstantFoldLoadFromUniformValue(GV->getInitializer(), Ty, DL);
897}
898
900 const DataLayout &DL) {
901 APInt Offset(DL.getIndexTypeSizeInBits(C->getType()), 0);
902 return ConstantFoldLoadFromConstPtr(C, Ty, std::move(Offset), DL);
903}
904
906 const DataLayout &DL) {
907 if (isa<PoisonValue>(C))
908 return PoisonValue::get(Ty);
909 if (isa<UndefValue>(C))
910 return UndefValue::get(Ty);
911 // If padding is needed when storing C to memory, then it isn't considered as
912 // uniform.
913 if (!DL.typeSizeEqualsStoreSize(C->getType()))
914 return nullptr;
915 if (C->isNullValue() && !Ty->isX86_AMXTy())
916 return Constant::getNullValue(Ty);
917 if (C->isAllOnesValue() &&
918 (Ty->isIntOrIntVectorTy() || Ty->isByteOrByteVectorTy() ||
919 Ty->isFPOrFPVectorTy()))
920 return Constant::getAllOnesValue(Ty);
921 return nullptr;
922}
923
924namespace {
925
926/// One of Op0/Op1 is a constant expression.
927/// Attempt to symbolically evaluate the result of a binary operator merging
928/// these together. If target data info is available, it is provided as DL,
929/// otherwise DL is null.
930Constant *SymbolicallyEvaluateBinop(unsigned Opc, Constant *Op0, Constant *Op1,
931 const DataLayout &DL) {
932 // SROA
933
934 // Fold (and 0xffffffff00000000, (shl x, 32)) -> shl.
935 // Fold (lshr (or X, Y), 32) -> (lshr [X/Y], 32) if one doesn't contribute
936 // bits.
937
938 if (Opc == Instruction::And) {
939 KnownBits Known0 = computeKnownBits(Op0, DL);
940 KnownBits Known1 = computeKnownBits(Op1, DL);
941 if ((Known1.One | Known0.Zero).isAllOnes()) {
942 // All the bits of Op0 that the 'and' could be masking are already zero.
943 return Op0;
944 }
945 if ((Known0.One | Known1.Zero).isAllOnes()) {
946 // All the bits of Op1 that the 'and' could be masking are already zero.
947 return Op1;
948 }
949
950 Known0 &= Known1;
951 if (Known0.isConstant())
952 return ConstantInt::get(Op0->getType(), Known0.getConstant());
953 }
954
955 // If the constant expr is something like &A[123] - &A[4].f, fold this into a
956 // constant. This happens frequently when iterating over a global array.
957 if (Opc == Instruction::Sub) {
958 GlobalValue *GV1, *GV2;
959 APInt Offs1, Offs2;
960
961 if (IsConstantOffsetFromGlobal(Op0, GV1, Offs1, DL))
962 if (IsConstantOffsetFromGlobal(Op1, GV2, Offs2, DL) && GV1 == GV2) {
963 unsigned OpSize = DL.getTypeSizeInBits(Op0->getType());
964
965 // (&GV+C1) - (&GV+C2) -> C1-C2, pointer arithmetic cannot overflow.
966 // PtrToInt may change the bitwidth so we have convert to the right size
967 // first.
968 return ConstantInt::get(Op0->getType(), Offs1.zextOrTrunc(OpSize) -
969 Offs2.zextOrTrunc(OpSize));
970 }
971 }
972
973 return nullptr;
974}
975
976/// If array indices are not pointer-sized integers, explicitly cast them so
977/// that they aren't implicitly casted by the getelementptr.
978Constant *CastGEPIndices(Type *SrcElemTy, ArrayRef<Constant *> Ops,
979 Type *ResultTy, GEPNoWrapFlags NW,
980 std::optional<ConstantRange> InRange,
981 const DataLayout &DL, const TargetLibraryInfo *TLI) {
982 Type *IntIdxTy = DL.getIndexType(ResultTy);
983 Type *IntIdxScalarTy = IntIdxTy->getScalarType();
984
985 bool Any = false;
987 for (unsigned i = 1, e = Ops.size(); i != e; ++i) {
988 if ((i == 1 ||
990 SrcElemTy, Ops.slice(1, i - 1)))) &&
991 Ops[i]->getType()->getScalarType() != IntIdxScalarTy) {
992 Any = true;
993 Type *NewType =
994 Ops[i]->getType()->isVectorTy() ? IntIdxTy : IntIdxScalarTy;
996 CastInst::getCastOpcode(Ops[i], true, NewType, true), Ops[i], NewType,
997 DL);
998 if (!NewIdx)
999 return nullptr;
1000 NewIdxs.push_back(NewIdx);
1001 } else
1002 NewIdxs.push_back(Ops[i]);
1003 }
1004
1005 if (!Any)
1006 return nullptr;
1007
1008 Constant *C =
1009 ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], NewIdxs, NW, InRange);
1010 return ConstantFoldConstant(C, DL, TLI);
1011}
1012
1013/// If we can symbolically evaluate the GEP constant expression, do so.
1014Constant *SymbolicallyEvaluateGEP(const GEPOperator *GEP,
1016 const DataLayout &DL,
1017 const TargetLibraryInfo *TLI) {
1018 Type *SrcElemTy = GEP->getSourceElementType();
1019 Type *ResTy = GEP->getType();
1020 if (!SrcElemTy->isSized() || isa<ScalableVectorType>(SrcElemTy))
1021 return nullptr;
1022
1023 if (Constant *C = CastGEPIndices(SrcElemTy, Ops, ResTy, GEP->getNoWrapFlags(),
1024 GEP->getInRange(), DL, TLI))
1025 return C;
1026
1027 Constant *Ptr = Ops[0];
1028 if (!Ptr->getType()->isPointerTy())
1029 return nullptr;
1030
1031 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1032
1033 for (unsigned i = 1, e = Ops.size(); i != e; ++i)
1034 if (!isa<ConstantInt>(Ops[i]) || !Ops[i]->getType()->isIntegerTy())
1035 return nullptr;
1036
1037 unsigned BitWidth = DL.getTypeSizeInBits(IntIdxTy);
1038 APInt Offset = APInt(
1039 BitWidth,
1040 DL.getIndexedOffsetInType(
1041 SrcElemTy, ArrayRef((Value *const *)Ops.data() + 1, Ops.size() - 1)),
1042 /*isSigned=*/true, /*implicitTrunc=*/true);
1043
1044 std::optional<ConstantRange> InRange = GEP->getInRange();
1045 if (InRange)
1046 InRange = InRange->sextOrTrunc(BitWidth);
1047
1048 // If this is a GEP of a GEP, fold it all into a single GEP.
1049 GEPNoWrapFlags NW = GEP->getNoWrapFlags();
1050 bool Overflow = false;
1051 while (auto *GEP = dyn_cast<GEPOperator>(Ptr)) {
1052 NW &= GEP->getNoWrapFlags();
1053
1054 SmallVector<Value *, 4> NestedOps(llvm::drop_begin(GEP->operands()));
1055
1056 // Do not try the incorporate the sub-GEP if some index is not a number.
1057 bool AllConstantInt = true;
1058 for (Value *NestedOp : NestedOps)
1059 if (!isa<ConstantInt>(NestedOp)) {
1060 AllConstantInt = false;
1061 break;
1062 }
1063 if (!AllConstantInt)
1064 break;
1065
1066 // Adjust inrange offset and intersect inrange attributes
1067 if (auto GEPRange = GEP->getInRange()) {
1068 auto AdjustedGEPRange = GEPRange->sextOrTrunc(BitWidth).subtract(Offset);
1069 InRange =
1070 InRange ? InRange->intersectWith(AdjustedGEPRange) : AdjustedGEPRange;
1071 }
1072
1073 Ptr = cast<Constant>(GEP->getOperand(0));
1074 SrcElemTy = GEP->getSourceElementType();
1075 Offset = Offset.sadd_ov(
1076 APInt(BitWidth, DL.getIndexedOffsetInType(SrcElemTy, NestedOps),
1077 /*isSigned=*/true, /*implicitTrunc=*/true),
1078 Overflow);
1079 }
1080
1081 // Preserving nusw (without inbounds) also requires that the offset
1082 // additions did not overflow.
1083 if (NW.hasNoUnsignedSignedWrap() && !NW.isInBounds() && Overflow)
1085
1086 // If the base value for this address is a literal integer value, fold the
1087 // getelementptr to the resulting integer value casted to the pointer type.
1088 APInt BaseIntVal(DL.getPointerTypeSizeInBits(Ptr->getType()), 0);
1089 if (auto *CE = dyn_cast<ConstantExpr>(Ptr)) {
1090 if (CE->getOpcode() == Instruction::IntToPtr) {
1091 if (auto *Base = dyn_cast<ConstantInt>(CE->getOperand(0)))
1092 BaseIntVal = Base->getValue().zextOrTrunc(BaseIntVal.getBitWidth());
1093 }
1094 }
1095
1096 if ((Ptr->isNullValue() || BaseIntVal != 0) &&
1097 !DL.mustNotIntroduceIntToPtr(Ptr->getType())) {
1098
1099 // If the index size is smaller than the pointer size, add to the low
1100 // bits only.
1101 BaseIntVal.insertBits(BaseIntVal.trunc(BitWidth) + Offset, 0);
1102 Constant *C = ConstantInt::get(Ptr->getContext(), BaseIntVal);
1103 return ConstantExpr::getIntToPtr(C, ResTy);
1104 }
1105
1106 // Try to infer inbounds for GEPs of globals.
1107 if (!NW.isInBounds() && Offset.isNonNegative()) {
1108 bool CanBeNull;
1109 uint64_t DerefBytes = Ptr->getPointerDereferenceableBytes(
1110 DL, CanBeNull, /*CanBeFreed=*/nullptr);
1111 if (DerefBytes != 0 && !CanBeNull && Offset.sle(DerefBytes))
1113 }
1114
1115 // nusw + nneg -> nuw
1116 if (NW.hasNoUnsignedSignedWrap() && Offset.isNonNegative())
1118
1119 // Otherwise canonicalize this to a single ptradd.
1120 LLVMContext &Ctx = Ptr->getContext();
1121 return ConstantExpr::getPtrAdd(Ptr, ConstantInt::get(Ctx, Offset), NW,
1122 InRange);
1123}
1124
1125/// Attempt to constant fold an instruction with the
1126/// specified opcode and operands. If successful, the constant result is
1127/// returned, if not, null is returned. Note that this function can fail when
1128/// attempting to fold instructions like loads and stores, which have no
1129/// constant expression form.
1130Constant *ConstantFoldInstOperandsImpl(const Value *InstOrCE, unsigned Opcode,
1132 const DataLayout &DL,
1133 const TargetLibraryInfo *TLI,
1134 bool AllowNonDeterministic) {
1135 Type *DestTy = InstOrCE->getType();
1136
1137 if (Instruction::isUnaryOp(Opcode))
1138 return ConstantFoldUnaryOpOperand(Opcode, Ops[0], DL);
1139
1140 if (Instruction::isBinaryOp(Opcode)) {
1141 switch (Opcode) {
1142 default:
1143 break;
1144 case Instruction::FAdd:
1145 case Instruction::FSub:
1146 case Instruction::FMul:
1147 case Instruction::FDiv:
1148 case Instruction::FRem:
1149 // Handle floating point instructions separately to account for denormals
1150 // TODO: If a constant expression is being folded rather than an
1151 // instruction, denormals will not be flushed/treated as zero
1152 if (const auto *I = dyn_cast<Instruction>(InstOrCE)) {
1153 return ConstantFoldFPInstOperands(Opcode, Ops[0], Ops[1], DL, I,
1154 AllowNonDeterministic);
1155 }
1156 }
1157 return ConstantFoldBinaryOpOperands(Opcode, Ops[0], Ops[1], DL);
1158 }
1159
1160 if (Instruction::isCast(Opcode))
1161 return ConstantFoldCastOperand(Opcode, Ops[0], DestTy, DL);
1162
1163 if (auto *GEP = dyn_cast<GEPOperator>(InstOrCE)) {
1164 Type *SrcElemTy = GEP->getSourceElementType();
1166 return nullptr;
1167
1168 if (Constant *C = SymbolicallyEvaluateGEP(GEP, Ops, DL, TLI))
1169 return C;
1170
1171 return ConstantExpr::getGetElementPtr(SrcElemTy, Ops[0], Ops.slice(1),
1172 GEP->getNoWrapFlags(),
1173 GEP->getInRange());
1174 }
1175
1176 if (auto *CE = dyn_cast<ConstantExpr>(InstOrCE))
1177 return CE->getWithOperands(Ops);
1178
1179 switch (Opcode) {
1180 default: return nullptr;
1181 case Instruction::ICmp:
1182 case Instruction::FCmp: {
1183 auto *C = cast<CmpInst>(InstOrCE);
1184 return ConstantFoldCompareInstOperands(C->getPredicate(), Ops[0], Ops[1],
1185 DL, TLI, C);
1186 }
1187 case Instruction::Freeze:
1188 return isGuaranteedNotToBeUndefOrPoison(Ops[0]) ? Ops[0] : nullptr;
1189 case Instruction::Call:
1190 if (auto *F = dyn_cast<Function>(Ops.back())) {
1191 const auto *Call = cast<CallBase>(InstOrCE);
1193 return ConstantFoldCall(Call, F, Ops.slice(0, Ops.size() - 1), TLI,
1194 AllowNonDeterministic);
1195 }
1196 return nullptr;
1197 case Instruction::Select:
1198 return ConstantFoldSelectInstruction(Ops[0], Ops[1], Ops[2]);
1199 case Instruction::ExtractElement:
1201 case Instruction::ExtractValue:
1203 Ops[0], cast<ExtractValueInst>(InstOrCE)->getIndices());
1204 case Instruction::InsertElement:
1205 return ConstantExpr::getInsertElement(Ops[0], Ops[1], Ops[2]);
1206 case Instruction::InsertValue:
1208 Ops[0], Ops[1], cast<InsertValueInst>(InstOrCE)->getIndices());
1209 case Instruction::ShuffleVector:
1211 Ops[0], Ops[1], cast<ShuffleVectorInst>(InstOrCE)->getShuffleMask());
1212 case Instruction::Load: {
1213 const auto *LI = dyn_cast<LoadInst>(InstOrCE);
1214 if (LI->isVolatile())
1215 return nullptr;
1216 return ConstantFoldLoadFromConstPtr(Ops[0], LI->getType(), DL);
1217 }
1218 }
1219}
1220
1221} // end anonymous namespace
1222
1223//===----------------------------------------------------------------------===//
1224// Constant Folding public APIs
1225//===----------------------------------------------------------------------===//
1226
1227namespace {
1228
1229Constant *
1230ConstantFoldConstantImpl(const Constant *C, const DataLayout &DL,
1231 const TargetLibraryInfo *TLI,
1234 return const_cast<Constant *>(C);
1235
1237 for (const Use &OldU : C->operands()) {
1238 Constant *OldC = cast<Constant>(&OldU);
1239 Constant *NewC = OldC;
1240 // Recursively fold the ConstantExpr's operands. If we have already folded
1241 // a ConstantExpr, we don't have to process it again.
1242 if (isa<ConstantVector>(OldC) || isa<ConstantExpr>(OldC)) {
1243 auto It = FoldedOps.find(OldC);
1244 if (It == FoldedOps.end()) {
1245 NewC = ConstantFoldConstantImpl(OldC, DL, TLI, FoldedOps);
1246 FoldedOps.insert({OldC, NewC});
1247 } else {
1248 NewC = It->second;
1249 }
1250 }
1251 Ops.push_back(NewC);
1252 }
1253
1254 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1255 if (Constant *Res = ConstantFoldInstOperandsImpl(
1256 CE, CE->getOpcode(), Ops, DL, TLI, /*AllowNonDeterministic=*/true))
1257 return Res;
1258 return const_cast<Constant *>(C);
1259 }
1260
1262 return ConstantVector::get(Ops);
1263}
1264
1265} // end anonymous namespace
1266
1268 const DataLayout &DL,
1269 const TargetLibraryInfo *TLI) {
1270 // Handle PHI nodes quickly here...
1271 if (auto *PN = dyn_cast<PHINode>(I)) {
1272 Constant *CommonValue = nullptr;
1273
1275 for (Value *Incoming : PN->incoming_values()) {
1276 // If the incoming value is undef then skip it. Note that while we could
1277 // skip the value if it is equal to the phi node itself we choose not to
1278 // because that would break the rule that constant folding only applies if
1279 // all operands are constants.
1280 if (isa<UndefValue>(Incoming))
1281 continue;
1282 // If the incoming value is not a constant, then give up.
1283 auto *C = dyn_cast<Constant>(Incoming);
1284 if (!C)
1285 return nullptr;
1286 // Fold the PHI's operands.
1287 C = ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1288 // If the incoming value is a different constant to
1289 // the one we saw previously, then give up.
1290 if (CommonValue && C != CommonValue)
1291 return nullptr;
1292 CommonValue = C;
1293 }
1294
1295 // If we reach here, all incoming values are the same constant or undef.
1296 return CommonValue ? CommonValue : UndefValue::get(PN->getType());
1297 }
1298
1299 // Scan the operand list, checking to see if they are all constants, if so,
1300 // hand off to ConstantFoldInstOperandsImpl.
1301 if (!all_of(I->operands(), [](const Use &U) { return isa<Constant>(U); }))
1302 return nullptr;
1303
1306 for (const Use &OpU : I->operands()) {
1307 auto *Op = cast<Constant>(&OpU);
1308 // Fold the Instruction's operands.
1309 Op = ConstantFoldConstantImpl(Op, DL, TLI, FoldedOps);
1310 Ops.push_back(Op);
1311 }
1312
1313 return ConstantFoldInstOperands(I, Ops, DL, TLI);
1314}
1315
1317 const TargetLibraryInfo *TLI) {
1319 return ConstantFoldConstantImpl(C, DL, TLI, FoldedOps);
1320}
1321
1324 const DataLayout &DL,
1325 const TargetLibraryInfo *TLI,
1326 bool AllowNonDeterministic) {
1327 return ConstantFoldInstOperandsImpl(I, I->getOpcode(), Ops, DL, TLI,
1328 AllowNonDeterministic);
1329}
1330
1332 unsigned IntPredicate, Constant *Ops0, Constant *Ops1, const DataLayout &DL,
1333 const TargetLibraryInfo *TLI, const Instruction *I) {
1334 CmpInst::Predicate Predicate = (CmpInst::Predicate)IntPredicate;
1335 // fold: icmp (inttoptr x), null -> icmp x, 0
1336 // fold: icmp null, (inttoptr x) -> icmp 0, x
1337 // fold: icmp (ptrtoint x), 0 -> icmp x, null
1338 // fold: icmp 0, (ptrtoint x) -> icmp null, x
1339 // fold: icmp (inttoptr x), (inttoptr y) -> icmp trunc/zext x, trunc/zext y
1340 // fold: icmp (ptrtoint x), (ptrtoint y) -> icmp x, y
1341 //
1342 // FIXME: The following comment is out of data and the DataLayout is here now.
1343 // ConstantExpr::getCompare cannot do this, because it doesn't have DL
1344 // around to know if bit truncation is happening.
1345 if (auto *CE0 = dyn_cast<ConstantExpr>(Ops0)) {
1346 if (Ops1->isNullValue()) {
1347 if (CE0->getOpcode() == Instruction::IntToPtr) {
1348 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1349 // Convert the integer value to the right size to ensure we get the
1350 // proper extension or truncation.
1351 if (Constant *C = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1352 /*IsSigned*/ false, DL)) {
1353 Constant *Null = Constant::getNullValue(C->getType());
1354 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1355 }
1356 }
1357
1358 // icmp only compares the address part of the pointer, so only do this
1359 // transform if the integer size matches the address size.
1360 if (CE0->getOpcode() == Instruction::PtrToInt ||
1361 CE0->getOpcode() == Instruction::PtrToAddr) {
1362 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1363 if (CE0->getType() == AddrTy) {
1364 Constant *C = CE0->getOperand(0);
1365 Constant *Null = Constant::getNullValue(C->getType());
1366 return ConstantFoldCompareInstOperands(Predicate, C, Null, DL, TLI);
1367 }
1368 }
1369 }
1370
1371 if (auto *CE1 = dyn_cast<ConstantExpr>(Ops1)) {
1372 if (CE0->getOpcode() == CE1->getOpcode()) {
1373 if (CE0->getOpcode() == Instruction::IntToPtr) {
1374 Type *IntPtrTy = DL.getIntPtrType(CE0->getType());
1375
1376 // Convert the integer value to the right size to ensure we get the
1377 // proper extension or truncation.
1378 Constant *C0 = ConstantFoldIntegerCast(CE0->getOperand(0), IntPtrTy,
1379 /*IsSigned*/ false, DL);
1380 Constant *C1 = ConstantFoldIntegerCast(CE1->getOperand(0), IntPtrTy,
1381 /*IsSigned*/ false, DL);
1382 if (C0 && C1)
1383 return ConstantFoldCompareInstOperands(Predicate, C0, C1, DL, TLI);
1384 }
1385
1386 // icmp only compares the address part of the pointer, so only do this
1387 // transform if the integer size matches the address size.
1388 if (CE0->getOpcode() == Instruction::PtrToInt ||
1389 CE0->getOpcode() == Instruction::PtrToAddr) {
1390 Type *AddrTy = DL.getAddressType(CE0->getOperand(0)->getType());
1391 if (CE0->getType() == AddrTy &&
1392 CE0->getOperand(0)->getType() == CE1->getOperand(0)->getType()) {
1394 Predicate, CE0->getOperand(0), CE1->getOperand(0), DL, TLI);
1395 }
1396 }
1397 }
1398 }
1399
1400 // Convert pointer comparison (base+offset1) pred (base+offset2) into
1401 // offset1 pred offset2, for the case where the offset is inbounds. This
1402 // only works for equality and unsigned comparison, as inbounds permits
1403 // crossing the sign boundary. However, the offset comparison itself is
1404 // signed.
1405 if (Ops0->getType()->isPointerTy() && !ICmpInst::isSigned(Predicate)) {
1406 unsigned IndexWidth = DL.getIndexTypeSizeInBits(Ops0->getType());
1407 APInt Offset0(IndexWidth, 0);
1408 bool IsEqPred = ICmpInst::isEquality(Predicate);
1409 Value *Stripped0 = Ops0->stripAndAccumulateConstantOffsets(
1410 DL, Offset0, /*AllowNonInbounds=*/IsEqPred,
1411 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1412 /*LookThroughIntToPtr=*/IsEqPred);
1413 APInt Offset1(IndexWidth, 0);
1414 Value *Stripped1 = Ops1->stripAndAccumulateConstantOffsets(
1415 DL, Offset1, /*AllowNonInbounds=*/IsEqPred,
1416 /*AllowInvariantGroup=*/false, /*ExternalAnalysis=*/nullptr,
1417 /*LookThroughIntToPtr=*/IsEqPred);
1418 if (Stripped0 == Stripped1)
1419 return ConstantInt::getBool(
1420 Ops0->getContext(),
1421 ICmpInst::compare(Offset0, Offset1,
1422 ICmpInst::getSignedPredicate(Predicate)));
1423 }
1424 } else if (isa<ConstantExpr>(Ops1)) {
1425 // If RHS is a constant expression, but the left side isn't, swap the
1426 // operands and try again.
1427 Predicate = ICmpInst::getSwappedPredicate(Predicate);
1428 return ConstantFoldCompareInstOperands(Predicate, Ops1, Ops0, DL, TLI);
1429 }
1430
1431 if (CmpInst::isFPPredicate(Predicate)) {
1432 // Flush any denormal constant float input according to denormal handling
1433 // mode.
1434 Ops0 = FlushFPConstant(Ops0, I, /*IsOutput=*/false);
1435 if (!Ops0)
1436 return nullptr;
1437 Ops1 = FlushFPConstant(Ops1, I, /*IsOutput=*/false);
1438 if (!Ops1)
1439 return nullptr;
1440 }
1441
1442 return ConstantFoldCompareInstruction(Predicate, Ops0, Ops1);
1443}
1444
1446 const DataLayout &DL) {
1448
1449 return ConstantFoldUnaryInstruction(Opcode, Op);
1450}
1451
1453 Constant *RHS,
1454 const DataLayout &DL) {
1456 if (isa<ConstantExpr>(LHS) || isa<ConstantExpr>(RHS))
1457 if (Constant *C = SymbolicallyEvaluateBinop(Opcode, LHS, RHS, DL))
1458 return C;
1459
1461 return ConstantExpr::get(Opcode, LHS, RHS);
1462 return ConstantFoldBinaryInstruction(Opcode, LHS, RHS);
1463}
1464
1467 switch (Mode) {
1469 return nullptr;
1470 case DenormalMode::IEEE:
1471 return ConstantFP::get(Ty, APF);
1473 return ConstantFP::get(
1474 Ty, APFloat::getZero(APF.getSemantics(), APF.isNegative()));
1476 return ConstantFP::get(Ty, APFloat::getZero(APF.getSemantics(), false));
1477 default:
1478 break;
1479 }
1480
1481 llvm_unreachable("unknown denormal mode");
1482}
1483
1484/// Return the denormal mode that can be assumed when executing a floating point
1485/// operation at \p CtxI.
1487 if (!CtxI || !CtxI->getParent() || !CtxI->getFunction())
1488 return DenormalMode::getDynamic();
1489 return CtxI->getFunction()->getDenormalMode(
1490 Ty->getScalarType()->getFltSemantics());
1491}
1492
1494 const Instruction *Inst,
1495 bool IsOutput) {
1496 const APFloat &APF = CFP->getValueAPF();
1497 if (!APF.isDenormal())
1498 return CFP;
1499
1501 return flushDenormalConstant(CFP->getType(), APF,
1502 IsOutput ? Mode.Output : Mode.Input);
1503}
1504
1506 bool IsOutput) {
1507 if (ConstantFP *CFP = dyn_cast<ConstantFP>(Operand))
1508 return flushDenormalConstantFP(CFP, Inst, IsOutput);
1509
1511 return Operand;
1512
1513 Type *Ty = Operand->getType();
1514 VectorType *VecTy = dyn_cast<VectorType>(Ty);
1515 if (VecTy) {
1516 if (auto *Splat = dyn_cast_or_null<ConstantFP>(Operand->getSplatValue())) {
1517 ConstantFP *Folded = flushDenormalConstantFP(Splat, Inst, IsOutput);
1518 if (!Folded)
1519 return nullptr;
1520 return ConstantVector::getSplat(VecTy->getElementCount(), Folded);
1521 }
1522
1523 Ty = VecTy->getElementType();
1524 }
1525
1526 if (isa<ConstantExpr>(Operand))
1527 return Operand;
1528
1529 if (const auto *CV = dyn_cast<ConstantVector>(Operand)) {
1531 for (unsigned i = 0, e = CV->getNumOperands(); i != e; ++i) {
1532 Constant *Element = CV->getAggregateElement(i);
1533 if (isa<UndefValue>(Element)) {
1534 NewElts.push_back(Element);
1535 continue;
1536 }
1537
1538 ConstantFP *CFP = dyn_cast<ConstantFP>(Element);
1539 if (!CFP)
1540 return nullptr;
1541
1542 ConstantFP *Folded = flushDenormalConstantFP(CFP, Inst, IsOutput);
1543 if (!Folded)
1544 return nullptr;
1545 NewElts.push_back(Folded);
1546 }
1547
1548 return ConstantVector::get(NewElts);
1549 }
1550
1551 if (const auto *CDV = dyn_cast<ConstantDataVector>(Operand)) {
1553 for (unsigned I = 0, E = CDV->getNumElements(); I < E; ++I) {
1554 const APFloat &Elt = CDV->getElementAsAPFloat(I);
1555 if (!Elt.isDenormal()) {
1556 NewElts.push_back(ConstantFP::get(Ty, Elt));
1557 } else {
1558 DenormalMode Mode = getInstrDenormalMode(Inst, Ty);
1559 ConstantFP *Folded =
1560 flushDenormalConstant(Ty, Elt, IsOutput ? Mode.Output : Mode.Input);
1561 if (!Folded)
1562 return nullptr;
1563 NewElts.push_back(Folded);
1564 }
1565 }
1566
1567 return ConstantVector::get(NewElts);
1568 }
1569
1570 return nullptr;
1571}
1572
1574 Constant *RHS, const DataLayout &DL,
1575 const Instruction *I,
1576 bool AllowNonDeterministic) {
1577 if (Instruction::isBinaryOp(Opcode)) {
1578 // Flush denormal inputs if needed.
1579 Constant *Op0 = FlushFPConstant(LHS, I, /* IsOutput */ false);
1580 if (!Op0)
1581 return nullptr;
1582 Constant *Op1 = FlushFPConstant(RHS, I, /* IsOutput */ false);
1583 if (!Op1)
1584 return nullptr;
1585
1586 // If nsz or an algebraic FMF flag is set, the result of the FP operation
1587 // may change due to future optimization. Don't constant fold them if
1588 // non-deterministic results are not allowed.
1589 if (!AllowNonDeterministic)
1591 if (FP->hasNoSignedZeros() || FP->hasAllowReassoc() ||
1592 FP->hasAllowContract() || FP->hasAllowReciprocal())
1593 return nullptr;
1594
1595 // Calculate constant result.
1596 Constant *C = ConstantFoldBinaryOpOperands(Opcode, Op0, Op1, DL);
1597 if (!C)
1598 return nullptr;
1599
1600 // Flush denormal output if needed.
1601 C = FlushFPConstant(C, I, /* IsOutput */ true);
1602 if (!C)
1603 return nullptr;
1604
1605 // The precise NaN value is non-deterministic.
1606 if (!AllowNonDeterministic && C->isNaN())
1607 return nullptr;
1608
1609 return C;
1610 }
1611 // If instruction lacks a parent/function and the denormal mode cannot be
1612 // determined, use the default (IEEE).
1613 return ConstantFoldBinaryOpOperands(Opcode, LHS, RHS, DL);
1614}
1615
1617 Type *DestTy, const DataLayout &DL) {
1618 assert(Instruction::isCast(Opcode));
1619
1620 if (auto *CE = dyn_cast<ConstantExpr>(C))
1621 if (CE->isCast())
1622 if (unsigned NewOp = CastInst::isEliminableCastPair(
1623 Instruction::CastOps(CE->getOpcode()),
1624 Instruction::CastOps(Opcode), CE->getOperand(0)->getType(),
1625 C->getType(), DestTy, &DL))
1626 return ConstantFoldCastOperand(NewOp, CE->getOperand(0), DestTy, DL);
1627
1628 switch (Opcode) {
1629 default:
1630 llvm_unreachable("Missing case");
1631 case Instruction::PtrToAddr:
1632 case Instruction::PtrToInt:
1633 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1634 Constant *FoldedValue = nullptr;
1635 // If the input is an inttoptr, eliminate the pair. This requires knowing
1636 // the width of a pointer, so it can't be done in ConstantExpr::getCast.
1637 if (CE->getOpcode() == Instruction::IntToPtr) {
1638 // zext/trunc the inttoptr to pointer/address size.
1639 Type *MidTy = Opcode == Instruction::PtrToInt
1640 ? DL.getAddressType(CE->getType())
1641 : DL.getIntPtrType(CE->getType());
1642 FoldedValue = ConstantFoldIntegerCast(CE->getOperand(0), MidTy,
1643 /*IsSigned=*/false, DL);
1644 } else if (auto *GEP = dyn_cast<GEPOperator>(CE)) {
1645 // If we have GEP, we can perform the following folds:
1646 // (ptrtoint/ptrtoaddr (gep null, x)) -> x
1647 // (ptrtoint/ptrtoaddr (gep (gep null, x), y) -> x + y, etc.
1648 unsigned BitWidth = DL.getIndexTypeSizeInBits(GEP->getType());
1649 APInt BaseOffset(BitWidth, 0);
1650 auto *Base = cast<Constant>(GEP->stripAndAccumulateConstantOffsets(
1651 DL, BaseOffset, /*AllowNonInbounds=*/true));
1652 if (Base->isNullValue()) {
1653 FoldedValue = ConstantInt::get(CE->getContext(), BaseOffset);
1654 } else {
1655 // ptrtoint/ptrtoaddr (gep i8, Ptr, (sub 0, V))
1656 // -> sub (ptrtoint/ptrtoaddr Ptr), V
1657 if (GEP->getNumIndices() == 1 &&
1658 GEP->getSourceElementType()->isIntegerTy(8)) {
1659 auto *Ptr = cast<Constant>(GEP->getPointerOperand());
1660 auto *Sub = dyn_cast<ConstantExpr>(GEP->getOperand(1));
1661 Type *IntIdxTy = DL.getIndexType(Ptr->getType());
1662 if (Sub && Sub->getType() == IntIdxTy &&
1663 Sub->getOpcode() == Instruction::Sub &&
1664 Sub->getOperand(0)->isNullValue())
1665 FoldedValue = ConstantExpr::getSub(
1666 ConstantExpr::getCast(Opcode, Ptr, IntIdxTy),
1667 Sub->getOperand(1));
1668 }
1669 }
1670 }
1671 if (FoldedValue) {
1672 // Do a zext or trunc to get to the ptrtoint/ptrtoaddr dest size.
1673 return ConstantFoldIntegerCast(FoldedValue, DestTy, /*IsSigned=*/false,
1674 DL);
1675 }
1676 }
1677 break;
1678 case Instruction::IntToPtr:
1679 // If the input is a ptrtoint, turn the pair into a ptr to ptr bitcast if
1680 // the int size is >= the ptr size and the address spaces are the same.
1681 // This requires knowing the width of a pointer, so it can't be done in
1682 // ConstantExpr::getCast.
1683 if (auto *CE = dyn_cast<ConstantExpr>(C)) {
1684 if (CE->getOpcode() == Instruction::PtrToInt) {
1685 Constant *SrcPtr = CE->getOperand(0);
1686 unsigned SrcPtrSize = DL.getPointerTypeSizeInBits(SrcPtr->getType());
1687 unsigned MidIntSize = CE->getType()->getScalarSizeInBits();
1688
1689 if (MidIntSize >= SrcPtrSize) {
1690 unsigned SrcAS = SrcPtr->getType()->getPointerAddressSpace();
1691 if (SrcAS == DestTy->getPointerAddressSpace())
1692 return FoldBitCast(CE->getOperand(0), DestTy, DL);
1693 }
1694 }
1695 }
1696 break;
1697 case Instruction::Trunc:
1698 case Instruction::ZExt:
1699 case Instruction::SExt:
1700 case Instruction::FPTrunc:
1701 case Instruction::FPExt:
1702 case Instruction::UIToFP:
1703 case Instruction::SIToFP:
1704 case Instruction::FPToUI:
1705 case Instruction::FPToSI:
1706 case Instruction::AddrSpaceCast:
1707 break;
1708 case Instruction::BitCast:
1709 return FoldBitCast(C, DestTy, DL);
1710 }
1711
1713 return ConstantExpr::getCast(Opcode, C, DestTy);
1714 return ConstantFoldCastInstruction(Opcode, C, DestTy);
1715}
1716
1718 bool IsSigned, const DataLayout &DL) {
1719 Type *SrcTy = C->getType();
1720 if (SrcTy == DestTy)
1721 return C;
1722 if (SrcTy->getScalarSizeInBits() > DestTy->getScalarSizeInBits())
1723 return ConstantFoldCastOperand(Instruction::Trunc, C, DestTy, DL);
1724 if (IsSigned)
1725 return ConstantFoldCastOperand(Instruction::SExt, C, DestTy, DL);
1726 return ConstantFoldCastOperand(Instruction::ZExt, C, DestTy, DL);
1727}
1728
1729//===----------------------------------------------------------------------===//
1730// Constant Folding for Calls
1731//
1732
1734 if (Call->isNoBuiltin())
1735 return false;
1736 if (Call->getFunctionType() != F->getFunctionType())
1737 return false;
1738
1739 // Allow FP calls (both libcalls and intrinsics) to avoid being folded.
1740 // This can be useful for GPU targets or in cross-compilation scenarios
1741 // when the exact target FP behaviour is required, and the host compiler's
1742 // behaviour may be slightly different from the device's run-time behaviour.
1743 if (DisableFPCallFolding && (F->getReturnType()->isFloatingPointTy() ||
1744 any_of(F->args(), [](const Argument &Arg) {
1745 return Arg.getType()->isFloatingPointTy();
1746 })))
1747 return false;
1748
1749 switch (F->getIntrinsicID()) {
1750 // Operations that do not operate floating-point numbers and do not depend on
1751 // FP environment can be folded even in strictfp functions.
1752 case Intrinsic::bswap:
1753 case Intrinsic::ctpop:
1754 case Intrinsic::ctlz:
1755 case Intrinsic::cttz:
1756 case Intrinsic::fshl:
1757 case Intrinsic::fshr:
1758 case Intrinsic::clmul:
1759 case Intrinsic::pdep:
1760 case Intrinsic::pext:
1761 case Intrinsic::launder_invariant_group:
1762 case Intrinsic::strip_invariant_group:
1763 case Intrinsic::masked_load:
1764 case Intrinsic::get_active_lane_mask:
1765 case Intrinsic::abs:
1766 case Intrinsic::smax:
1767 case Intrinsic::smin:
1768 case Intrinsic::umax:
1769 case Intrinsic::umin:
1770 case Intrinsic::scmp:
1771 case Intrinsic::ucmp:
1772 case Intrinsic::sadd_with_overflow:
1773 case Intrinsic::uadd_with_overflow:
1774 case Intrinsic::ssub_with_overflow:
1775 case Intrinsic::usub_with_overflow:
1776 case Intrinsic::smul_with_overflow:
1777 case Intrinsic::umul_with_overflow:
1778 case Intrinsic::sadd_sat:
1779 case Intrinsic::uadd_sat:
1780 case Intrinsic::ssub_sat:
1781 case Intrinsic::usub_sat:
1782 case Intrinsic::smul_fix:
1783 case Intrinsic::smul_fix_sat:
1784 case Intrinsic::bitreverse:
1785 case Intrinsic::is_constant:
1786 case Intrinsic::vector_reduce_add:
1787 case Intrinsic::vector_reduce_mul:
1788 case Intrinsic::vector_reduce_and:
1789 case Intrinsic::vector_reduce_or:
1790 case Intrinsic::vector_reduce_xor:
1791 case Intrinsic::vector_reduce_smin:
1792 case Intrinsic::vector_reduce_smax:
1793 case Intrinsic::vector_reduce_umin:
1794 case Intrinsic::vector_reduce_umax:
1795 case Intrinsic::vector_extract:
1796 case Intrinsic::vector_insert:
1797 case Intrinsic::vector_interleave2:
1798 case Intrinsic::vector_interleave3:
1799 case Intrinsic::vector_interleave4:
1800 case Intrinsic::vector_interleave5:
1801 case Intrinsic::vector_interleave6:
1802 case Intrinsic::vector_interleave7:
1803 case Intrinsic::vector_interleave8:
1804 case Intrinsic::vector_deinterleave2:
1805 case Intrinsic::vector_deinterleave3:
1806 case Intrinsic::vector_deinterleave4:
1807 case Intrinsic::vector_deinterleave5:
1808 case Intrinsic::vector_deinterleave6:
1809 case Intrinsic::vector_deinterleave7:
1810 case Intrinsic::vector_deinterleave8:
1811 // Target intrinsics
1812 case Intrinsic::amdgcn_perm:
1813 case Intrinsic::amdgcn_wave_reduce_umin:
1814 case Intrinsic::amdgcn_wave_reduce_umax:
1815 case Intrinsic::amdgcn_wave_reduce_max:
1816 case Intrinsic::amdgcn_wave_reduce_min:
1817 case Intrinsic::amdgcn_wave_reduce_and:
1818 case Intrinsic::amdgcn_wave_reduce_or:
1819 case Intrinsic::amdgcn_s_wqm:
1820 case Intrinsic::amdgcn_s_quadmask:
1821 case Intrinsic::amdgcn_s_bitreplicate:
1822 case Intrinsic::arm_mve_vctp8:
1823 case Intrinsic::arm_mve_vctp16:
1824 case Intrinsic::arm_mve_vctp32:
1825 case Intrinsic::arm_mve_vctp64:
1826 case Intrinsic::aarch64_sve_convert_from_svbool:
1827 case Intrinsic::wasm_alltrue:
1828 case Intrinsic::wasm_anytrue:
1829 case Intrinsic::wasm_dot:
1830 // WebAssembly float semantics are always known
1831 case Intrinsic::wasm_trunc_signed:
1832 case Intrinsic::wasm_trunc_unsigned:
1833 return true;
1834
1835 // Floating point operations cannot be folded in strictfp functions in
1836 // general case. They can be folded if FP environment is known to compiler.
1837 case Intrinsic::minnum:
1838 case Intrinsic::maxnum:
1839 case Intrinsic::minimum:
1840 case Intrinsic::maximum:
1841 case Intrinsic::minimumnum:
1842 case Intrinsic::maximumnum:
1843 case Intrinsic::log:
1844 case Intrinsic::log2:
1845 case Intrinsic::log10:
1846 case Intrinsic::exp:
1847 case Intrinsic::exp2:
1848 case Intrinsic::exp10:
1849 case Intrinsic::sqrt:
1850 case Intrinsic::sin:
1851 case Intrinsic::cos:
1852 case Intrinsic::sincos:
1853 case Intrinsic::sinh:
1854 case Intrinsic::cosh:
1855 case Intrinsic::atan:
1856 case Intrinsic::pow:
1857 case Intrinsic::powi:
1858 case Intrinsic::ldexp:
1859 case Intrinsic::fma:
1860 case Intrinsic::fmuladd:
1861 case Intrinsic::frexp:
1862 case Intrinsic::fptoui_sat:
1863 case Intrinsic::fptosi_sat:
1864 case Intrinsic::amdgcn_cos:
1865 case Intrinsic::amdgcn_cubeid:
1866 case Intrinsic::amdgcn_cubema:
1867 case Intrinsic::amdgcn_cubesc:
1868 case Intrinsic::amdgcn_cubetc:
1869 case Intrinsic::amdgcn_fmul_legacy:
1870 case Intrinsic::amdgcn_fma_legacy:
1871 case Intrinsic::amdgcn_fract:
1872 case Intrinsic::amdgcn_sin:
1873 // The intrinsics below depend on rounding mode in MXCSR.
1874 case Intrinsic::x86_sse_cvtss2si:
1875 case Intrinsic::x86_sse_cvtss2si64:
1876 case Intrinsic::x86_sse_cvttss2si:
1877 case Intrinsic::x86_sse_cvttss2si64:
1878 case Intrinsic::x86_sse2_cvtsd2si:
1879 case Intrinsic::x86_sse2_cvtsd2si64:
1880 case Intrinsic::x86_sse2_cvttsd2si:
1881 case Intrinsic::x86_sse2_cvttsd2si64:
1882 case Intrinsic::x86_avx512_vcvtss2si32:
1883 case Intrinsic::x86_avx512_vcvtss2si64:
1884 case Intrinsic::x86_avx512_cvttss2si:
1885 case Intrinsic::x86_avx512_cvttss2si64:
1886 case Intrinsic::x86_avx512_vcvtsd2si32:
1887 case Intrinsic::x86_avx512_vcvtsd2si64:
1888 case Intrinsic::x86_avx512_cvttsd2si:
1889 case Intrinsic::x86_avx512_cvttsd2si64:
1890 case Intrinsic::x86_avx512_vcvtss2usi32:
1891 case Intrinsic::x86_avx512_vcvtss2usi64:
1892 case Intrinsic::x86_avx512_cvttss2usi:
1893 case Intrinsic::x86_avx512_cvttss2usi64:
1894 case Intrinsic::x86_avx512_vcvtsd2usi32:
1895 case Intrinsic::x86_avx512_vcvtsd2usi64:
1896 case Intrinsic::x86_avx512_cvttsd2usi:
1897 case Intrinsic::x86_avx512_cvttsd2usi64:
1898
1899 // NVVM FMax intrinsics
1900 case Intrinsic::nvvm_fmax_d:
1901 case Intrinsic::nvvm_fmax_f:
1902 case Intrinsic::nvvm_fmax_ftz_f:
1903 case Intrinsic::nvvm_fmax_ftz_nan_f:
1904 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
1905 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
1906 case Intrinsic::nvvm_fmax_nan_f:
1907 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
1908 case Intrinsic::nvvm_fmax_xorsign_abs_f:
1909
1910 // NVVM FMin intrinsics
1911 case Intrinsic::nvvm_fmin_d:
1912 case Intrinsic::nvvm_fmin_f:
1913 case Intrinsic::nvvm_fmin_ftz_f:
1914 case Intrinsic::nvvm_fmin_ftz_nan_f:
1915 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
1916 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
1917 case Intrinsic::nvvm_fmin_nan_f:
1918 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
1919 case Intrinsic::nvvm_fmin_xorsign_abs_f:
1920
1921 // NVVM float/double to int32/uint32 conversion intrinsics
1922 case Intrinsic::nvvm_f2i_rm:
1923 case Intrinsic::nvvm_f2i_rn:
1924 case Intrinsic::nvvm_f2i_rp:
1925 case Intrinsic::nvvm_f2i_rz:
1926 case Intrinsic::nvvm_f2i_rm_ftz:
1927 case Intrinsic::nvvm_f2i_rn_ftz:
1928 case Intrinsic::nvvm_f2i_rp_ftz:
1929 case Intrinsic::nvvm_f2i_rz_ftz:
1930 case Intrinsic::nvvm_f2ui_rm:
1931 case Intrinsic::nvvm_f2ui_rn:
1932 case Intrinsic::nvvm_f2ui_rp:
1933 case Intrinsic::nvvm_f2ui_rz:
1934 case Intrinsic::nvvm_f2ui_rm_ftz:
1935 case Intrinsic::nvvm_f2ui_rn_ftz:
1936 case Intrinsic::nvvm_f2ui_rp_ftz:
1937 case Intrinsic::nvvm_f2ui_rz_ftz:
1938 case Intrinsic::nvvm_d2i_rm:
1939 case Intrinsic::nvvm_d2i_rn:
1940 case Intrinsic::nvvm_d2i_rp:
1941 case Intrinsic::nvvm_d2i_rz:
1942 case Intrinsic::nvvm_d2ui_rm:
1943 case Intrinsic::nvvm_d2ui_rn:
1944 case Intrinsic::nvvm_d2ui_rp:
1945 case Intrinsic::nvvm_d2ui_rz:
1946
1947 // NVVM float/double to int64/uint64 conversion intrinsics
1948 case Intrinsic::nvvm_f2ll_rm:
1949 case Intrinsic::nvvm_f2ll_rn:
1950 case Intrinsic::nvvm_f2ll_rp:
1951 case Intrinsic::nvvm_f2ll_rz:
1952 case Intrinsic::nvvm_f2ll_rm_ftz:
1953 case Intrinsic::nvvm_f2ll_rn_ftz:
1954 case Intrinsic::nvvm_f2ll_rp_ftz:
1955 case Intrinsic::nvvm_f2ll_rz_ftz:
1956 case Intrinsic::nvvm_f2ull_rm:
1957 case Intrinsic::nvvm_f2ull_rn:
1958 case Intrinsic::nvvm_f2ull_rp:
1959 case Intrinsic::nvvm_f2ull_rz:
1960 case Intrinsic::nvvm_f2ull_rm_ftz:
1961 case Intrinsic::nvvm_f2ull_rn_ftz:
1962 case Intrinsic::nvvm_f2ull_rp_ftz:
1963 case Intrinsic::nvvm_f2ull_rz_ftz:
1964 case Intrinsic::nvvm_d2ll_rm:
1965 case Intrinsic::nvvm_d2ll_rn:
1966 case Intrinsic::nvvm_d2ll_rp:
1967 case Intrinsic::nvvm_d2ll_rz:
1968 case Intrinsic::nvvm_d2ull_rm:
1969 case Intrinsic::nvvm_d2ull_rn:
1970 case Intrinsic::nvvm_d2ull_rp:
1971 case Intrinsic::nvvm_d2ull_rz:
1972
1973 // NVVM math intrinsics:
1974 case Intrinsic::nvvm_ceil_d:
1975 case Intrinsic::nvvm_ceil_f:
1976 case Intrinsic::nvvm_ceil_ftz_f:
1977
1978 case Intrinsic::nvvm_fabs:
1979 case Intrinsic::nvvm_fabs_ftz:
1980
1981 case Intrinsic::nvvm_floor_d:
1982 case Intrinsic::nvvm_floor_f:
1983 case Intrinsic::nvvm_floor_ftz_f:
1984
1985 case Intrinsic::nvvm_rcp_rm_d:
1986 case Intrinsic::nvvm_rcp_rm_f:
1987 case Intrinsic::nvvm_rcp_rm_ftz_f:
1988 case Intrinsic::nvvm_rcp_rn_d:
1989 case Intrinsic::nvvm_rcp_rn_f:
1990 case Intrinsic::nvvm_rcp_rn_ftz_f:
1991 case Intrinsic::nvvm_rcp_rp_d:
1992 case Intrinsic::nvvm_rcp_rp_f:
1993 case Intrinsic::nvvm_rcp_rp_ftz_f:
1994 case Intrinsic::nvvm_rcp_rz_d:
1995 case Intrinsic::nvvm_rcp_rz_f:
1996 case Intrinsic::nvvm_rcp_rz_ftz_f:
1997
1998 case Intrinsic::nvvm_round_d:
1999 case Intrinsic::nvvm_round_f:
2000 case Intrinsic::nvvm_round_ftz_f:
2001
2002 case Intrinsic::nvvm_saturate_d:
2003 case Intrinsic::nvvm_saturate_f:
2004 case Intrinsic::nvvm_saturate_ftz_f:
2005
2006 case Intrinsic::nvvm_sqrt_f:
2007 case Intrinsic::nvvm_sqrt_rn_d:
2008 case Intrinsic::nvvm_sqrt_rn_f:
2009 case Intrinsic::nvvm_sqrt_rn_ftz_f:
2010 return !Call->isStrictFP();
2011
2012 // NVVM add intrinsics with explicit rounding modes
2013 case Intrinsic::nvvm_add_rm_d:
2014 case Intrinsic::nvvm_add_rn_d:
2015 case Intrinsic::nvvm_add_rp_d:
2016 case Intrinsic::nvvm_add_rz_d:
2017 case Intrinsic::nvvm_add_rm_f:
2018 case Intrinsic::nvvm_add_rn_f:
2019 case Intrinsic::nvvm_add_rp_f:
2020 case Intrinsic::nvvm_add_rz_f:
2021 case Intrinsic::nvvm_add_rm_ftz_f:
2022 case Intrinsic::nvvm_add_rn_ftz_f:
2023 case Intrinsic::nvvm_add_rp_ftz_f:
2024 case Intrinsic::nvvm_add_rz_ftz_f:
2025
2026 // NVVM div intrinsics with explicit rounding modes
2027 case Intrinsic::nvvm_div_rm_d:
2028 case Intrinsic::nvvm_div_rn_d:
2029 case Intrinsic::nvvm_div_rp_d:
2030 case Intrinsic::nvvm_div_rz_d:
2031 case Intrinsic::nvvm_div_rm_f:
2032 case Intrinsic::nvvm_div_rn_f:
2033 case Intrinsic::nvvm_div_rp_f:
2034 case Intrinsic::nvvm_div_rz_f:
2035 case Intrinsic::nvvm_div_rm_ftz_f:
2036 case Intrinsic::nvvm_div_rn_ftz_f:
2037 case Intrinsic::nvvm_div_rp_ftz_f:
2038 case Intrinsic::nvvm_div_rz_ftz_f:
2039
2040 // NVVM mul intrinsics with explicit rounding modes
2041 case Intrinsic::nvvm_mul_rm_d:
2042 case Intrinsic::nvvm_mul_rn_d:
2043 case Intrinsic::nvvm_mul_rp_d:
2044 case Intrinsic::nvvm_mul_rz_d:
2045 case Intrinsic::nvvm_mul_rm_f:
2046 case Intrinsic::nvvm_mul_rn_f:
2047 case Intrinsic::nvvm_mul_rp_f:
2048 case Intrinsic::nvvm_mul_rz_f:
2049 case Intrinsic::nvvm_mul_rm_ftz_f:
2050 case Intrinsic::nvvm_mul_rn_ftz_f:
2051 case Intrinsic::nvvm_mul_rp_ftz_f:
2052 case Intrinsic::nvvm_mul_rz_ftz_f:
2053
2054 // NVVM fma intrinsics with explicit rounding modes
2055 case Intrinsic::nvvm_fma_rm_d:
2056 case Intrinsic::nvvm_fma_rn_d:
2057 case Intrinsic::nvvm_fma_rp_d:
2058 case Intrinsic::nvvm_fma_rz_d:
2059 case Intrinsic::nvvm_fma_rm_f:
2060 case Intrinsic::nvvm_fma_rn_f:
2061 case Intrinsic::nvvm_fma_rp_f:
2062 case Intrinsic::nvvm_fma_rz_f:
2063 case Intrinsic::nvvm_fma_rm_ftz_f:
2064 case Intrinsic::nvvm_fma_rn_ftz_f:
2065 case Intrinsic::nvvm_fma_rp_ftz_f:
2066 case Intrinsic::nvvm_fma_rz_ftz_f:
2067
2068 // Sign operations are actually bitwise operations, they do not raise
2069 // exceptions even for SNANs.
2070 case Intrinsic::fabs:
2071 case Intrinsic::copysign:
2072 case Intrinsic::is_fpclass:
2073 // Non-constrained variants of rounding operations means default FP
2074 // environment, they can be folded in any case.
2075 case Intrinsic::ceil:
2076 case Intrinsic::floor:
2077 case Intrinsic::round:
2078 case Intrinsic::roundeven:
2079 case Intrinsic::trunc:
2080 case Intrinsic::nearbyint:
2081 case Intrinsic::rint:
2082 case Intrinsic::canonicalize:
2083
2084 // Constrained intrinsics can be folded if FP environment is known
2085 // to compiler.
2086 case Intrinsic::experimental_constrained_fma:
2087 case Intrinsic::experimental_constrained_fmuladd:
2088 case Intrinsic::experimental_constrained_fadd:
2089 case Intrinsic::experimental_constrained_fsub:
2090 case Intrinsic::experimental_constrained_fmul:
2091 case Intrinsic::experimental_constrained_fdiv:
2092 case Intrinsic::experimental_constrained_frem:
2093 case Intrinsic::experimental_constrained_ceil:
2094 case Intrinsic::experimental_constrained_floor:
2095 case Intrinsic::experimental_constrained_round:
2096 case Intrinsic::experimental_constrained_roundeven:
2097 case Intrinsic::experimental_constrained_trunc:
2098 case Intrinsic::experimental_constrained_nearbyint:
2099 case Intrinsic::experimental_constrained_rint:
2100 case Intrinsic::experimental_constrained_fcmp:
2101 case Intrinsic::experimental_constrained_fcmps:
2102
2103 case Intrinsic::experimental_cttz_elts:
2104 return true;
2105 default:
2106 return false;
2107 case Intrinsic::not_intrinsic: break;
2108 }
2109
2110 if (!F->hasName() || Call->isStrictFP())
2111 return false;
2112
2113 // In these cases, the check of the length is required. We don't want to
2114 // return true for a name like "cos\0blah" which strcmp would return equal to
2115 // "cos", but has length 8.
2116 StringRef Name = F->getName();
2117 switch (Name[0]) {
2118 default:
2119 return false;
2120 // clang-format off
2121 case 'a':
2122 return Name == "acos" || Name == "acosf" ||
2123 Name == "asin" || Name == "asinf" ||
2124 Name == "atan" || Name == "atanf" ||
2125 Name == "atan2" || Name == "atan2f";
2126 case 'c':
2127 return Name == "ceil" || Name == "ceilf" ||
2128 Name == "cos" || Name == "cosf" ||
2129 Name == "cosh" || Name == "coshf";
2130 case 'e':
2131 return Name == "exp" || Name == "expf" || Name == "exp2" ||
2132 Name == "exp2f" || Name == "erf" || Name == "erff";
2133 case 'f':
2134 return Name == "fabs" || Name == "fabsf" ||
2135 Name == "floor" || Name == "floorf" ||
2136 Name == "fmod" || Name == "fmodf";
2137 case 'i':
2138 return Name == "ilogb" || Name == "ilogbf";
2139 case 'l':
2140 return Name == "log" || Name == "logf" || Name == "logl" ||
2141 Name == "log2" || Name == "log2f" || Name == "log10" ||
2142 Name == "log10f" || Name == "logb" || Name == "logbf" ||
2143 Name == "log1p" || Name == "log1pf";
2144 case 'n':
2145 return Name == "nearbyint" || Name == "nearbyintf" || Name == "nextafter" ||
2146 Name == "nextafterf" || Name == "nexttoward" ||
2147 Name == "nexttowardf";
2148 case 'p':
2149 return Name == "pow" || Name == "powf";
2150 case 'r':
2151 return Name == "remainder" || Name == "remainderf" ||
2152 Name == "rint" || Name == "rintf" ||
2153 Name == "round" || Name == "roundf" ||
2154 Name == "roundeven" || Name == "roundevenf";
2155 case 's':
2156 return Name == "sin" || Name == "sinf" ||
2157 Name == "sinh" || Name == "sinhf" ||
2158 Name == "sqrt" || Name == "sqrtf";
2159 case 't':
2160 return Name == "tan" || Name == "tanf" ||
2161 Name == "tanh" || Name == "tanhf" ||
2162 Name == "trunc" || Name == "truncf";
2163 case '_':
2164 // Check for various function names that get used for the math functions
2165 // when the header files are preprocessed with the macro
2166 // __FINITE_MATH_ONLY__ enabled.
2167 // The '12' here is the length of the shortest name that can match.
2168 // We need to check the size before looking at Name[1] and Name[2]
2169 // so we may as well check a limit that will eliminate mismatches.
2170 if (Name.size() < 12 || Name[1] != '_')
2171 return false;
2172 switch (Name[2]) {
2173 default:
2174 return false;
2175 case 'a':
2176 return Name == "__acos_finite" || Name == "__acosf_finite" ||
2177 Name == "__asin_finite" || Name == "__asinf_finite" ||
2178 Name == "__atan2_finite" || Name == "__atan2f_finite";
2179 case 'c':
2180 return Name == "__cosh_finite" || Name == "__coshf_finite";
2181 case 'e':
2182 return Name == "__exp_finite" || Name == "__expf_finite" ||
2183 Name == "__exp2_finite" || Name == "__exp2f_finite";
2184 case 'l':
2185 return Name == "__log_finite" || Name == "__logf_finite" ||
2186 Name == "__log10_finite" || Name == "__log10f_finite";
2187 case 'p':
2188 return Name == "__pow_finite" || Name == "__powf_finite";
2189 case 's':
2190 return Name == "__sinh_finite" || Name == "__sinhf_finite";
2191 }
2192 // clang-format on
2193 }
2194}
2195
2196namespace {
2197
2198Constant *GetConstantFoldFPValue(double V, Type *Ty) {
2199 if (Ty->isHalfTy() || Ty->isFloatTy()) {
2200 APFloat APF(V);
2201 bool unused;
2202 APF.convert(Ty->getFltSemantics(), APFloat::rmNearestTiesToEven, &unused);
2203 return ConstantFP::get(Ty->getContext(), APF);
2204 }
2205 if (Ty->isDoubleTy())
2206 return ConstantFP::get(Ty->getContext(), APFloat(V));
2207 llvm_unreachable("Can only constant fold half/float/double");
2208}
2209
2210#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2211Constant *GetConstantFoldFPValue128(float128 V, Type *Ty) {
2212 if (Ty->isFP128Ty())
2213 return ConstantFP::get(Ty, V);
2214 llvm_unreachable("Can only constant fold fp128");
2215}
2216#endif
2217
2218/// Clear the floating-point exception state.
2219inline void llvm_fenv_clearexcept() {
2220#if HAVE_DECL_FE_ALL_EXCEPT
2221 feclearexcept(FE_ALL_EXCEPT);
2222#endif
2223 errno = 0;
2224}
2225
2226/// Test if a floating-point exception was raised.
2227inline bool llvm_fenv_testexcept() {
2228 int errno_val = errno;
2229 if (errno_val == ERANGE || errno_val == EDOM)
2230 return true;
2231#if HAVE_DECL_FE_ALL_EXCEPT && HAVE_DECL_FE_INEXACT
2232 if (fetestexcept(FE_ALL_EXCEPT & ~FE_INEXACT))
2233 return true;
2234#endif
2235 return false;
2236}
2237
2238static APFloat FTZPreserveSign(const APFloat &V) {
2239 if (V.isDenormal())
2240 return APFloat::getZero(V.getSemantics(), V.isNegative());
2241 return V;
2242}
2243
2244static APFloat FlushToPositiveZero(const APFloat &V) {
2245 if (V.isDenormal())
2246 return APFloat::getZero(V.getSemantics(), false);
2247 return V;
2248}
2249
2250static APFloat FlushWithDenormKind(const APFloat &V,
2251 DenormalMode::DenormalModeKind DenormKind) {
2254 switch (DenormKind) {
2256 return V;
2258 return FTZPreserveSign(V);
2260 return FlushToPositiveZero(V);
2261 default:
2262 llvm_unreachable("Invalid denormal mode!");
2263 }
2264}
2265
2266Constant *ConstantFoldFP(double (*NativeFP)(double), const APFloat &V, Type *Ty,
2267 DenormalMode DenormMode = DenormalMode::getIEEE()) {
2268 if (!DenormMode.isValid() ||
2269 DenormMode.Input == DenormalMode::DenormalModeKind::Dynamic ||
2270 DenormMode.Output == DenormalMode::DenormalModeKind::Dynamic)
2271 return nullptr;
2272
2273 llvm_fenv_clearexcept();
2274 auto Input = FlushWithDenormKind(V, DenormMode.Input);
2275 double Result = NativeFP(Input.convertToDouble());
2276 if (llvm_fenv_testexcept()) {
2277 llvm_fenv_clearexcept();
2278 return nullptr;
2279 }
2280
2281 Constant *Output = GetConstantFoldFPValue(Result, Ty);
2282 if (DenormMode.Output == DenormalMode::DenormalModeKind::IEEE)
2283 return Output;
2284 const auto *CFP = static_cast<ConstantFP *>(Output);
2285 const auto Res = FlushWithDenormKind(CFP->getValueAPF(), DenormMode.Output);
2286 return ConstantFP::get(Ty->getContext(), Res);
2287}
2288
2289#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2290Constant *ConstantFoldFP128(float128 (*NativeFP)(float128), const APFloat &V,
2291 Type *Ty) {
2292 llvm_fenv_clearexcept();
2293 float128 Result = NativeFP(V.convertToQuad());
2294 if (llvm_fenv_testexcept()) {
2295 llvm_fenv_clearexcept();
2296 return nullptr;
2297 }
2298
2299 return GetConstantFoldFPValue128(Result, Ty);
2300}
2301#endif
2302
2303Constant *ConstantFoldBinaryFP(double (*NativeFP)(double, double),
2304 const APFloat &V, const APFloat &W, Type *Ty) {
2305 llvm_fenv_clearexcept();
2306 double Result = NativeFP(V.convertToDouble(), W.convertToDouble());
2307 if (llvm_fenv_testexcept()) {
2308 llvm_fenv_clearexcept();
2309 return nullptr;
2310 }
2311
2312 return GetConstantFoldFPValue(Result, Ty);
2313}
2314
2315Constant *constantFoldVectorReduce(Intrinsic::ID IID, Constant *Op) {
2316 auto *OpVT = cast<VectorType>(Op->getType());
2317
2318 // This is the same as the underlying binops - poison propagates.
2319 if (Op->containsPoisonElement())
2320 return PoisonValue::get(OpVT->getElementType());
2321
2322 // Shortcut non-accumulating reductions.
2323 if (Constant *SplatVal = Op->getSplatValue()) {
2324 switch (IID) {
2325 case Intrinsic::vector_reduce_and:
2326 case Intrinsic::vector_reduce_or:
2327 case Intrinsic::vector_reduce_smin:
2328 case Intrinsic::vector_reduce_smax:
2329 case Intrinsic::vector_reduce_umin:
2330 case Intrinsic::vector_reduce_umax:
2331 return SplatVal;
2332 case Intrinsic::vector_reduce_add:
2333 if (SplatVal->isNullValue())
2334 return SplatVal;
2335 break;
2336 case Intrinsic::vector_reduce_mul:
2337 if (SplatVal->isNullValue() || SplatVal->isOneValue())
2338 return SplatVal;
2339 break;
2340 case Intrinsic::vector_reduce_xor:
2341 if (SplatVal->isNullValue())
2342 return SplatVal;
2343 if (OpVT->getElementCount().isKnownMultipleOf(2))
2344 return Constant::getNullValue(OpVT->getElementType());
2345 break;
2346 }
2347 }
2348
2350 if (!VT)
2351 return nullptr;
2352
2353 // TODO: Handle undef.
2354 auto *EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(0U));
2355 if (!EltC)
2356 return nullptr;
2357
2358 APInt Acc = EltC->getValue();
2359 for (unsigned I = 1, E = VT->getNumElements(); I != E; I++) {
2360 if (!(EltC = dyn_cast_or_null<ConstantInt>(Op->getAggregateElement(I))))
2361 return nullptr;
2362 const APInt &X = EltC->getValue();
2363 switch (IID) {
2364 case Intrinsic::vector_reduce_add:
2365 Acc = Acc + X;
2366 break;
2367 case Intrinsic::vector_reduce_mul:
2368 Acc = Acc * X;
2369 break;
2370 case Intrinsic::vector_reduce_and:
2371 Acc = Acc & X;
2372 break;
2373 case Intrinsic::vector_reduce_or:
2374 Acc = Acc | X;
2375 break;
2376 case Intrinsic::vector_reduce_xor:
2377 Acc = Acc ^ X;
2378 break;
2379 case Intrinsic::vector_reduce_smin:
2380 Acc = APIntOps::smin(Acc, X);
2381 break;
2382 case Intrinsic::vector_reduce_smax:
2383 Acc = APIntOps::smax(Acc, X);
2384 break;
2385 case Intrinsic::vector_reduce_umin:
2386 Acc = APIntOps::umin(Acc, X);
2387 break;
2388 case Intrinsic::vector_reduce_umax:
2389 Acc = APIntOps::umax(Acc, X);
2390 break;
2391 }
2392 }
2393
2394 return ConstantInt::get(Op->getContext(), Acc);
2395}
2396
2397/// Attempt to fold an SSE floating point to integer conversion of a constant
2398/// floating point. If roundTowardZero is false, the default IEEE rounding is
2399/// used (toward nearest, ties to even). This matches the behavior of the
2400/// non-truncating SSE instructions in the default rounding mode. The desired
2401/// integer type Ty is used to select how many bits are available for the
2402/// result. Returns null if the conversion cannot be performed, otherwise
2403/// returns the Constant value resulting from the conversion.
2404Constant *ConstantFoldSSEConvertToInt(const APFloat &Val, bool roundTowardZero,
2405 Type *Ty, bool IsSigned) {
2406 // All of these conversion intrinsics form an integer of at most 64bits.
2407 unsigned ResultWidth = Ty->getIntegerBitWidth();
2408 assert(ResultWidth <= 64 &&
2409 "Can only constant fold conversions to 64 and 32 bit ints");
2410
2411 uint64_t UIntVal;
2412 bool isExact = false;
2416 Val.convertToInteger(MutableArrayRef(UIntVal), ResultWidth,
2417 IsSigned, mode, &isExact);
2418 if (status != APFloat::opOK &&
2419 (!roundTowardZero || status != APFloat::opInexact))
2420 return nullptr;
2421 return ConstantInt::get(Ty, UIntVal, IsSigned);
2422}
2423
2424double getValueAsDouble(ConstantFP *Op) {
2425 Type *Ty = Op->getType();
2426
2427 if (Ty->isBFloatTy() || Ty->isHalfTy() || Ty->isFloatTy() || Ty->isDoubleTy())
2428 return Op->getValueAPF().convertToDouble();
2429
2430 bool unused;
2431 APFloat APF = Op->getValueAPF();
2433 return APF.convertToDouble();
2434}
2435
2436static bool getConstIntOrUndef(Value *Op, const APInt *&C) {
2437 if (auto *CI = dyn_cast<ConstantInt>(Op)) {
2438 C = &CI->getValue();
2439 return true;
2440 }
2441 if (isa<UndefValue>(Op)) {
2442 C = nullptr;
2443 return true;
2444 }
2445 return false;
2446}
2447
2448/// Checks if the given intrinsic call, which evaluates to constant, is allowed
2449/// to be folded.
2450///
2451/// \param CI Constrained intrinsic call.
2452/// \param St Exception flags raised during constant evaluation.
2453static bool mayFoldConstrained(ConstrainedFPIntrinsic *CI,
2454 APFloat::opStatus St) {
2455 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2456 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2457
2458 // If the operation does not change exception status flags, it is safe
2459 // to fold.
2460 if (St == APFloat::opStatus::opOK)
2461 return true;
2462
2463 // If evaluation raised FP exception, the result can depend on rounding
2464 // mode. If the latter is unknown, folding is not possible.
2465 if (ORM == RoundingMode::Dynamic)
2466 return false;
2467
2468 // If FP exceptions are ignored, fold the call, even if such exception is
2469 // raised.
2470 if (EB && *EB != fp::ExceptionBehavior::ebStrict)
2471 return true;
2472
2473 // Leave the calculation for runtime so that exception flags be correctly set
2474 // in hardware.
2475 return false;
2476}
2477
2478/// Returns the rounding mode that should be used for constant evaluation.
2479static RoundingMode
2480getEvaluationRoundingMode(const ConstrainedFPIntrinsic *CI) {
2481 std::optional<RoundingMode> ORM = CI->getRoundingMode();
2482 if (!ORM || *ORM == RoundingMode::Dynamic)
2483 // Even if the rounding mode is unknown, try evaluating the operation.
2484 // If it does not raise inexact exception, rounding was not applied,
2485 // so the result is exact and does not depend on rounding mode. Whether
2486 // other FP exceptions are raised, it does not depend on rounding mode.
2488 return *ORM;
2489}
2490
2491/// Try to constant fold llvm.canonicalize for the given caller and value.
2492static Constant *constantFoldCanonicalize(const Type *Ty, const CallBase *CI,
2493 const APFloat &Src) {
2494 // Zero, positive and negative, is always OK to fold.
2495 if (Src.isZero()) {
2496 // Get a fresh 0, since ppc_fp128 does have non-canonical zeros.
2497 return ConstantFP::get(
2498 CI->getContext(),
2499 APFloat::getZero(Src.getSemantics(), Src.isNegative()));
2500 }
2501
2502 if (!Ty->isIEEELikeFPTy())
2503 return nullptr;
2504
2505 // Zero is always canonical and the sign must be preserved.
2506 //
2507 // Denorms and nans may have special encodings, but it should be OK to fold a
2508 // totally average number.
2509 if (Src.isNormal() || Src.isInfinity())
2510 return ConstantFP::get(CI->getContext(), Src);
2511
2512 if (Src.isDenormal() && CI->getParent() && CI->getFunction()) {
2513 DenormalMode DenormMode =
2514 CI->getFunction()->getDenormalMode(Src.getSemantics());
2515
2516 if (DenormMode == DenormalMode::getIEEE())
2517 return ConstantFP::get(CI->getContext(), Src);
2518
2519 if (DenormMode.Input == DenormalMode::Dynamic)
2520 return nullptr;
2521
2522 // If we know if either input or output is flushed, we can fold.
2523 if ((DenormMode.Input == DenormalMode::Dynamic &&
2524 DenormMode.Output == DenormalMode::IEEE) ||
2525 (DenormMode.Input == DenormalMode::IEEE &&
2526 DenormMode.Output == DenormalMode::Dynamic))
2527 return nullptr;
2528
2529 bool IsPositive =
2530 (!Src.isNegative() || DenormMode.Input == DenormalMode::PositiveZero ||
2531 (DenormMode.Output == DenormalMode::PositiveZero &&
2532 DenormMode.Input == DenormalMode::IEEE));
2533
2534 return ConstantFP::get(CI->getContext(),
2535 APFloat::getZero(Src.getSemantics(), !IsPositive));
2536 }
2537
2538 return nullptr;
2539}
2540
2541static Constant *ConstantFoldScalarCall1(StringRef Name,
2542 Intrinsic::ID IntrinsicID,
2543 Type *Ty,
2544 ArrayRef<Constant *> Operands,
2545 const TargetLibraryInfo *TLI,
2546 const CallBase *Call) {
2547 assert(Operands.size() == 1 && "Wrong number of operands.");
2548
2549 if (IntrinsicID == Intrinsic::is_constant) {
2550 // We know we have a "Constant" argument. But we want to only
2551 // return true for manifest constants, not those that depend on
2552 // constants with unknowable values, e.g. GlobalValue or BlockAddress.
2553 if (Operands[0]->isManifestConstant())
2554 return ConstantInt::getTrue(Ty->getContext());
2555 return nullptr;
2556 }
2557
2558 if (isa<UndefValue>(Operands[0])) {
2559 // cosine(arg) is between -1 and 1. cosine(invalid arg) is NaN.
2560 // ctpop() is between 0 and bitwidth, pick 0 for undef.
2561 // fptoui.sat and fptosi.sat can always fold to zero (for a zero input).
2562 if (IntrinsicID == Intrinsic::cos ||
2563 IntrinsicID == Intrinsic::ctpop ||
2564 IntrinsicID == Intrinsic::fptoui_sat ||
2565 IntrinsicID == Intrinsic::fptosi_sat ||
2566 IntrinsicID == Intrinsic::canonicalize)
2567 return Constant::getNullValue(Ty);
2568 if (IntrinsicID == Intrinsic::bswap ||
2569 IntrinsicID == Intrinsic::bitreverse ||
2570 IntrinsicID == Intrinsic::launder_invariant_group ||
2571 IntrinsicID == Intrinsic::strip_invariant_group)
2572 return Operands[0];
2573 }
2574
2575 if (isa<ConstantPointerNull>(Operands[0])) {
2576 // launder(null) == null == strip(null) iff in addrspace 0
2577 if (IntrinsicID == Intrinsic::launder_invariant_group ||
2578 IntrinsicID == Intrinsic::strip_invariant_group) {
2579 // If instruction is not yet put in a basic block (e.g. when cloning
2580 // a function during inlining), Call's caller may not be available.
2581 // So check Call's BB first before querying Call->getCaller.
2582 const Function *Caller =
2583 Call->getParent() ? Call->getCaller() : nullptr;
2584 if (Caller &&
2586 Caller, Operands[0]->getType()->getPointerAddressSpace())) {
2587 return Operands[0];
2588 }
2589 return nullptr;
2590 }
2591 }
2592
2593 if (auto *Op = dyn_cast<ConstantFP>(Operands[0])) {
2594 APFloat U = Op->getValueAPF();
2595
2596 if (IntrinsicID == Intrinsic::wasm_trunc_signed ||
2597 IntrinsicID == Intrinsic::wasm_trunc_unsigned) {
2598 bool Signed = IntrinsicID == Intrinsic::wasm_trunc_signed;
2599
2600 if (U.isNaN())
2601 return nullptr;
2602
2603 unsigned Width = Ty->getIntegerBitWidth();
2604 APSInt Int(Width, !Signed);
2605 bool IsExact = false;
2607 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2608
2610 return ConstantInt::get(Ty, Int);
2611
2612 return nullptr;
2613 }
2614
2615 if (IntrinsicID == Intrinsic::fptoui_sat ||
2616 IntrinsicID == Intrinsic::fptosi_sat) {
2617 // convertToInteger() already has the desired saturation semantics.
2618 APSInt Int(Ty->getIntegerBitWidth(),
2619 IntrinsicID == Intrinsic::fptoui_sat);
2620 bool IsExact;
2621 U.convertToInteger(Int, APFloat::rmTowardZero, &IsExact);
2622 return ConstantInt::get(Ty, Int);
2623 }
2624
2625 if (IntrinsicID == Intrinsic::canonicalize)
2626 return constantFoldCanonicalize(Ty, Call, U);
2627
2628#if defined(HAS_IEE754_FLOAT128) && defined(HAS_LOGF128)
2629 if (Ty->isFP128Ty()) {
2630 if (IntrinsicID == Intrinsic::log) {
2631 float128 Result = logf128(Op->getValueAPF().convertToQuad());
2632 return GetConstantFoldFPValue128(Result, Ty);
2633 }
2634
2635 LibFunc Fp128Func = NotLibFunc;
2636 if (TLI && TLI->getLibFunc(Name, Fp128Func) && TLI->has(Fp128Func) &&
2637 Fp128Func == LibFunc_logl)
2638 return ConstantFoldFP128(logf128, Op->getValueAPF(), Ty);
2639 }
2640#endif
2641
2642 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy() &&
2643 !Ty->isIntegerTy())
2644 return nullptr;
2645
2646 // Use internal versions of these intrinsics.
2647
2648 if (IntrinsicID == Intrinsic::nearbyint || IntrinsicID == Intrinsic::rint ||
2649 IntrinsicID == Intrinsic::roundeven) {
2650 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2651 return ConstantFP::get(Ty, U);
2652 }
2653
2654 if (IntrinsicID == Intrinsic::round) {
2655 U.roundToIntegral(APFloat::rmNearestTiesToAway);
2656 return ConstantFP::get(Ty, U);
2657 }
2658
2659 if (IntrinsicID == Intrinsic::roundeven) {
2660 U.roundToIntegral(APFloat::rmNearestTiesToEven);
2661 return ConstantFP::get(Ty, U);
2662 }
2663
2664 if (IntrinsicID == Intrinsic::ceil) {
2665 U.roundToIntegral(APFloat::rmTowardPositive);
2666 return ConstantFP::get(Ty, U);
2667 }
2668
2669 if (IntrinsicID == Intrinsic::floor) {
2670 U.roundToIntegral(APFloat::rmTowardNegative);
2671 return ConstantFP::get(Ty, U);
2672 }
2673
2674 if (IntrinsicID == Intrinsic::trunc) {
2675 U.roundToIntegral(APFloat::rmTowardZero);
2676 return ConstantFP::get(Ty, U);
2677 }
2678
2679 if (IntrinsicID == Intrinsic::fabs) {
2680 U.clearSign();
2681 return ConstantFP::get(Ty, U);
2682 }
2683
2684 if (IntrinsicID == Intrinsic::amdgcn_fract) {
2685 // The v_fract instruction behaves like the OpenCL spec, which defines
2686 // fract(x) as fmin(x - floor(x), 0x1.fffffep-1f): "The min() operator is
2687 // there to prevent fract(-small) from returning 1.0. It returns the
2688 // largest positive floating-point number less than 1.0."
2689 APFloat FloorU(U);
2690 FloorU.roundToIntegral(APFloat::rmTowardNegative);
2691 APFloat FractU(U - FloorU);
2692 APFloat AlmostOne(U.getSemantics(), 1);
2693 AlmostOne.next(/*nextDown*/ true);
2694 return ConstantFP::get(Ty, minimum(FractU, AlmostOne));
2695 }
2696
2697 // Rounding operations (floor, trunc, ceil, round and nearbyint) do not
2698 // raise FP exceptions, unless the argument is signaling NaN.
2699
2700 std::optional<APFloat::roundingMode> RM;
2701 switch (IntrinsicID) {
2702 default:
2703 break;
2704 case Intrinsic::experimental_constrained_nearbyint:
2705 case Intrinsic::experimental_constrained_rint: {
2707 RM = CI->getRoundingMode();
2708 if (!RM || *RM == RoundingMode::Dynamic)
2709 return nullptr;
2710 break;
2711 }
2712 case Intrinsic::experimental_constrained_round:
2714 break;
2715 case Intrinsic::experimental_constrained_ceil:
2717 break;
2718 case Intrinsic::experimental_constrained_floor:
2720 break;
2721 case Intrinsic::experimental_constrained_trunc:
2723 break;
2724 }
2725 if (RM) {
2727 if (U.isFinite()) {
2728 APFloat::opStatus St = U.roundToIntegral(*RM);
2729 if (IntrinsicID == Intrinsic::experimental_constrained_rint &&
2730 St == APFloat::opInexact) {
2731 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2732 if (EB == fp::ebStrict)
2733 return nullptr;
2734 }
2735 } else if (U.isSignaling()) {
2736 std::optional<fp::ExceptionBehavior> EB = CI->getExceptionBehavior();
2737 if (EB && *EB != fp::ebIgnore)
2738 return nullptr;
2739 U = APFloat::getQNaN(U.getSemantics());
2740 }
2741 return ConstantFP::get(Ty, U);
2742 }
2743
2744 // NVVM float/double to signed/unsigned int32/int64 conversions:
2745 switch (IntrinsicID) {
2746 // f2i
2747 case Intrinsic::nvvm_f2i_rm:
2748 case Intrinsic::nvvm_f2i_rn:
2749 case Intrinsic::nvvm_f2i_rp:
2750 case Intrinsic::nvvm_f2i_rz:
2751 case Intrinsic::nvvm_f2i_rm_ftz:
2752 case Intrinsic::nvvm_f2i_rn_ftz:
2753 case Intrinsic::nvvm_f2i_rp_ftz:
2754 case Intrinsic::nvvm_f2i_rz_ftz:
2755 // f2ui
2756 case Intrinsic::nvvm_f2ui_rm:
2757 case Intrinsic::nvvm_f2ui_rn:
2758 case Intrinsic::nvvm_f2ui_rp:
2759 case Intrinsic::nvvm_f2ui_rz:
2760 case Intrinsic::nvvm_f2ui_rm_ftz:
2761 case Intrinsic::nvvm_f2ui_rn_ftz:
2762 case Intrinsic::nvvm_f2ui_rp_ftz:
2763 case Intrinsic::nvvm_f2ui_rz_ftz:
2764 // d2i
2765 case Intrinsic::nvvm_d2i_rm:
2766 case Intrinsic::nvvm_d2i_rn:
2767 case Intrinsic::nvvm_d2i_rp:
2768 case Intrinsic::nvvm_d2i_rz:
2769 // d2ui
2770 case Intrinsic::nvvm_d2ui_rm:
2771 case Intrinsic::nvvm_d2ui_rn:
2772 case Intrinsic::nvvm_d2ui_rp:
2773 case Intrinsic::nvvm_d2ui_rz:
2774 // f2ll
2775 case Intrinsic::nvvm_f2ll_rm:
2776 case Intrinsic::nvvm_f2ll_rn:
2777 case Intrinsic::nvvm_f2ll_rp:
2778 case Intrinsic::nvvm_f2ll_rz:
2779 case Intrinsic::nvvm_f2ll_rm_ftz:
2780 case Intrinsic::nvvm_f2ll_rn_ftz:
2781 case Intrinsic::nvvm_f2ll_rp_ftz:
2782 case Intrinsic::nvvm_f2ll_rz_ftz:
2783 // f2ull
2784 case Intrinsic::nvvm_f2ull_rm:
2785 case Intrinsic::nvvm_f2ull_rn:
2786 case Intrinsic::nvvm_f2ull_rp:
2787 case Intrinsic::nvvm_f2ull_rz:
2788 case Intrinsic::nvvm_f2ull_rm_ftz:
2789 case Intrinsic::nvvm_f2ull_rn_ftz:
2790 case Intrinsic::nvvm_f2ull_rp_ftz:
2791 case Intrinsic::nvvm_f2ull_rz_ftz:
2792 // d2ll
2793 case Intrinsic::nvvm_d2ll_rm:
2794 case Intrinsic::nvvm_d2ll_rn:
2795 case Intrinsic::nvvm_d2ll_rp:
2796 case Intrinsic::nvvm_d2ll_rz:
2797 // d2ull
2798 case Intrinsic::nvvm_d2ull_rm:
2799 case Intrinsic::nvvm_d2ull_rn:
2800 case Intrinsic::nvvm_d2ull_rp:
2801 case Intrinsic::nvvm_d2ull_rz: {
2802 // In float-to-integer conversion, NaN inputs are converted to 0.
2803 if (U.isNaN()) {
2804 // In float-to-integer conversion, NaN inputs are converted to 0
2805 // when the source and destination bitwidths are both less than 64.
2806 if (nvvm::FPToIntegerIntrinsicNaNZero(IntrinsicID))
2807 return ConstantInt::get(Ty, 0);
2808
2809 // Otherwise, the most significant bit is set.
2810 unsigned BitWidth = Ty->getIntegerBitWidth();
2811 uint64_t Val = 1ULL << (BitWidth - 1);
2812 return ConstantInt::get(Ty, APInt(BitWidth, Val, /*IsSigned=*/false));
2813 }
2814
2815 APFloat::roundingMode RMode =
2817 bool IsFTZ = nvvm::FPToIntegerIntrinsicShouldFTZ(IntrinsicID);
2818 bool IsSigned = nvvm::FPToIntegerIntrinsicResultIsSigned(IntrinsicID);
2819
2820 APSInt ResInt(Ty->getIntegerBitWidth(), !IsSigned);
2821 auto FloatToRound = IsFTZ ? FTZPreserveSign(U) : U;
2822
2823 // Return max/min value for integers if the result is +/-inf or
2824 // is too large to fit in the result's integer bitwidth.
2825 bool IsExact = false;
2826 FloatToRound.convertToInteger(ResInt, RMode, &IsExact);
2827 return ConstantInt::get(Ty, ResInt);
2828 }
2829 }
2830
2831 /// We only fold functions with finite arguments. Folding NaN and inf is
2832 /// likely to be aborted with an exception anyway, and some host libms
2833 /// have known errors raising exceptions.
2834 if (!U.isFinite())
2835 return nullptr;
2836
2837 /// Currently APFloat versions of these functions do not exist, so we use
2838 /// the host native double versions. Float versions are not called
2839 /// directly but for all these it is true (float)(f((double)arg)) ==
2840 /// f(arg). Long double not supported yet.
2841 const APFloat &APF = Op->getValueAPF();
2842
2843 switch (IntrinsicID) {
2844 default: break;
2845 case Intrinsic::log:
2846 if (U.isZero())
2847 return ConstantFP::getInfinity(Ty, true);
2848 if (U.isNegative())
2849 return ConstantFP::getNaN(Ty);
2850 if (U.isExactlyValue(1.0))
2851 return ConstantFP::getZero(Ty);
2852 return ConstantFoldFP(log, APF, Ty);
2853 case Intrinsic::log2:
2854 if (U.isZero())
2855 return ConstantFP::getInfinity(Ty, true);
2856 if (U.isNegative())
2857 return ConstantFP::getNaN(Ty);
2858 if (U.isExactlyValue(1.0))
2859 return ConstantFP::getZero(Ty);
2860 // TODO: What about hosts that lack a C99 library?
2861 return ConstantFoldFP(log2, APF, Ty);
2862 case Intrinsic::log10:
2863 if (U.isZero())
2864 return ConstantFP::getInfinity(Ty, true);
2865 if (U.isNegative())
2866 return ConstantFP::getNaN(Ty);
2867 if (U.isExactlyValue(1.0))
2868 return ConstantFP::getZero(Ty);
2869 // TODO: What about hosts that lack a C99 library?
2870 return ConstantFoldFP(log10, APF, Ty);
2871 case Intrinsic::exp:
2872 return ConstantFoldFP(exp, APF, Ty);
2873 case Intrinsic::exp2:
2874 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
2875 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
2876 case Intrinsic::exp10:
2877 // Fold exp10(x) as pow(10, x), in case the host lacks a C99 library.
2878 return ConstantFoldBinaryFP(pow, APFloat(10.0), APF, Ty);
2879 case Intrinsic::sin:
2880 return ConstantFoldFP(sin, APF, Ty);
2881 case Intrinsic::cos:
2882 return ConstantFoldFP(cos, APF, Ty);
2883 case Intrinsic::sinh:
2884 return ConstantFoldFP(sinh, APF, Ty);
2885 case Intrinsic::cosh:
2886 return ConstantFoldFP(cosh, APF, Ty);
2887 case Intrinsic::atan:
2888 // Implement optional behavior from C's Annex F for +/-0.0.
2889 if (U.isZero())
2890 return ConstantFP::get(Ty, U);
2891 return ConstantFoldFP(atan, APF, Ty);
2892 case Intrinsic::sqrt:
2893 return ConstantFoldFP(sqrt, APF, Ty);
2894
2895 // NVVM Intrinsics:
2896 case Intrinsic::nvvm_ceil_ftz_f:
2897 case Intrinsic::nvvm_ceil_f:
2898 case Intrinsic::nvvm_ceil_d:
2899 return ConstantFoldFP(
2900 ceil, APF, Ty,
2902 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2903
2904 case Intrinsic::nvvm_fabs_ftz:
2905 case Intrinsic::nvvm_fabs:
2906 return ConstantFoldFP(
2907 fabs, APF, Ty,
2909 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2910
2911 case Intrinsic::nvvm_floor_ftz_f:
2912 case Intrinsic::nvvm_floor_f:
2913 case Intrinsic::nvvm_floor_d:
2914 return ConstantFoldFP(
2915 floor, APF, Ty,
2917 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2918
2919 case Intrinsic::nvvm_rcp_rm_ftz_f:
2920 case Intrinsic::nvvm_rcp_rn_ftz_f:
2921 case Intrinsic::nvvm_rcp_rp_ftz_f:
2922 case Intrinsic::nvvm_rcp_rz_ftz_f:
2923 case Intrinsic::nvvm_rcp_rm_d:
2924 case Intrinsic::nvvm_rcp_rm_f:
2925 case Intrinsic::nvvm_rcp_rn_d:
2926 case Intrinsic::nvvm_rcp_rn_f:
2927 case Intrinsic::nvvm_rcp_rp_d:
2928 case Intrinsic::nvvm_rcp_rp_f:
2929 case Intrinsic::nvvm_rcp_rz_d:
2930 case Intrinsic::nvvm_rcp_rz_f: {
2931 APFloat::roundingMode RoundMode = nvvm::GetRCPRoundingMode(IntrinsicID);
2932 bool IsFTZ = nvvm::RCPShouldFTZ(IntrinsicID);
2933
2934 auto Denominator = IsFTZ ? FTZPreserveSign(APF) : APF;
2936 APFloat::opStatus Status = Res.divide(Denominator, RoundMode);
2937
2939 if (IsFTZ)
2940 Res = FTZPreserveSign(Res);
2941 return ConstantFP::get(Ty, Res);
2942 }
2943 return nullptr;
2944 }
2945
2946 case Intrinsic::nvvm_round_ftz_f:
2947 case Intrinsic::nvvm_round_f:
2948 case Intrinsic::nvvm_round_d: {
2949 // nvvm_round is lowered to PTX cvt.rni, which will round to nearest
2950 // integer, choosing even integer if source is equidistant between two
2951 // integers, so the semantics are closer to "rint" rather than "round".
2952 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2953 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2955 return ConstantFP::get(Ty, V);
2956 }
2957
2958 case Intrinsic::nvvm_saturate_ftz_f:
2959 case Intrinsic::nvvm_saturate_d:
2960 case Intrinsic::nvvm_saturate_f: {
2961 bool IsFTZ = nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID);
2962 auto V = IsFTZ ? FTZPreserveSign(APF) : APF;
2963 if (V.isNegative() || V.isZero() || V.isNaN())
2964 return ConstantFP::getZero(Ty);
2966 if (V > One)
2967 return ConstantFP::get(Ty, One);
2968 return ConstantFP::get(Ty, APF);
2969 }
2970
2971 case Intrinsic::nvvm_sqrt_rn_ftz_f:
2972 case Intrinsic::nvvm_sqrt_f:
2973 case Intrinsic::nvvm_sqrt_rn_d:
2974 case Intrinsic::nvvm_sqrt_rn_f:
2975 if (APF.isNegative())
2976 return nullptr;
2977 return ConstantFoldFP(
2978 sqrt, APF, Ty,
2980 nvvm::UnaryMathIntrinsicShouldFTZ(IntrinsicID)));
2981
2982 // AMDGCN Intrinsics:
2983 case Intrinsic::amdgcn_cos:
2984 case Intrinsic::amdgcn_sin: {
2985 double V = getValueAsDouble(Op);
2986 if (V < -256.0 || V > 256.0)
2987 // The gfx8 and gfx9 architectures handle arguments outside the range
2988 // [-256, 256] differently. This should be a rare case so bail out
2989 // rather than trying to handle the difference.
2990 return nullptr;
2991 bool IsCos = IntrinsicID == Intrinsic::amdgcn_cos;
2992 double V4 = V * 4.0;
2993 if (V4 == floor(V4)) {
2994 // Force exact results for quarter-integer inputs.
2995 const double SinVals[4] = { 0.0, 1.0, 0.0, -1.0 };
2996 V = SinVals[((int)V4 + (IsCos ? 1 : 0)) & 3];
2997 } else {
2998 if (IsCos)
2999 V = cos(V * 2.0 * numbers::pi);
3000 else
3001 V = sin(V * 2.0 * numbers::pi);
3002 }
3003 return GetConstantFoldFPValue(V, Ty);
3004 }
3005 }
3006
3007 if (!TLI)
3008 return nullptr;
3009
3010 LibFunc Func = NotLibFunc;
3011 if (!TLI->getLibFunc(Name, Func))
3012 return nullptr;
3013
3014 switch (Func) {
3015 default:
3016 break;
3017 case LibFunc_acos:
3018 case LibFunc_acosf:
3019 case LibFunc_acos_finite:
3020 case LibFunc_acosf_finite:
3021 if (TLI->has(Func))
3022 return ConstantFoldFP(acos, APF, Ty);
3023 break;
3024 case LibFunc_asin:
3025 case LibFunc_asinf:
3026 case LibFunc_asin_finite:
3027 case LibFunc_asinf_finite:
3028 if (TLI->has(Func))
3029 return ConstantFoldFP(asin, APF, Ty);
3030 break;
3031 case LibFunc_atan:
3032 case LibFunc_atanf:
3033 // Implement optional behavior from C's Annex F for +/-0.0.
3034 if (U.isZero())
3035 return ConstantFP::get(Ty, U);
3036 if (TLI->has(Func))
3037 return ConstantFoldFP(atan, APF, Ty);
3038 break;
3039 case LibFunc_ceil:
3040 case LibFunc_ceilf:
3041 if (TLI->has(Func)) {
3042 U.roundToIntegral(APFloat::rmTowardPositive);
3043 return ConstantFP::get(Ty, U);
3044 }
3045 break;
3046 case LibFunc_cos:
3047 case LibFunc_cosf:
3048 if (TLI->has(Func))
3049 return ConstantFoldFP(cos, APF, Ty);
3050 break;
3051 case LibFunc_cosh:
3052 case LibFunc_coshf:
3053 case LibFunc_cosh_finite:
3054 case LibFunc_coshf_finite:
3055 if (TLI->has(Func))
3056 return ConstantFoldFP(cosh, APF, Ty);
3057 break;
3058 case LibFunc_exp:
3059 case LibFunc_expf:
3060 case LibFunc_exp_finite:
3061 case LibFunc_expf_finite:
3062 if (TLI->has(Func))
3063 return ConstantFoldFP(exp, APF, Ty);
3064 break;
3065 case LibFunc_exp2:
3066 case LibFunc_exp2f:
3067 case LibFunc_exp2_finite:
3068 case LibFunc_exp2f_finite:
3069 if (TLI->has(Func))
3070 // Fold exp2(x) as pow(2, x), in case the host lacks a C99 library.
3071 return ConstantFoldBinaryFP(pow, APFloat(2.0), APF, Ty);
3072 break;
3073 case LibFunc_fabs:
3074 case LibFunc_fabsf:
3075 if (TLI->has(Func)) {
3076 U.clearSign();
3077 return ConstantFP::get(Ty, U);
3078 }
3079 break;
3080 case LibFunc_floor:
3081 case LibFunc_floorf:
3082 if (TLI->has(Func)) {
3083 U.roundToIntegral(APFloat::rmTowardNegative);
3084 return ConstantFP::get(Ty, U);
3085 }
3086 break;
3087 case LibFunc_log:
3088 case LibFunc_logf:
3089 case LibFunc_log_finite:
3090 case LibFunc_logf_finite:
3091 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3092 return ConstantFoldFP(log, APF, Ty);
3093 break;
3094 case LibFunc_log2:
3095 case LibFunc_log2f:
3096 case LibFunc_log2_finite:
3097 case LibFunc_log2f_finite:
3098 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3099 // TODO: What about hosts that lack a C99 library?
3100 return ConstantFoldFP(log2, APF, Ty);
3101 break;
3102 case LibFunc_log10:
3103 case LibFunc_log10f:
3104 case LibFunc_log10_finite:
3105 case LibFunc_log10f_finite:
3106 if (!APF.isNegative() && !APF.isZero() && TLI->has(Func))
3107 // TODO: What about hosts that lack a C99 library?
3108 return ConstantFoldFP(log10, APF, Ty);
3109 break;
3110 case LibFunc_ilogb:
3111 case LibFunc_ilogbf:
3112 if (!APF.isZero() && TLI->has(Func))
3113 return ConstantInt::get(Ty, ilogb(APF), true);
3114 break;
3115 case LibFunc_logb:
3116 case LibFunc_logbf:
3117 if (!APF.isZero() && TLI->has(Func))
3118 return ConstantFoldFP(logb, APF, Ty);
3119 break;
3120 case LibFunc_log1p:
3121 case LibFunc_log1pf:
3122 // Implement optional behavior from C's Annex F for +/-0.0.
3123 if (U.isZero())
3124 return ConstantFP::get(Ty, U);
3125 if (APF > APFloat::getOne(APF.getSemantics(), true) && TLI->has(Func))
3126 return ConstantFoldFP(log1p, APF, Ty);
3127 break;
3128 case LibFunc_logl:
3129 return nullptr;
3130 case LibFunc_erf:
3131 case LibFunc_erff:
3132 if (TLI->has(Func))
3133 return ConstantFoldFP(erf, APF, Ty);
3134 break;
3135 case LibFunc_nearbyint:
3136 case LibFunc_nearbyintf:
3137 case LibFunc_rint:
3138 case LibFunc_rintf:
3139 case LibFunc_roundeven:
3140 case LibFunc_roundevenf:
3141 if (TLI->has(Func)) {
3142 U.roundToIntegral(APFloat::rmNearestTiesToEven);
3143 return ConstantFP::get(Ty, U);
3144 }
3145 break;
3146 case LibFunc_round:
3147 case LibFunc_roundf:
3148 if (TLI->has(Func)) {
3149 U.roundToIntegral(APFloat::rmNearestTiesToAway);
3150 return ConstantFP::get(Ty, U);
3151 }
3152 break;
3153 case LibFunc_sin:
3154 case LibFunc_sinf:
3155 if (TLI->has(Func))
3156 return ConstantFoldFP(sin, APF, Ty);
3157 break;
3158 case LibFunc_sinh:
3159 case LibFunc_sinhf:
3160 case LibFunc_sinh_finite:
3161 case LibFunc_sinhf_finite:
3162 if (TLI->has(Func))
3163 return ConstantFoldFP(sinh, APF, Ty);
3164 break;
3165 case LibFunc_sqrt:
3166 case LibFunc_sqrtf:
3167 if (!APF.isNegative() && TLI->has(Func))
3168 return ConstantFoldFP(sqrt, APF, Ty);
3169 break;
3170 case LibFunc_tan:
3171 case LibFunc_tanf:
3172 if (TLI->has(Func))
3173 return ConstantFoldFP(tan, APF, Ty);
3174 break;
3175 case LibFunc_tanh:
3176 case LibFunc_tanhf:
3177 if (TLI->has(Func))
3178 return ConstantFoldFP(tanh, APF, Ty);
3179 break;
3180 case LibFunc_trunc:
3181 case LibFunc_truncf:
3182 if (TLI->has(Func)) {
3183 U.roundToIntegral(APFloat::rmTowardZero);
3184 return ConstantFP::get(Ty, U);
3185 }
3186 break;
3187 }
3188 return nullptr;
3189 }
3190
3191 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
3192 switch (IntrinsicID) {
3193 case Intrinsic::bswap:
3194 return ConstantInt::get(Ty->getContext(), Op->getValue().byteSwap());
3195 case Intrinsic::ctpop:
3196 return ConstantInt::get(Ty, Op->getValue().popcount());
3197 case Intrinsic::bitreverse:
3198 return ConstantInt::get(Ty->getContext(), Op->getValue().reverseBits());
3199 case Intrinsic::amdgcn_s_wqm: {
3200 uint64_t Val = Op->getZExtValue();
3201 Val |= (Val & 0x5555555555555555ULL) << 1 |
3202 ((Val >> 1) & 0x5555555555555555ULL);
3203 Val |= (Val & 0x3333333333333333ULL) << 2 |
3204 ((Val >> 2) & 0x3333333333333333ULL);
3205 return ConstantInt::get(Ty, Val);
3206 }
3207
3208 case Intrinsic::amdgcn_s_quadmask: {
3209 uint64_t Val = Op->getZExtValue();
3210 uint64_t QuadMask = 0;
3211 for (unsigned I = 0; I < Op->getBitWidth() / 4; ++I, Val >>= 4) {
3212 if (!(Val & 0xF))
3213 continue;
3214
3215 QuadMask |= (1ULL << I);
3216 }
3217 return ConstantInt::get(Ty, QuadMask);
3218 }
3219
3220 case Intrinsic::amdgcn_s_bitreplicate: {
3221 uint64_t Val = Op->getZExtValue();
3222 Val = (Val & 0x000000000000FFFFULL) | (Val & 0x00000000FFFF0000ULL) << 16;
3223 Val = (Val & 0x000000FF000000FFULL) | (Val & 0x0000FF000000FF00ULL) << 8;
3224 Val = (Val & 0x000F000F000F000FULL) | (Val & 0x00F000F000F000F0ULL) << 4;
3225 Val = (Val & 0x0303030303030303ULL) | (Val & 0x0C0C0C0C0C0C0C0CULL) << 2;
3226 Val = (Val & 0x1111111111111111ULL) | (Val & 0x2222222222222222ULL) << 1;
3227 Val = Val | Val << 1;
3228 return ConstantInt::get(Ty, Val);
3229 }
3230 }
3231 }
3232
3233 if (Operands[0]->getType()->isVectorTy()) {
3234 auto *Op = cast<Constant>(Operands[0]);
3235 switch (IntrinsicID) {
3236 default: break;
3237 case Intrinsic::vector_reduce_add:
3238 case Intrinsic::vector_reduce_mul:
3239 case Intrinsic::vector_reduce_and:
3240 case Intrinsic::vector_reduce_or:
3241 case Intrinsic::vector_reduce_xor:
3242 case Intrinsic::vector_reduce_smin:
3243 case Intrinsic::vector_reduce_smax:
3244 case Intrinsic::vector_reduce_umin:
3245 case Intrinsic::vector_reduce_umax:
3246 if (Constant *C = constantFoldVectorReduce(IntrinsicID, Operands[0]))
3247 return C;
3248 break;
3249 case Intrinsic::x86_sse_cvtss2si:
3250 case Intrinsic::x86_sse_cvtss2si64:
3251 case Intrinsic::x86_sse2_cvtsd2si:
3252 case Intrinsic::x86_sse2_cvtsd2si64:
3253 if (ConstantFP *FPOp =
3254 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3255 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3256 /*roundTowardZero=*/false, Ty,
3257 /*IsSigned*/true);
3258 break;
3259 case Intrinsic::x86_sse_cvttss2si:
3260 case Intrinsic::x86_sse_cvttss2si64:
3261 case Intrinsic::x86_sse2_cvttsd2si:
3262 case Intrinsic::x86_sse2_cvttsd2si64:
3263 if (ConstantFP *FPOp =
3264 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3265 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3266 /*roundTowardZero=*/true, Ty,
3267 /*IsSigned*/true);
3268 break;
3269
3270 case Intrinsic::wasm_anytrue:
3271 return Op->isNullValue() ? ConstantInt::get(Ty, 0)
3272 : ConstantInt::get(Ty, 1);
3273
3274 case Intrinsic::wasm_alltrue:
3275 // Check each element individually
3276 unsigned E = cast<FixedVectorType>(Op->getType())->getNumElements();
3277 for (unsigned I = 0; I != E; ++I) {
3278 Constant *Elt = Op->getAggregateElement(I);
3279 // Return false as soon as we find a non-true element.
3280 if (Elt && Elt->isNullValue())
3281 return ConstantInt::get(Ty, 0);
3282 // Bail as soon as we find an element we cannot prove to be true.
3283 if (!Elt || !isa<ConstantInt>(Elt))
3284 return nullptr;
3285 }
3286
3287 return ConstantInt::get(Ty, 1);
3288 }
3289 }
3290
3291 return nullptr;
3292}
3293
3294static Constant *evaluateCompare(const APFloat &Op1, const APFloat &Op2,
3298 FCmpInst::Predicate Cond = FCmp->getPredicate();
3299 if (FCmp->isSignaling()) {
3300 if (Op1.isNaN() || Op2.isNaN())
3302 } else {
3303 if (Op1.isSignaling() || Op2.isSignaling())
3305 }
3306 bool Result = FCmpInst::compare(Op1, Op2, Cond);
3307 if (mayFoldConstrained(const_cast<ConstrainedFPCmpIntrinsic *>(FCmp), St))
3308 return ConstantInt::get(Call->getType()->getScalarType(), Result);
3309 return nullptr;
3310}
3311
3312static Constant *ConstantFoldNextToward(const APFloat &Op0, const APFloat &Op1,
3313 const Type *RetTy) {
3314 assert(RetTy != nullptr);
3315 bool LosesInfo;
3316
3317 if (Op1.isSignaling())
3318 return nullptr;
3319 if (Op1.isNaN()) {
3320 APFloat Ret(Op1);
3321 Ret.convert(RetTy->getFltSemantics(), detail::rmNearestTiesToEven,
3322 &LosesInfo);
3323 return ConstantFP::get(RetTy->getContext(), Ret);
3324 }
3325
3326 // Recall that the second argument of nexttoward is always a long double,
3327 // so we may need to promote the first argument for comparisons to be valid.
3328 APFloat PromotedOp0(Op0);
3329 PromotedOp0.convert(Op1.getSemantics(), detail::rmNearestTiesToEven,
3330 &LosesInfo);
3331 assert(!LosesInfo && "Unexpected lossy promotion");
3332 const APFloat::cmpResult Result = PromotedOp0.compare(Op1);
3333
3334 // When equal, the standard says we must return the second argument.
3335 // This allows nice behavior such as nexttoward(0.0, -0.0) = -0.0 and
3336 // nexttoward(-0.0, 0.0) = 0.0
3337 if (Result == detail::cmpEqual) {
3338 APFloat Ret(Op1);
3339 Ret.convert(RetTy->getFltSemantics(), detail::rmNearestTiesToEven,
3340 &LosesInfo);
3341 return ConstantFP::get(RetTy->getContext(), Ret);
3342 }
3343
3344 APFloat Next(Op0);
3345 Next.next(/*nextDown=*/Result == APFloat::cmpGreaterThan);
3346 if (Next.isZero() || Next.isDenormal() || Next.isSignaling())
3347 return nullptr;
3348 return ConstantFP::get(RetTy->getContext(), Next);
3349}
3350
3351static Constant *ConstantFoldLibCall2(StringRef Name, Type *Ty,
3352 ArrayRef<Constant *> Operands,
3353 const TargetLibraryInfo *TLI) {
3354 if (!TLI)
3355 return nullptr;
3356
3357 LibFunc Func = NotLibFunc;
3358 if (!TLI->getLibFunc(Name, Func))
3359 return nullptr;
3360
3361 const auto *Op1 = dyn_cast<ConstantFP>(Operands[0]);
3362 if (!Op1)
3363 return nullptr;
3364
3365 const auto *Op2 = dyn_cast<ConstantFP>(Operands[1]);
3366 if (!Op2)
3367 return nullptr;
3368
3369 const APFloat &Op1V = Op1->getValueAPF();
3370 const APFloat &Op2V = Op2->getValueAPF();
3371
3372 switch (Func) {
3373 default:
3374 break;
3375 case LibFunc_pow:
3376 case LibFunc_powf:
3377 case LibFunc_pow_finite:
3378 case LibFunc_powf_finite:
3379 if (TLI->has(Func))
3380 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3381 break;
3382 case LibFunc_fmod:
3383 case LibFunc_fmodf:
3384 if (TLI->has(Func)) {
3385 APFloat V = Op1->getValueAPF();
3386 if (APFloat::opStatus::opOK == V.mod(Op2->getValueAPF()))
3387 return ConstantFP::get(Ty, V);
3388 }
3389 break;
3390 case LibFunc_remainder:
3391 case LibFunc_remainderf:
3392 if (TLI->has(Func)) {
3393 APFloat V = Op1->getValueAPF();
3394 if (APFloat::opStatus::opOK == V.remainder(Op2->getValueAPF()))
3395 return ConstantFP::get(Ty, V);
3396 }
3397 break;
3398 case LibFunc_atan2:
3399 case LibFunc_atan2f:
3400 // atan2(+/-0.0, +/-0.0) is known to raise an exception on some libm
3401 // (Solaris), so we do not assume a known result for that.
3402 if (Op1V.isZero() && Op2V.isZero())
3403 return nullptr;
3404 [[fallthrough]];
3405 case LibFunc_atan2_finite:
3406 case LibFunc_atan2f_finite:
3407 if (TLI->has(Func))
3408 return ConstantFoldBinaryFP(atan2, Op1V, Op2V, Ty);
3409 break;
3410 case LibFunc_nextafter:
3411 case LibFunc_nextafterf:
3412 case LibFunc_nexttoward:
3413 case LibFunc_nexttowardf:
3414 if (TLI->has(Func))
3415 return ConstantFoldNextToward(Op1V, Op2V, Ty);
3416 break;
3417 }
3418
3419 return nullptr;
3420}
3421
3422static Constant *ConstantFoldIntrinsicCall2(Intrinsic::ID IntrinsicID, Type *Ty,
3423 ArrayRef<Constant *> Operands,
3424 const CallBase *Call) {
3425 assert(Operands.size() == 2 && "Wrong number of operands.");
3426
3427 if (Ty->isFloatingPointTy()) {
3428 // TODO: We should have undef handling for all of the FP intrinsics that
3429 // are attempted to be folded in this function.
3430 bool IsOp0Undef = isa<UndefValue>(Operands[0]);
3431 bool IsOp1Undef = isa<UndefValue>(Operands[1]);
3432 switch (IntrinsicID) {
3433 case Intrinsic::maxnum:
3434 case Intrinsic::minnum:
3435 case Intrinsic::maximum:
3436 case Intrinsic::minimum:
3437 case Intrinsic::maximumnum:
3438 case Intrinsic::minimumnum:
3439 case Intrinsic::nvvm_fmax_d:
3440 case Intrinsic::nvvm_fmin_d:
3441 // If one argument is undef, return the other argument.
3442 if (IsOp0Undef)
3443 return Operands[1];
3444 if (IsOp1Undef)
3445 return Operands[0];
3446 break;
3447
3448 case Intrinsic::nvvm_fmax_f:
3449 case Intrinsic::nvvm_fmax_ftz_f:
3450 case Intrinsic::nvvm_fmax_ftz_nan_f:
3451 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3452 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3453 case Intrinsic::nvvm_fmax_nan_f:
3454 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3455 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3456
3457 case Intrinsic::nvvm_fmin_f:
3458 case Intrinsic::nvvm_fmin_ftz_f:
3459 case Intrinsic::nvvm_fmin_ftz_nan_f:
3460 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3461 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3462 case Intrinsic::nvvm_fmin_nan_f:
3463 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3464 case Intrinsic::nvvm_fmin_xorsign_abs_f:
3465 // If one arg is undef, the other arg can be returned only if it is
3466 // constant, as we may need to flush it to sign-preserving zero or
3467 // canonicalize the NaN.
3468 if (!IsOp0Undef && !IsOp1Undef)
3469 break;
3470 if (auto *Op = dyn_cast<ConstantFP>(Operands[IsOp0Undef ? 1 : 0])) {
3471 if (Op->isNaN()) {
3472 APInt NVCanonicalNaN(32, 0x7fffffff);
3473 return ConstantFP::get(
3474 Ty, APFloat(Ty->getFltSemantics(), NVCanonicalNaN));
3475 }
3476 if (nvvm::FMinFMaxShouldFTZ(IntrinsicID))
3477 return ConstantFP::get(Ty, FTZPreserveSign(Op->getValueAPF()));
3478 else
3479 return Op;
3480 }
3481 break;
3482 }
3483 }
3484
3485 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
3486 const APFloat &Op1V = Op1->getValueAPF();
3487
3488 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
3489 if (Op2->getType() != Op1->getType())
3490 return nullptr;
3491 const APFloat &Op2V = Op2->getValueAPF();
3492
3493 if (const auto *ConstrIntr =
3495 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
3496 APFloat Res = Op1V;
3498 switch (IntrinsicID) {
3499 default:
3500 return nullptr;
3501 case Intrinsic::experimental_constrained_fadd:
3502 St = Res.add(Op2V, RM);
3503 break;
3504 case Intrinsic::experimental_constrained_fsub:
3505 St = Res.subtract(Op2V, RM);
3506 break;
3507 case Intrinsic::experimental_constrained_fmul:
3508 St = Res.multiply(Op2V, RM);
3509 break;
3510 case Intrinsic::experimental_constrained_fdiv:
3511 St = Res.divide(Op2V, RM);
3512 break;
3513 case Intrinsic::experimental_constrained_frem:
3514 St = Res.mod(Op2V);
3515 break;
3516 case Intrinsic::experimental_constrained_fcmp:
3517 case Intrinsic::experimental_constrained_fcmps:
3518 return evaluateCompare(Op1V, Op2V, ConstrIntr);
3519 }
3520 if (mayFoldConstrained(const_cast<ConstrainedFPIntrinsic *>(ConstrIntr),
3521 St))
3522 return ConstantFP::get(Ty, Res);
3523 return nullptr;
3524 }
3525
3526 switch (IntrinsicID) {
3527 default:
3528 break;
3529 case Intrinsic::copysign:
3530 return ConstantFP::get(Ty, APFloat::copySign(Op1V, Op2V));
3531 case Intrinsic::minnum:
3532 return ConstantFP::get(Ty, minnum(Op1V, Op2V));
3533 case Intrinsic::maxnum:
3534 return ConstantFP::get(Ty, maxnum(Op1V, Op2V));
3535 case Intrinsic::minimum:
3536 return ConstantFP::get(Ty, minimum(Op1V, Op2V));
3537 case Intrinsic::maximum:
3538 return ConstantFP::get(Ty, maximum(Op1V, Op2V));
3539 case Intrinsic::minimumnum:
3540 return ConstantFP::get(Ty, minimumnum(Op1V, Op2V));
3541 case Intrinsic::maximumnum:
3542 return ConstantFP::get(Ty, maximumnum(Op1V, Op2V));
3543
3544 case Intrinsic::nvvm_fmax_d:
3545 case Intrinsic::nvvm_fmax_f:
3546 case Intrinsic::nvvm_fmax_ftz_f:
3547 case Intrinsic::nvvm_fmax_ftz_nan_f:
3548 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3549 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3550 case Intrinsic::nvvm_fmax_nan_f:
3551 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3552 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3553
3554 case Intrinsic::nvvm_fmin_d:
3555 case Intrinsic::nvvm_fmin_f:
3556 case Intrinsic::nvvm_fmin_ftz_f:
3557 case Intrinsic::nvvm_fmin_ftz_nan_f:
3558 case Intrinsic::nvvm_fmin_ftz_nan_xorsign_abs_f:
3559 case Intrinsic::nvvm_fmin_ftz_xorsign_abs_f:
3560 case Intrinsic::nvvm_fmin_nan_f:
3561 case Intrinsic::nvvm_fmin_nan_xorsign_abs_f:
3562 case Intrinsic::nvvm_fmin_xorsign_abs_f: {
3563
3564 bool ShouldCanonicalizeNaNs = !(IntrinsicID == Intrinsic::nvvm_fmax_d ||
3565 IntrinsicID == Intrinsic::nvvm_fmin_d);
3566 bool IsFTZ = nvvm::FMinFMaxShouldFTZ(IntrinsicID);
3567 bool IsNaNPropagating = nvvm::FMinFMaxPropagatesNaNs(IntrinsicID);
3568 bool IsXorSignAbs = nvvm::FMinFMaxIsXorSignAbs(IntrinsicID);
3569
3570 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3571 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3572
3573 bool XorSign = false;
3574 if (IsXorSignAbs) {
3575 XorSign = A.isNegative() ^ B.isNegative();
3576 A = abs(A);
3577 B = abs(B);
3578 }
3579
3580 bool IsFMax = false;
3581 switch (IntrinsicID) {
3582 case Intrinsic::nvvm_fmax_d:
3583 case Intrinsic::nvvm_fmax_f:
3584 case Intrinsic::nvvm_fmax_ftz_f:
3585 case Intrinsic::nvvm_fmax_ftz_nan_f:
3586 case Intrinsic::nvvm_fmax_ftz_nan_xorsign_abs_f:
3587 case Intrinsic::nvvm_fmax_ftz_xorsign_abs_f:
3588 case Intrinsic::nvvm_fmax_nan_f:
3589 case Intrinsic::nvvm_fmax_nan_xorsign_abs_f:
3590 case Intrinsic::nvvm_fmax_xorsign_abs_f:
3591 IsFMax = true;
3592 break;
3593 }
3594 APFloat Res =
3595 IsFMax ? (IsNaNPropagating ? maximum(A, B) : maximumnum(A, B))
3596 : (IsNaNPropagating ? minimum(A, B) : minimumnum(A, B));
3597
3598 if (ShouldCanonicalizeNaNs && Res.isNaN()) {
3599 APFloat NVCanonicalNaN(Res.getSemantics(), APInt(32, 0x7fffffff));
3600 return ConstantFP::get(Ty, NVCanonicalNaN);
3601 }
3602
3603 if (IsXorSignAbs && XorSign != Res.isNegative())
3604 Res.changeSign();
3605
3606 return ConstantFP::get(Ty, Res);
3607 }
3608
3609 case Intrinsic::nvvm_add_rm_f:
3610 case Intrinsic::nvvm_add_rn_f:
3611 case Intrinsic::nvvm_add_rp_f:
3612 case Intrinsic::nvvm_add_rz_f:
3613 case Intrinsic::nvvm_add_rm_d:
3614 case Intrinsic::nvvm_add_rn_d:
3615 case Intrinsic::nvvm_add_rp_d:
3616 case Intrinsic::nvvm_add_rz_d:
3617 case Intrinsic::nvvm_add_rm_ftz_f:
3618 case Intrinsic::nvvm_add_rn_ftz_f:
3619 case Intrinsic::nvvm_add_rp_ftz_f:
3620 case Intrinsic::nvvm_add_rz_ftz_f: {
3621
3622 bool IsFTZ = nvvm::FAddShouldFTZ(IntrinsicID);
3623 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3624 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3625
3626 APFloat::roundingMode RoundMode =
3627 nvvm::GetFAddRoundingMode(IntrinsicID);
3628
3629 APFloat Res = A;
3630 APFloat::opStatus Status = Res.add(B, RoundMode);
3631
3632 if (!Res.isNaN() &&
3634 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3635 return ConstantFP::get(Ty, Res);
3636 }
3637 return nullptr;
3638 }
3639
3640 case Intrinsic::nvvm_mul_rm_f:
3641 case Intrinsic::nvvm_mul_rn_f:
3642 case Intrinsic::nvvm_mul_rp_f:
3643 case Intrinsic::nvvm_mul_rz_f:
3644 case Intrinsic::nvvm_mul_rm_d:
3645 case Intrinsic::nvvm_mul_rn_d:
3646 case Intrinsic::nvvm_mul_rp_d:
3647 case Intrinsic::nvvm_mul_rz_d:
3648 case Intrinsic::nvvm_mul_rm_ftz_f:
3649 case Intrinsic::nvvm_mul_rn_ftz_f:
3650 case Intrinsic::nvvm_mul_rp_ftz_f:
3651 case Intrinsic::nvvm_mul_rz_ftz_f: {
3652
3653 bool IsFTZ = nvvm::FMulShouldFTZ(IntrinsicID);
3654 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3655 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3656
3657 APFloat::roundingMode RoundMode =
3658 nvvm::GetFMulRoundingMode(IntrinsicID);
3659
3660 APFloat Res = A;
3661 APFloat::opStatus Status = Res.multiply(B, RoundMode);
3662
3663 if (!Res.isNaN() &&
3665 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3666 return ConstantFP::get(Ty, Res);
3667 }
3668 return nullptr;
3669 }
3670
3671 case Intrinsic::nvvm_div_rm_f:
3672 case Intrinsic::nvvm_div_rn_f:
3673 case Intrinsic::nvvm_div_rp_f:
3674 case Intrinsic::nvvm_div_rz_f:
3675 case Intrinsic::nvvm_div_rm_d:
3676 case Intrinsic::nvvm_div_rn_d:
3677 case Intrinsic::nvvm_div_rp_d:
3678 case Intrinsic::nvvm_div_rz_d:
3679 case Intrinsic::nvvm_div_rm_ftz_f:
3680 case Intrinsic::nvvm_div_rn_ftz_f:
3681 case Intrinsic::nvvm_div_rp_ftz_f:
3682 case Intrinsic::nvvm_div_rz_ftz_f: {
3683 bool IsFTZ = nvvm::FDivShouldFTZ(IntrinsicID);
3684 APFloat A = IsFTZ ? FTZPreserveSign(Op1V) : Op1V;
3685 APFloat B = IsFTZ ? FTZPreserveSign(Op2V) : Op2V;
3686 APFloat::roundingMode RoundMode =
3687 nvvm::GetFDivRoundingMode(IntrinsicID);
3688
3689 APFloat Res = A;
3690 APFloat::opStatus Status = Res.divide(B, RoundMode);
3691 if (!Res.isNaN() &&
3693 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
3694 return ConstantFP::get(Ty, Res);
3695 }
3696 return nullptr;
3697 }
3698 }
3699
3700 if (!Ty->isHalfTy() && !Ty->isFloatTy() && !Ty->isDoubleTy())
3701 return nullptr;
3702
3703 switch (IntrinsicID) {
3704 default:
3705 break;
3706 case Intrinsic::pow:
3707 return ConstantFoldBinaryFP(pow, Op1V, Op2V, Ty);
3708 case Intrinsic::amdgcn_fmul_legacy:
3709 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
3710 // NaN or infinity, gives +0.0.
3711 if (Op1V.isZero() || Op2V.isZero())
3712 return ConstantFP::getZero(Ty);
3713 return ConstantFP::get(Ty, Op1V * Op2V);
3714 }
3715
3716 } else if (auto *Op2C = dyn_cast<ConstantInt>(Operands[1])) {
3717 switch (IntrinsicID) {
3718 case Intrinsic::ldexp: {
3719 // APFloat::scalbn takes the exponent as `int`. Clamp wider integer
3720 // exponents into [INT_MIN, INT_MAX] so values still saturate the
3721 // result to +/-inf or +/-0.
3722 APInt Exp = Op2C->getValue();
3723 Exp = Exp.getBitWidth() < 32 ? Exp.sext(32) : Exp.truncSSat(32);
3724 return ConstantFP::get(
3725 Ty->getContext(),
3726 scalbn(Op1V, Exp.getSExtValue(), APFloat::rmNearestTiesToEven));
3727 }
3728 case Intrinsic::is_fpclass: {
3729 FPClassTest Mask = static_cast<FPClassTest>(Op2C->getZExtValue());
3730 bool Result =
3731 ((Mask & fcSNan) && Op1V.isNaN() && Op1V.isSignaling()) ||
3732 ((Mask & fcQNan) && Op1V.isNaN() && !Op1V.isSignaling()) ||
3733 ((Mask & fcNegInf) && Op1V.isNegInfinity()) ||
3734 ((Mask & fcNegNormal) && Op1V.isNormal() && Op1V.isNegative()) ||
3735 ((Mask & fcNegSubnormal) && Op1V.isDenormal() && Op1V.isNegative()) ||
3736 ((Mask & fcNegZero) && Op1V.isZero() && Op1V.isNegative()) ||
3737 ((Mask & fcPosZero) && Op1V.isZero() && !Op1V.isNegative()) ||
3738 ((Mask & fcPosSubnormal) && Op1V.isDenormal() && !Op1V.isNegative()) ||
3739 ((Mask & fcPosNormal) && Op1V.isNormal() && !Op1V.isNegative()) ||
3740 ((Mask & fcPosInf) && Op1V.isPosInfinity());
3741 return ConstantInt::get(Ty, Result);
3742 }
3743 case Intrinsic::powi: {
3744 int Exp = static_cast<int>(Op2C->getSExtValue());
3745 switch (Ty->getTypeID()) {
3746 case Type::HalfTyID:
3747 case Type::FloatTyID: {
3748 APFloat Res(static_cast<float>(std::pow(Op1V.convertToFloat(), Exp)));
3749 if (Ty->isHalfTy()) {
3750 bool Unused;
3752 &Unused);
3753 }
3754 return ConstantFP::get(Ty, Res);
3755 }
3756 case Type::DoubleTyID:
3757 return ConstantFP::get(Ty, std::pow(Op1V.convertToDouble(), Exp));
3758 default:
3759 return nullptr;
3760 }
3761 }
3762 default:
3763 break;
3764 }
3765 }
3766 return nullptr;
3767 }
3768
3769 if (Operands[0]->getType()->isIntegerTy() &&
3770 Operands[1]->getType()->isIntegerTy()) {
3771 const APInt *C0, *C1;
3772 if (!getConstIntOrUndef(Operands[0], C0) ||
3773 !getConstIntOrUndef(Operands[1], C1))
3774 return nullptr;
3775
3776 switch (IntrinsicID) {
3777 default: break;
3778 case Intrinsic::smax:
3779 case Intrinsic::smin:
3780 case Intrinsic::umax:
3781 case Intrinsic::umin:
3782 if (!C0 && !C1)
3783 return UndefValue::get(Ty);
3784 if (!C0 || !C1)
3785 return MinMaxIntrinsic::getSaturationPoint(IntrinsicID, Ty);
3786 return ConstantInt::get(
3787 Ty, ICmpInst::compare(*C0, *C1,
3788 MinMaxIntrinsic::getPredicate(IntrinsicID))
3789 ? *C0
3790 : *C1);
3791
3792 case Intrinsic::scmp:
3793 case Intrinsic::ucmp:
3794 if (!C0 || !C1)
3795 return ConstantInt::get(Ty, 0);
3796
3797 int Res;
3798 if (IntrinsicID == Intrinsic::scmp)
3799 Res = C0->sgt(*C1) ? 1 : C0->slt(*C1) ? -1 : 0;
3800 else
3801 Res = C0->ugt(*C1) ? 1 : C0->ult(*C1) ? -1 : 0;
3802 return ConstantInt::get(Ty, Res, /*IsSigned=*/true);
3803
3804 case Intrinsic::usub_with_overflow:
3805 case Intrinsic::ssub_with_overflow:
3806 // X - undef -> { 0, false }
3807 // undef - X -> { 0, false }
3808 if (!C0 || !C1)
3809 return Constant::getNullValue(Ty);
3810 [[fallthrough]];
3811 case Intrinsic::uadd_with_overflow:
3812 case Intrinsic::sadd_with_overflow:
3813 // X + undef -> { -1, false }
3814 // undef + x -> { -1, false }
3815 if (!C0 || !C1) {
3816 return ConstantStruct::get(
3817 cast<StructType>(Ty),
3818 {Constant::getAllOnesValue(Ty->getStructElementType(0)),
3819 Constant::getNullValue(Ty->getStructElementType(1))});
3820 }
3821 [[fallthrough]];
3822 case Intrinsic::smul_with_overflow:
3823 case Intrinsic::umul_with_overflow: {
3824 // undef * X -> { 0, false }
3825 // X * undef -> { 0, false }
3826 if (!C0 || !C1)
3827 return Constant::getNullValue(Ty);
3828
3829 APInt Res;
3830 bool Overflow;
3831 switch (IntrinsicID) {
3832 default: llvm_unreachable("Invalid case");
3833 case Intrinsic::sadd_with_overflow:
3834 Res = C0->sadd_ov(*C1, Overflow);
3835 break;
3836 case Intrinsic::uadd_with_overflow:
3837 Res = C0->uadd_ov(*C1, Overflow);
3838 break;
3839 case Intrinsic::ssub_with_overflow:
3840 Res = C0->ssub_ov(*C1, Overflow);
3841 break;
3842 case Intrinsic::usub_with_overflow:
3843 Res = C0->usub_ov(*C1, Overflow);
3844 break;
3845 case Intrinsic::smul_with_overflow:
3846 Res = C0->smul_ov(*C1, Overflow);
3847 break;
3848 case Intrinsic::umul_with_overflow:
3849 Res = C0->umul_ov(*C1, Overflow);
3850 break;
3851 }
3852 Constant *Ops[] = {
3853 ConstantInt::get(Ty->getContext(), Res),
3854 ConstantInt::get(Type::getInt1Ty(Ty->getContext()), Overflow)
3855 };
3857 }
3858 case Intrinsic::uadd_sat:
3859 case Intrinsic::sadd_sat:
3860 if (!C0 && !C1)
3861 return UndefValue::get(Ty);
3862 if (!C0 || !C1)
3863 return Constant::getAllOnesValue(Ty);
3864 if (IntrinsicID == Intrinsic::uadd_sat)
3865 return ConstantInt::get(Ty, C0->uadd_sat(*C1));
3866 else
3867 return ConstantInt::get(Ty, C0->sadd_sat(*C1));
3868 case Intrinsic::usub_sat:
3869 case Intrinsic::ssub_sat:
3870 if (!C0 && !C1)
3871 return UndefValue::get(Ty);
3872 if (!C0 || !C1)
3873 return Constant::getNullValue(Ty);
3874 if (IntrinsicID == Intrinsic::usub_sat)
3875 return ConstantInt::get(Ty, C0->usub_sat(*C1));
3876 else
3877 return ConstantInt::get(Ty, C0->ssub_sat(*C1));
3878 case Intrinsic::cttz:
3879 case Intrinsic::ctlz:
3880 assert(C1 && "Must be constant int");
3881
3882 // cttz(0, 1) and ctlz(0, 1) are poison.
3883 if (C1->isOne() && (!C0 || C0->isZero()))
3884 return PoisonValue::get(Ty);
3885 if (!C0)
3886 return Constant::getNullValue(Ty);
3887 if (IntrinsicID == Intrinsic::cttz)
3888 return ConstantInt::get(Ty, C0->countr_zero());
3889 else
3890 return ConstantInt::get(Ty, C0->countl_zero());
3891
3892 case Intrinsic::abs:
3893 assert(C1 && "Must be constant int");
3894 assert((C1->isOne() || C1->isZero()) && "Must be 0 or 1");
3895
3896 // Undef or minimum val operand with poison min --> poison
3897 if (C1->isOne() && (!C0 || C0->isMinSignedValue()))
3898 return PoisonValue::get(Ty);
3899
3900 // Undef operand with no poison min --> 0 (sign bit must be clear)
3901 if (!C0)
3902 return Constant::getNullValue(Ty);
3903
3904 return ConstantInt::get(Ty, C0->abs());
3905 case Intrinsic::clmul:
3906 if (!C0 || !C1)
3907 return Constant::getNullValue(Ty);
3908 return ConstantInt::get(Ty, APIntOps::clmul(*C0, *C1));
3909 case Intrinsic::pdep:
3910 if (!C0 || !C1)
3911 return Constant::getNullValue(Ty);
3912 return ConstantInt::get(Ty, APIntOps::expandBits(*C0, *C1));
3913 case Intrinsic::pext:
3914 if (!C0 || !C1)
3915 return Constant::getNullValue(Ty);
3916 return ConstantInt::get(Ty, APIntOps::compressBits(*C0, *C1));
3917 case Intrinsic::amdgcn_wave_reduce_umin:
3918 case Intrinsic::amdgcn_wave_reduce_umax:
3919 case Intrinsic::amdgcn_wave_reduce_max:
3920 case Intrinsic::amdgcn_wave_reduce_min:
3921 case Intrinsic::amdgcn_wave_reduce_and:
3922 case Intrinsic::amdgcn_wave_reduce_or:
3923 return Operands[0];
3924 }
3925
3926 return nullptr;
3927 }
3928
3929 // Support ConstantVector in case we have an Undef in the top.
3930 if ((isa<ConstantVector>(Operands[0]) ||
3931 isa<ConstantDataVector>(Operands[0])) &&
3932 // Check for default rounding mode.
3933 // FIXME: Support other rounding modes?
3934 isa<ConstantInt>(Operands[1]) &&
3935 cast<ConstantInt>(Operands[1])->getValue() == 4) {
3936 auto *Op = cast<Constant>(Operands[0]);
3937 switch (IntrinsicID) {
3938 default: break;
3939 case Intrinsic::x86_avx512_vcvtss2si32:
3940 case Intrinsic::x86_avx512_vcvtss2si64:
3941 case Intrinsic::x86_avx512_vcvtsd2si32:
3942 case Intrinsic::x86_avx512_vcvtsd2si64:
3943 if (ConstantFP *FPOp =
3944 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3945 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3946 /*roundTowardZero=*/false, Ty,
3947 /*IsSigned*/true);
3948 break;
3949 case Intrinsic::x86_avx512_vcvtss2usi32:
3950 case Intrinsic::x86_avx512_vcvtss2usi64:
3951 case Intrinsic::x86_avx512_vcvtsd2usi32:
3952 case Intrinsic::x86_avx512_vcvtsd2usi64:
3953 if (ConstantFP *FPOp =
3954 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3955 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3956 /*roundTowardZero=*/false, Ty,
3957 /*IsSigned*/false);
3958 break;
3959 case Intrinsic::x86_avx512_cvttss2si:
3960 case Intrinsic::x86_avx512_cvttss2si64:
3961 case Intrinsic::x86_avx512_cvttsd2si:
3962 case Intrinsic::x86_avx512_cvttsd2si64:
3963 if (ConstantFP *FPOp =
3964 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3965 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3966 /*roundTowardZero=*/true, Ty,
3967 /*IsSigned*/true);
3968 break;
3969 case Intrinsic::x86_avx512_cvttss2usi:
3970 case Intrinsic::x86_avx512_cvttss2usi64:
3971 case Intrinsic::x86_avx512_cvttsd2usi:
3972 case Intrinsic::x86_avx512_cvttsd2usi64:
3973 if (ConstantFP *FPOp =
3974 dyn_cast_or_null<ConstantFP>(Op->getAggregateElement(0U)))
3975 return ConstantFoldSSEConvertToInt(FPOp->getValueAPF(),
3976 /*roundTowardZero=*/true, Ty,
3977 /*IsSigned*/false);
3978 break;
3979 }
3980 }
3981
3982 if (IntrinsicID == Intrinsic::experimental_cttz_elts) {
3983 auto *FVTy = dyn_cast<FixedVectorType>(Operands[0]->getType());
3984 bool ZeroIsPoison = cast<ConstantInt>(Operands[1])->isOne();
3985 if (!FVTy)
3986 return nullptr;
3987 unsigned Width = Ty->getIntegerBitWidth();
3988 if (APInt::getMaxValue(Width).ult(FVTy->getNumElements()))
3989 return PoisonValue::get(Ty);
3990 for (unsigned I = 0; I < FVTy->getNumElements(); ++I) {
3991 Constant *Elt = Operands[0]->getAggregateElement(I);
3992 if (!Elt)
3993 return nullptr;
3994 if (isa<UndefValue>(Elt) || Elt->isNullValue())
3995 continue;
3996 return ConstantInt::get(Ty, I);
3997 }
3998 if (ZeroIsPoison)
3999 return PoisonValue::get(Ty);
4000 return ConstantInt::get(Ty, FVTy->getNumElements());
4001 }
4002 return nullptr;
4003}
4004
4005static APFloat ConstantFoldAMDGCNCubeIntrinsic(Intrinsic::ID IntrinsicID,
4006 const APFloat &S0,
4007 const APFloat &S1,
4008 const APFloat &S2) {
4009 unsigned ID;
4010 const fltSemantics &Sem = S0.getSemantics();
4011 APFloat MA(Sem), SC(Sem), TC(Sem);
4012 if (abs(S2) >= abs(S0) && abs(S2) >= abs(S1)) {
4013 if (S2.isNegative() && S2.isNonZero() && !S2.isNaN()) {
4014 // S2 < 0
4015 ID = 5;
4016 SC = -S0;
4017 } else {
4018 ID = 4;
4019 SC = S0;
4020 }
4021 MA = S2;
4022 TC = -S1;
4023 } else if (abs(S1) >= abs(S0)) {
4024 if (S1.isNegative() && S1.isNonZero() && !S1.isNaN()) {
4025 // S1 < 0
4026 ID = 3;
4027 TC = -S2;
4028 } else {
4029 ID = 2;
4030 TC = S2;
4031 }
4032 MA = S1;
4033 SC = S0;
4034 } else {
4035 if (S0.isNegative() && S0.isNonZero() && !S0.isNaN()) {
4036 // S0 < 0
4037 ID = 1;
4038 SC = S2;
4039 } else {
4040 ID = 0;
4041 SC = -S2;
4042 }
4043 MA = S0;
4044 TC = -S1;
4045 }
4046 switch (IntrinsicID) {
4047 default:
4048 llvm_unreachable("unhandled amdgcn cube intrinsic");
4049 case Intrinsic::amdgcn_cubeid:
4050 return APFloat(Sem, ID);
4051 case Intrinsic::amdgcn_cubema:
4052 return MA + MA;
4053 case Intrinsic::amdgcn_cubesc:
4054 return SC;
4055 case Intrinsic::amdgcn_cubetc:
4056 return TC;
4057 }
4058}
4059
4060static Constant *ConstantFoldAMDGCNPermIntrinsic(ArrayRef<Constant *> Operands,
4061 Type *Ty) {
4062 const APInt *C0, *C1, *C2;
4063 if (!getConstIntOrUndef(Operands[0], C0) ||
4064 !getConstIntOrUndef(Operands[1], C1) ||
4065 !getConstIntOrUndef(Operands[2], C2))
4066 return nullptr;
4067
4068 if (!C2)
4069 return UndefValue::get(Ty);
4070
4071 APInt Val(32, 0);
4072 unsigned NumUndefBytes = 0;
4073 for (unsigned I = 0; I < 32; I += 8) {
4074 unsigned Sel = C2->extractBitsAsZExtValue(8, I);
4075 unsigned B = 0;
4076
4077 if (Sel >= 13)
4078 B = 0xff;
4079 else if (Sel == 12)
4080 B = 0x00;
4081 else {
4082 const APInt *Src = ((Sel & 10) == 10 || (Sel & 12) == 4) ? C0 : C1;
4083 if (!Src)
4084 ++NumUndefBytes;
4085 else if (Sel < 8)
4086 B = Src->extractBitsAsZExtValue(8, (Sel & 3) * 8);
4087 else
4088 B = Src->extractBitsAsZExtValue(1, (Sel & 1) ? 31 : 15) * 0xff;
4089 }
4090
4091 Val.insertBits(B, I, 8);
4092 }
4093
4094 if (NumUndefBytes == 4)
4095 return UndefValue::get(Ty);
4096
4097 return ConstantInt::get(Ty, Val);
4098}
4099
4100static Constant *ConstantFoldScalarCall3(StringRef Name,
4101 Intrinsic::ID IntrinsicID,
4102 Type *Ty,
4103 ArrayRef<Constant *> Operands,
4104 const TargetLibraryInfo *TLI,
4105 const CallBase *Call) {
4106 assert(Operands.size() == 3 && "Wrong number of operands.");
4107
4108 if (const auto *Op1 = dyn_cast<ConstantFP>(Operands[0])) {
4109 if (const auto *Op2 = dyn_cast<ConstantFP>(Operands[1])) {
4110 if (const auto *Op3 = dyn_cast<ConstantFP>(Operands[2])) {
4111 const APFloat &C1 = Op1->getValueAPF();
4112 const APFloat &C2 = Op2->getValueAPF();
4113 const APFloat &C3 = Op3->getValueAPF();
4114
4115 if (const auto *ConstrIntr = dyn_cast<ConstrainedFPIntrinsic>(Call)) {
4116 RoundingMode RM = getEvaluationRoundingMode(ConstrIntr);
4117 APFloat Res = C1;
4119 switch (IntrinsicID) {
4120 default:
4121 return nullptr;
4122 case Intrinsic::experimental_constrained_fma:
4123 case Intrinsic::experimental_constrained_fmuladd:
4124 St = Res.fusedMultiplyAdd(C2, C3, RM);
4125 break;
4126 }
4127 if (mayFoldConstrained(
4128 const_cast<ConstrainedFPIntrinsic *>(ConstrIntr), St))
4129 return ConstantFP::get(Ty, Res);
4130 return nullptr;
4131 }
4132
4133 switch (IntrinsicID) {
4134 default: break;
4135 case Intrinsic::amdgcn_fma_legacy: {
4136 // The legacy behaviour is that multiplying +/- 0.0 by anything, even
4137 // NaN or infinity, gives +0.0.
4138 if (C1.isZero() || C2.isZero()) {
4139 // It's tempting to just return C3 here, but that would give the
4140 // wrong result if C3 was -0.0.
4141 return ConstantFP::get(Ty, APFloat(0.0f) + C3);
4142 }
4143 [[fallthrough]];
4144 }
4145 case Intrinsic::fma:
4146 case Intrinsic::fmuladd: {
4147 APFloat V = C1;
4149 return ConstantFP::get(Ty, V);
4150 }
4151
4152 case Intrinsic::nvvm_fma_rm_f:
4153 case Intrinsic::nvvm_fma_rn_f:
4154 case Intrinsic::nvvm_fma_rp_f:
4155 case Intrinsic::nvvm_fma_rz_f:
4156 case Intrinsic::nvvm_fma_rm_d:
4157 case Intrinsic::nvvm_fma_rn_d:
4158 case Intrinsic::nvvm_fma_rp_d:
4159 case Intrinsic::nvvm_fma_rz_d:
4160 case Intrinsic::nvvm_fma_rm_ftz_f:
4161 case Intrinsic::nvvm_fma_rn_ftz_f:
4162 case Intrinsic::nvvm_fma_rp_ftz_f:
4163 case Intrinsic::nvvm_fma_rz_ftz_f: {
4164 bool IsFTZ = nvvm::FMAShouldFTZ(IntrinsicID);
4165 APFloat A = IsFTZ ? FTZPreserveSign(C1) : C1;
4166 APFloat B = IsFTZ ? FTZPreserveSign(C2) : C2;
4167 APFloat C = IsFTZ ? FTZPreserveSign(C3) : C3;
4168
4169 APFloat::roundingMode RoundMode =
4170 nvvm::GetFMARoundingMode(IntrinsicID);
4171
4172 APFloat Res = A;
4173 APFloat::opStatus Status = Res.fusedMultiplyAdd(B, C, RoundMode);
4174
4175 if (!Res.isNaN() &&
4177 Res = IsFTZ ? FTZPreserveSign(Res) : Res;
4178 return ConstantFP::get(Ty, Res);
4179 }
4180 return nullptr;
4181 }
4182
4183 case Intrinsic::amdgcn_cubeid:
4184 case Intrinsic::amdgcn_cubema:
4185 case Intrinsic::amdgcn_cubesc:
4186 case Intrinsic::amdgcn_cubetc: {
4187 APFloat V = ConstantFoldAMDGCNCubeIntrinsic(IntrinsicID, C1, C2, C3);
4188 return ConstantFP::get(Ty, V);
4189 }
4190 }
4191 }
4192 }
4193 }
4194
4195 if (IntrinsicID == Intrinsic::smul_fix ||
4196 IntrinsicID == Intrinsic::smul_fix_sat) {
4197 const APInt *C0, *C1;
4198 if (!getConstIntOrUndef(Operands[0], C0) ||
4199 !getConstIntOrUndef(Operands[1], C1))
4200 return nullptr;
4201
4202 // undef * C -> 0
4203 // C * undef -> 0
4204 if (!C0 || !C1)
4205 return Constant::getNullValue(Ty);
4206
4207 // This code performs rounding towards negative infinity in case the result
4208 // cannot be represented exactly for the given scale. Targets that do care
4209 // about rounding should use a target hook for specifying how rounding
4210 // should be done, and provide their own folding to be consistent with
4211 // rounding. This is the same approach as used by
4212 // DAGTypeLegalizer::ExpandIntRes_MULFIX.
4213 unsigned Scale = cast<ConstantInt>(Operands[2])->getZExtValue();
4214 unsigned Width = C0->getBitWidth();
4215 assert(Scale < Width && "Illegal scale.");
4216 unsigned ExtendedWidth = Width * 2;
4217 APInt Product =
4218 (C0->sext(ExtendedWidth) * C1->sext(ExtendedWidth)).ashr(Scale);
4219 if (IntrinsicID == Intrinsic::smul_fix_sat) {
4220 APInt Max = APInt::getSignedMaxValue(Width).sext(ExtendedWidth);
4221 APInt Min = APInt::getSignedMinValue(Width).sext(ExtendedWidth);
4222 Product = APIntOps::smin(Product, Max);
4223 Product = APIntOps::smax(Product, Min);
4224 }
4225 return ConstantInt::get(Ty->getContext(), Product.sextOrTrunc(Width));
4226 }
4227
4228 if (IntrinsicID == Intrinsic::fshl || IntrinsicID == Intrinsic::fshr) {
4229 const APInt *C0, *C1, *C2;
4230 if (!getConstIntOrUndef(Operands[0], C0) ||
4231 !getConstIntOrUndef(Operands[1], C1) ||
4232 !getConstIntOrUndef(Operands[2], C2))
4233 return nullptr;
4234
4235 bool IsRight = IntrinsicID == Intrinsic::fshr;
4236 if (!C2)
4237 return Operands[IsRight ? 1 : 0];
4238 if (!C0 && !C1)
4239 return UndefValue::get(Ty);
4240
4241 // The shift amount is interpreted as modulo the bitwidth. If the shift
4242 // amount is effectively 0, avoid UB due to oversized inverse shift below.
4243 unsigned BitWidth = C2->getBitWidth();
4244 unsigned ShAmt = C2->urem(BitWidth);
4245 if (!ShAmt)
4246 return Operands[IsRight ? 1 : 0];
4247
4248 // (C0 << ShlAmt) | (C1 >> LshrAmt)
4249 unsigned LshrAmt = IsRight ? ShAmt : BitWidth - ShAmt;
4250 unsigned ShlAmt = !IsRight ? ShAmt : BitWidth - ShAmt;
4251 if (!C0)
4252 return ConstantInt::get(Ty, C1->lshr(LshrAmt));
4253 if (!C1)
4254 return ConstantInt::get(Ty, C0->shl(ShlAmt));
4255 return ConstantInt::get(Ty, C0->shl(ShlAmt) | C1->lshr(LshrAmt));
4256 }
4257
4258 if (IntrinsicID == Intrinsic::amdgcn_perm)
4259 return ConstantFoldAMDGCNPermIntrinsic(Operands, Ty);
4260
4261 return nullptr;
4262}
4263
4264static Constant *ConstantFoldScalarCall(StringRef Name,
4265 Intrinsic::ID IntrinsicID,
4266 Type *Ty,
4267 ArrayRef<Constant *> Operands,
4268 const TargetLibraryInfo *TLI,
4269 const CallBase *Call) {
4270 if (IntrinsicID != Intrinsic::not_intrinsic &&
4271 any_of(Operands, IsaPred<PoisonValue>) &&
4272 intrinsicPropagatesPoison(IntrinsicID))
4273 return PoisonValue::get(Ty);
4274
4275 if (Operands.size() == 1)
4276 return ConstantFoldScalarCall1(Name, IntrinsicID, Ty, Operands, TLI, Call);
4277
4278 if (Operands.size() == 2) {
4279 if (Constant *FoldedLibCall =
4280 ConstantFoldLibCall2(Name, Ty, Operands, TLI)) {
4281 return FoldedLibCall;
4282 }
4283 return ConstantFoldIntrinsicCall2(IntrinsicID, Ty, Operands, Call);
4284 }
4285
4286 if (Operands.size() == 3)
4287 return ConstantFoldScalarCall3(Name, IntrinsicID, Ty, Operands, TLI, Call);
4288
4289 return nullptr;
4290}
4291
4292static Constant *ConstantFoldFixedVectorCall(
4293 StringRef Name, Intrinsic::ID IntrinsicID, FixedVectorType *FVTy,
4294 ArrayRef<Constant *> Operands, const DataLayout &DL,
4295 const TargetLibraryInfo *TLI, const CallBase *Call) {
4297 SmallVector<Constant *, 4> Lane(Operands.size());
4298 Type *Ty = FVTy->getElementType();
4299
4300 switch (IntrinsicID) {
4301 case Intrinsic::masked_load: {
4302 auto *SrcPtr = Operands[0];
4303 auto *Mask = Operands[1];
4304 auto *Passthru = Operands[2];
4305
4306 Constant *VecData = ConstantFoldLoadFromConstPtr(SrcPtr, FVTy, DL);
4307
4308 SmallVector<Constant *, 32> NewElements;
4309 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4310 auto *MaskElt = Mask->getAggregateElement(I);
4311 if (!MaskElt)
4312 break;
4313 auto *PassthruElt = Passthru->getAggregateElement(I);
4314 auto *VecElt = VecData ? VecData->getAggregateElement(I) : nullptr;
4315 if (isa<UndefValue>(MaskElt)) {
4316 if (PassthruElt)
4317 NewElements.push_back(PassthruElt);
4318 else if (VecElt)
4319 NewElements.push_back(VecElt);
4320 else
4321 return nullptr;
4322 }
4323 if (MaskElt->isNullValue()) {
4324 if (!PassthruElt)
4325 return nullptr;
4326 NewElements.push_back(PassthruElt);
4327 } else if (MaskElt->isOneValue()) {
4328 if (!VecElt)
4329 return nullptr;
4330 NewElements.push_back(VecElt);
4331 } else {
4332 return nullptr;
4333 }
4334 }
4335 if (NewElements.size() != FVTy->getNumElements())
4336 return nullptr;
4337 return ConstantVector::get(NewElements);
4338 }
4339 case Intrinsic::arm_mve_vctp8:
4340 case Intrinsic::arm_mve_vctp16:
4341 case Intrinsic::arm_mve_vctp32:
4342 case Intrinsic::arm_mve_vctp64: {
4343 if (auto *Op = dyn_cast<ConstantInt>(Operands[0])) {
4344 unsigned Lanes = FVTy->getNumElements();
4345 uint64_t Limit = Op->getZExtValue();
4346
4348 for (unsigned i = 0; i < Lanes; i++) {
4349 if (i < Limit)
4351 else
4353 }
4354 return ConstantVector::get(NCs);
4355 }
4356 return nullptr;
4357 }
4358 case Intrinsic::get_active_lane_mask: {
4359 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4360 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4361 if (Op0 && Op1) {
4362 unsigned Lanes = FVTy->getNumElements();
4363 uint64_t Base = Op0->getZExtValue();
4364 uint64_t Limit = Op1->getZExtValue();
4365
4367 for (unsigned i = 0; i < Lanes; i++) {
4368 if (Base + i < Limit)
4370 else
4372 }
4373 return ConstantVector::get(NCs);
4374 }
4375 return nullptr;
4376 }
4377 case Intrinsic::vector_extract: {
4378 auto *Idx = dyn_cast<ConstantInt>(Operands[1]);
4379 Constant *Vec = Operands[0];
4380 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4381 return nullptr;
4382
4383 unsigned NumElements = FVTy->getNumElements();
4384 unsigned VecNumElements =
4385 cast<FixedVectorType>(Vec->getType())->getNumElements();
4386 unsigned StartingIndex = Idx->getZExtValue();
4387
4388 // Extracting entire vector is nop
4389 if (NumElements == VecNumElements && StartingIndex == 0)
4390 return Vec;
4391
4392 for (unsigned I = StartingIndex, E = StartingIndex + NumElements; I < E;
4393 ++I) {
4394 Constant *Elt = Vec->getAggregateElement(I);
4395 if (!Elt)
4396 return nullptr;
4397 Result[I - StartingIndex] = Elt;
4398 }
4399
4400 return ConstantVector::get(Result);
4401 }
4402 case Intrinsic::vector_insert: {
4403 Constant *Vec = Operands[0];
4404 Constant *SubVec = Operands[1];
4405 auto *Idx = dyn_cast<ConstantInt>(Operands[2]);
4406 if (!Idx || !isa<FixedVectorType>(Vec->getType()))
4407 return nullptr;
4408
4409 unsigned SubVecNumElements =
4410 cast<FixedVectorType>(SubVec->getType())->getNumElements();
4411 unsigned VecNumElements =
4412 cast<FixedVectorType>(Vec->getType())->getNumElements();
4413 unsigned IdxN = Idx->getZExtValue();
4414 // Replacing entire vector with a subvec is nop
4415 if (SubVecNumElements == VecNumElements && IdxN == 0)
4416 return SubVec;
4417
4418 for (unsigned I = 0; I < VecNumElements; ++I) {
4419 Constant *Elt;
4420 if (I < IdxN + SubVecNumElements)
4421 Elt = SubVec->getAggregateElement(I - IdxN);
4422 else
4423 Elt = Vec->getAggregateElement(I);
4424 if (!Elt)
4425 return nullptr;
4426 Result[I] = Elt;
4427 }
4428 return ConstantVector::get(Result);
4429 }
4430 case Intrinsic::vector_interleave2:
4431 case Intrinsic::vector_interleave3:
4432 case Intrinsic::vector_interleave4:
4433 case Intrinsic::vector_interleave5:
4434 case Intrinsic::vector_interleave6:
4435 case Intrinsic::vector_interleave7:
4436 case Intrinsic::vector_interleave8: {
4437 unsigned NumElements =
4438 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4439 unsigned NumOperands = Operands.size();
4440 for (unsigned I = 0; I < NumElements; ++I) {
4441 for (unsigned J = 0; J < NumOperands; ++J) {
4442 Constant *Elt = Operands[J]->getAggregateElement(I);
4443 if (!Elt)
4444 return nullptr;
4445 Result[NumOperands * I + J] = Elt;
4446 }
4447 }
4448 return ConstantVector::get(Result);
4449 }
4450 case Intrinsic::wasm_dot: {
4451 unsigned NumElements =
4452 cast<FixedVectorType>(Operands[0]->getType())->getNumElements();
4453
4454 assert(NumElements == 8 && Result.size() == 4 &&
4455 "wasm dot takes i16x8 and produces i32x4");
4456 assert(Ty->isIntegerTy());
4457 int32_t MulVector[8];
4458
4459 for (unsigned I = 0; I < NumElements; ++I) {
4460 ConstantInt *Elt0 =
4461 cast<ConstantInt>(Operands[0]->getAggregateElement(I));
4462 ConstantInt *Elt1 =
4463 cast<ConstantInt>(Operands[1]->getAggregateElement(I));
4464
4465 MulVector[I] = Elt0->getSExtValue() * Elt1->getSExtValue();
4466 }
4467 for (unsigned I = 0; I < Result.size(); I++) {
4468 int64_t IAdd = (int64_t)MulVector[I * 2] + (int64_t)MulVector[I * 2 + 1];
4469 Result[I] = ConstantInt::getSigned(Ty, IAdd, /*ImplicitTrunc=*/true);
4470 }
4471
4472 return ConstantVector::get(Result);
4473 }
4474 default:
4475 break;
4476 }
4477
4478 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4479 // Gather a column of constants.
4480 for (unsigned J = 0, JE = Operands.size(); J != JE; ++J) {
4481 // Some intrinsics use a scalar type for certain arguments.
4482 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, J, /*TTI=*/nullptr)) {
4483 Lane[J] = Operands[J];
4484 continue;
4485 }
4486
4487 Constant *Agg = Operands[J]->getAggregateElement(I);
4488 if (!Agg)
4489 return nullptr;
4490
4491 Lane[J] = Agg;
4492 }
4493
4494 // Use the regular scalar folding to simplify this column.
4495 Constant *Folded =
4496 ConstantFoldScalarCall(Name, IntrinsicID, Ty, Lane, TLI, Call);
4497 if (!Folded)
4498 return nullptr;
4499 Result[I] = Folded;
4500 }
4501
4502 return ConstantVector::get(Result);
4503}
4504
4505static Constant *ConstantFoldScalableVectorCall(
4506 StringRef Name, Intrinsic::ID IntrinsicID, ScalableVectorType *SVTy,
4507 ArrayRef<Constant *> Operands, const DataLayout &DL,
4508 const TargetLibraryInfo *TLI, const CallBase *Call) {
4509 switch (IntrinsicID) {
4510 case Intrinsic::aarch64_sve_convert_from_svbool: {
4511 Constant *Src = Operands[0];
4512 if (!Src->isNullValue())
4513 break;
4514
4515 return ConstantInt::getFalse(SVTy);
4516 }
4517 case Intrinsic::get_active_lane_mask: {
4518 auto *Op0 = dyn_cast<ConstantInt>(Operands[0]);
4519 auto *Op1 = dyn_cast<ConstantInt>(Operands[1]);
4520 if (Op0 && Op1 && Op0->getValue().uge(Op1->getValue()))
4521 return ConstantVector::getNullValue(SVTy);
4522 break;
4523 }
4524 case Intrinsic::vector_interleave2:
4525 case Intrinsic::vector_interleave3:
4526 case Intrinsic::vector_interleave4:
4527 case Intrinsic::vector_interleave5:
4528 case Intrinsic::vector_interleave6:
4529 case Intrinsic::vector_interleave7:
4530 case Intrinsic::vector_interleave8: {
4531 Constant *SplatVal = Operands[0]->getSplatValue();
4532 if (!SplatVal)
4533 return nullptr;
4534
4535 if (!llvm::all_equal(Operands))
4536 return nullptr;
4537
4538 return ConstantVector::getSplat(SVTy->getElementCount(), SplatVal);
4539 }
4540 default:
4541 break;
4542 }
4543
4544 // If trivially vectorizable, try folding it via the scalar call if all
4545 // operands are splats.
4546
4547 // TODO: ConstantFoldFixedVectorCall should probably check this too?
4548 if (!isTriviallyVectorizable(IntrinsicID))
4549 return nullptr;
4550
4552 for (auto [I, Op] : enumerate(Operands)) {
4553 if (isVectorIntrinsicWithScalarOpAtArg(IntrinsicID, I, /*TTI=*/nullptr)) {
4554 SplatOps.push_back(Op);
4555 continue;
4556 }
4557 Constant *Splat = Op->getSplatValue();
4558 if (!Splat)
4559 return nullptr;
4560 SplatOps.push_back(Splat);
4561 }
4562 Constant *Folded = ConstantFoldScalarCall(
4563 Name, IntrinsicID, SVTy->getElementType(), SplatOps, TLI, Call);
4564 if (!Folded)
4565 return nullptr;
4566 return ConstantVector::getSplat(SVTy->getElementCount(), Folded);
4567}
4568
4569static std::pair<Constant *, Constant *>
4570ConstantFoldScalarFrexpCall(Constant *Op, Type *IntTy) {
4571 if (isa<PoisonValue>(Op))
4572 return {Op, PoisonValue::get(IntTy)};
4573
4574 auto *ConstFP = dyn_cast<ConstantFP>(Op);
4575 if (!ConstFP)
4576 return {};
4577
4578 const APFloat &U = ConstFP->getValueAPF();
4579 int FrexpExp;
4580 APFloat FrexpMant = frexp(U, FrexpExp, APFloat::rmNearestTiesToEven);
4581 Constant *Result0 = ConstantFP::get(ConstFP->getType(), FrexpMant);
4582
4583 // The exponent is an "unspecified value" for inf/nan. We use zero to avoid
4584 // using undef.
4585 Constant *Result1 = FrexpMant.isFinite()
4586 ? ConstantInt::getSigned(IntTy, FrexpExp)
4587 : ConstantInt::getNullValue(IntTy);
4588 return {Result0, Result1};
4589}
4590
4591/// Handle intrinsics that return tuples, which may be tuples of vectors.
4592static Constant *
4593ConstantFoldStructCall(StringRef Name, Intrinsic::ID IntrinsicID,
4594 StructType *StTy, ArrayRef<Constant *> Operands,
4595 const DataLayout &DL, const TargetLibraryInfo *TLI,
4596 const CallBase *Call) {
4597
4598 switch (IntrinsicID) {
4599 case Intrinsic::frexp: {
4600 Type *Ty0 = StTy->getContainedType(0);
4601 Type *Ty1 = StTy->getContainedType(1)->getScalarType();
4602
4603 if (auto *FVTy0 = dyn_cast<FixedVectorType>(Ty0)) {
4604 SmallVector<Constant *, 4> Results0(FVTy0->getNumElements());
4605 SmallVector<Constant *, 4> Results1(FVTy0->getNumElements());
4606
4607 for (unsigned I = 0, E = FVTy0->getNumElements(); I != E; ++I) {
4608 Constant *Lane = Operands[0]->getAggregateElement(I);
4609 std::tie(Results0[I], Results1[I]) =
4610 ConstantFoldScalarFrexpCall(Lane, Ty1);
4611 if (!Results0[I])
4612 return nullptr;
4613 }
4614
4615 return ConstantStruct::get(StTy, ConstantVector::get(Results0),
4616 ConstantVector::get(Results1));
4617 }
4618
4619 auto [Result0, Result1] = ConstantFoldScalarFrexpCall(Operands[0], Ty1);
4620 if (!Result0)
4621 return nullptr;
4622 return ConstantStruct::get(StTy, Result0, Result1);
4623 }
4624 case Intrinsic::sincos: {
4625 Type *Ty = StTy->getContainedType(0);
4626 Type *TyScalar = Ty->getScalarType();
4627
4628 auto ConstantFoldScalarSincosCall =
4629 [&](Constant *Op) -> std::pair<Constant *, Constant *> {
4630 Constant *SinResult =
4631 ConstantFoldScalarCall(Name, Intrinsic::sin, TyScalar, Op, TLI, Call);
4632 Constant *CosResult =
4633 ConstantFoldScalarCall(Name, Intrinsic::cos, TyScalar, Op, TLI, Call);
4634 return std::make_pair(SinResult, CosResult);
4635 };
4636
4637 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty)) {
4638 SmallVector<Constant *> SinResults(FVTy->getNumElements());
4639 SmallVector<Constant *> CosResults(FVTy->getNumElements());
4640
4641 for (unsigned I = 0, E = FVTy->getNumElements(); I != E; ++I) {
4642 Constant *Lane = Operands[0]->getAggregateElement(I);
4643 std::tie(SinResults[I], CosResults[I]) =
4644 ConstantFoldScalarSincosCall(Lane);
4645 if (!SinResults[I] || !CosResults[I])
4646 return nullptr;
4647 }
4648
4649 return ConstantStruct::get(StTy, ConstantVector::get(SinResults),
4650 ConstantVector::get(CosResults));
4651 }
4652
4653 if (!Ty->isFloatingPointTy())
4654 return nullptr;
4655
4656 auto [SinResult, CosResult] = ConstantFoldScalarSincosCall(Operands[0]);
4657 if (!SinResult || !CosResult)
4658 return nullptr;
4659 return ConstantStruct::get(StTy, SinResult, CosResult);
4660 }
4661 case Intrinsic::vector_deinterleave2:
4662 case Intrinsic::vector_deinterleave3:
4663 case Intrinsic::vector_deinterleave4:
4664 case Intrinsic::vector_deinterleave5:
4665 case Intrinsic::vector_deinterleave6:
4666 case Intrinsic::vector_deinterleave7:
4667 case Intrinsic::vector_deinterleave8: {
4668 unsigned NumResults = StTy->getNumElements();
4669 auto *Vec = Operands[0];
4670 auto *VecTy = cast<VectorType>(Vec->getType());
4671
4672 ElementCount ResultEC =
4673 VecTy->getElementCount().divideCoefficientBy(NumResults);
4674
4675 if (auto *EltC = Vec->getSplatValue()) {
4676 auto *ResultVec = ConstantVector::getSplat(ResultEC, EltC);
4677 SmallVector<Constant *, 8> Results(NumResults, ResultVec);
4678 return ConstantStruct::get(StTy, Results);
4679 }
4680
4681 if (!ResultEC.isFixed())
4682 return nullptr;
4683
4684 unsigned NumElements = ResultEC.getFixedValue();
4686 SmallVector<Constant *> Elements(NumElements);
4687 for (unsigned I = 0; I != NumResults; ++I) {
4688 for (unsigned J = 0; J != NumElements; ++J) {
4689 Constant *Elt = Vec->getAggregateElement(J * NumResults + I);
4690 if (!Elt)
4691 return nullptr;
4692 Elements[J] = Elt;
4693 }
4694 Results[I] = ConstantVector::get(Elements);
4695 }
4696 return ConstantStruct::get(StTy, Results);
4697 }
4698 default:
4699 // TODO: Constant folding of vector intrinsics that fall through here does
4700 // not work (e.g. overflow intrinsics)
4701 return ConstantFoldScalarCall(Name, IntrinsicID, StTy, Operands, TLI, Call);
4702 }
4703
4704 return nullptr;
4705}
4706
4707} // end anonymous namespace
4708
4710 Type *Ty) {
4711 return ConstantFoldScalarCall1("", ID, Ty, Op, nullptr, nullptr);
4712}
4713
4715 Constant *RHS, Type *Ty) {
4716 return ConstantFoldIntrinsicCall2(ID, Ty, {LHS, RHS}, nullptr);
4717}
4718
4720 ArrayRef<Constant *> Operands,
4721 const TargetLibraryInfo *TLI,
4722 bool AllowNonDeterministic) {
4723 if (Call->isNoBuiltin())
4724 return nullptr;
4725 if (!F->hasName())
4726 return nullptr;
4727
4728 // If this is not an intrinsic and not recognized as a library call, bail out.
4729 Intrinsic::ID IID = F->getIntrinsicID();
4730 if (IID == Intrinsic::not_intrinsic) {
4731 if (!TLI)
4732 return nullptr;
4733 LibFunc LibF;
4734 if (!TLI->getLibFunc(*F, LibF))
4735 return nullptr;
4736 }
4737
4738 // Conservatively assume that floating-point libcalls may be
4739 // non-deterministic.
4740 Type *Ty = F->getReturnType();
4741 if (!AllowNonDeterministic && Ty->isFPOrFPVectorTy())
4742 return nullptr;
4743
4744 StringRef Name = F->getName();
4745 if (auto *FVTy = dyn_cast<FixedVectorType>(Ty))
4746 return ConstantFoldFixedVectorCall(
4747 Name, IID, FVTy, Operands, F->getDataLayout(), TLI, Call);
4748
4749 if (auto *SVTy = dyn_cast<ScalableVectorType>(Ty))
4750 return ConstantFoldScalableVectorCall(
4751 Name, IID, SVTy, Operands, F->getDataLayout(), TLI, Call);
4752
4753 if (auto *StTy = dyn_cast<StructType>(Ty))
4754 return ConstantFoldStructCall(Name, IID, StTy, Operands,
4755 F->getDataLayout(), TLI, Call);
4756
4757 // TODO: If this is a library function, we already discovered that above,
4758 // so we should pass the LibFunc, not the name (and it might be better
4759 // still to separate intrinsic handling from libcalls).
4760 return ConstantFoldScalarCall(Name, IID, Ty, Operands, TLI, Call);
4761}
4762
4764 const TargetLibraryInfo *TLI) {
4765 // FIXME: Refactor this code; this duplicates logic in LibCallsShrinkWrap
4766 // (and to some extent ConstantFoldScalarCall).
4767 if (Call->isNoBuiltin() || Call->isStrictFP())
4768 return false;
4769 Function *F = Call->getCalledFunction();
4770 if (!F)
4771 return false;
4772
4773 LibFunc Func;
4774 if (!TLI || !TLI->getLibFunc(*F, Func))
4775 return false;
4776
4777 if (Call->arg_size() == 1) {
4778 if (ConstantFP *OpC = dyn_cast<ConstantFP>(Call->getArgOperand(0))) {
4779 const APFloat &Op = OpC->getValueAPF();
4780 switch (Func) {
4781 case LibFunc_logl:
4782 case LibFunc_log:
4783 case LibFunc_logf:
4784 case LibFunc_log2l:
4785 case LibFunc_log2:
4786 case LibFunc_log2f:
4787 case LibFunc_log10l:
4788 case LibFunc_log10:
4789 case LibFunc_log10f:
4790 return Op.isNaN() || (!Op.isZero() && !Op.isNegative());
4791
4792 case LibFunc_ilogb:
4793 return !Op.isNaN() && !Op.isZero() && !Op.isInfinity();
4794
4795 case LibFunc_expl:
4796 case LibFunc_exp:
4797 case LibFunc_expf:
4798 // FIXME: These boundaries are slightly conservative.
4799 if (OpC->getType()->isDoubleTy())
4800 return !(Op < APFloat(-745.0) || Op > APFloat(709.0));
4801 if (OpC->getType()->isFloatTy())
4802 return !(Op < APFloat(-103.0f) || Op > APFloat(88.0f));
4803 break;
4804
4805 case LibFunc_exp2l:
4806 case LibFunc_exp2:
4807 case LibFunc_exp2f:
4808 // FIXME: These boundaries are slightly conservative.
4809 if (OpC->getType()->isDoubleTy())
4810 return !(Op < APFloat(-1074.0) || Op > APFloat(1023.0));
4811 if (OpC->getType()->isFloatTy())
4812 return !(Op < APFloat(-149.0f) || Op > APFloat(127.0f));
4813 break;
4814
4815 case LibFunc_sinl:
4816 case LibFunc_sin:
4817 case LibFunc_sinf:
4818 case LibFunc_cosl:
4819 case LibFunc_cos:
4820 case LibFunc_cosf:
4821 return !Op.isInfinity();
4822
4823 case LibFunc_tanl:
4824 case LibFunc_tan:
4825 case LibFunc_tanf: {
4826 // FIXME: Stop using the host math library.
4827 // FIXME: The computation isn't done in the right precision.
4828 Type *Ty = OpC->getType();
4829 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy())
4830 return ConstantFoldFP(tan, OpC->getValueAPF(), Ty) != nullptr;
4831 break;
4832 }
4833
4834 case LibFunc_atan:
4835 case LibFunc_atanf:
4836 case LibFunc_atanl:
4837 // Per POSIX, this MAY fail if Op is denormal. We choose not failing.
4838 return true;
4839
4840 case LibFunc_asinl:
4841 case LibFunc_asin:
4842 case LibFunc_asinf:
4843 case LibFunc_acosl:
4844 case LibFunc_acos:
4845 case LibFunc_acosf:
4846 return !(Op < APFloat::getOne(Op.getSemantics(), true) ||
4847 Op > APFloat::getOne(Op.getSemantics()));
4848
4849 case LibFunc_sinh:
4850 case LibFunc_cosh:
4851 case LibFunc_sinhf:
4852 case LibFunc_coshf:
4853 case LibFunc_sinhl:
4854 case LibFunc_coshl:
4855 // FIXME: These boundaries are slightly conservative.
4856 if (OpC->getType()->isDoubleTy())
4857 return !(Op < APFloat(-710.0) || Op > APFloat(710.0));
4858 if (OpC->getType()->isFloatTy())
4859 return !(Op < APFloat(-89.0f) || Op > APFloat(89.0f));
4860 break;
4861
4862 case LibFunc_sqrtl:
4863 case LibFunc_sqrt:
4864 case LibFunc_sqrtf:
4865 return Op.isNaN() || Op.isZero() || !Op.isNegative();
4866
4867 // FIXME: Add more functions: sqrt_finite, atanh, expm1, log1p,
4868 // maybe others?
4869 default:
4870 break;
4871 }
4872 }
4873 }
4874
4875 if (Call->arg_size() == 2) {
4876 ConstantFP *Op0C = dyn_cast<ConstantFP>(Call->getArgOperand(0));
4877 ConstantFP *Op1C = dyn_cast<ConstantFP>(Call->getArgOperand(1));
4878 if (Op0C && Op1C) {
4879 const APFloat &Op0 = Op0C->getValueAPF();
4880 const APFloat &Op1 = Op1C->getValueAPF();
4881
4882 switch (Func) {
4883 case LibFunc_powl:
4884 case LibFunc_pow:
4885 case LibFunc_powf: {
4886 // FIXME: Stop using the host math library.
4887 // FIXME: The computation isn't done in the right precision.
4888 Type *Ty = Op0C->getType();
4889 if (Ty->isDoubleTy() || Ty->isFloatTy() || Ty->isHalfTy()) {
4890 if (Ty == Op1C->getType())
4891 return ConstantFoldBinaryFP(pow, Op0, Op1, Ty) != nullptr;
4892 }
4893 break;
4894 }
4895
4896 case LibFunc_fmodl:
4897 case LibFunc_fmod:
4898 case LibFunc_fmodf:
4899 case LibFunc_remainderl:
4900 case LibFunc_remainder:
4901 case LibFunc_remainderf:
4902 return Op0.isNaN() || Op1.isNaN() ||
4903 (!Op0.isInfinity() && !Op1.isZero());
4904
4905 case LibFunc_atan2:
4906 case LibFunc_atan2f:
4907 case LibFunc_atan2l:
4908 // Although IEEE-754 says atan2(+/-0.0, +/-0.0) are well-defined, and
4909 // GLIBC and MSVC do not appear to raise an error on those, we
4910 // cannot rely on that behavior. POSIX and C11 say that a domain error
4911 // may occur, so allow for that possibility.
4912 return !Op0.isZero() || !Op1.isZero();
4913
4914 case LibFunc_nextafter:
4915 case LibFunc_nextafterf:
4916 case LibFunc_nextafterl:
4917 case LibFunc_nexttoward:
4918 case LibFunc_nexttowardf:
4919 case LibFunc_nexttowardl: {
4920 return ConstantFoldNextToward(Op0, Op1, F->getReturnType()) != nullptr;
4921 }
4922 default:
4923 break;
4924 }
4925 }
4926 }
4927
4928 return false;
4929}
4930
4932 unsigned CastOp, const DataLayout &DL,
4933 PreservedCastFlags *Flags) {
4934 switch (CastOp) {
4935 case Instruction::BitCast:
4936 // Bitcast is always lossless.
4937 return ConstantFoldCastOperand(Instruction::BitCast, C, InvCastTo, DL);
4938 case Instruction::Trunc: {
4939 auto *ZExtC = ConstantFoldCastOperand(Instruction::ZExt, C, InvCastTo, DL);
4940 if (Flags) {
4941 // Truncation back on ZExt value is always NUW.
4942 Flags->NUW = true;
4943 // Test positivity of C.
4944 auto *SExtC =
4945 ConstantFoldCastOperand(Instruction::SExt, C, InvCastTo, DL);
4946 Flags->NSW = ZExtC == SExtC;
4947 }
4948 return ZExtC;
4949 }
4950 case Instruction::SExt:
4951 case Instruction::ZExt: {
4952 auto *InvC = ConstantExpr::getTrunc(C, InvCastTo);
4953 auto *CastInvC = ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4954 // Must satisfy CastOp(InvC) == C.
4955 if (!CastInvC || CastInvC != C)
4956 return nullptr;
4957 if (Flags && CastOp == Instruction::ZExt) {
4958 auto *SExtInvC =
4959 ConstantFoldCastOperand(Instruction::SExt, InvC, C->getType(), DL);
4960 // Test positivity of InvC.
4961 Flags->NNeg = CastInvC == SExtInvC;
4962 }
4963 return InvC;
4964 }
4965 case Instruction::FPExt: {
4966 Constant *InvC =
4967 ConstantFoldCastOperand(Instruction::FPTrunc, C, InvCastTo, DL);
4968 if (InvC) {
4969 Constant *CastInvC =
4970 ConstantFoldCastOperand(CastOp, InvC, C->getType(), DL);
4971 if (CastInvC == C)
4972 return InvC;
4973 }
4974 return nullptr;
4975 }
4976 default:
4977 return nullptr;
4978 }
4979}
4980
4982 const DataLayout &DL,
4983 PreservedCastFlags *Flags) {
4984 return getLosslessInvCast(C, DestTy, Instruction::ZExt, DL, Flags);
4985}
4986
4988 const DataLayout &DL,
4989 PreservedCastFlags *Flags) {
4990 return getLosslessInvCast(C, DestTy, Instruction::SExt, DL, Flags);
4991}
4992
4993void TargetFolder::anchor() {}
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
constexpr LLT S1
This file declares a class to represent arbitrary precision floating point values and provide a varie...
This file implements a class to represent arbitrary precision integral constant values and operations...
This file implements the APSInt class, which is a simple class that represents an arbitrary sized int...
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
#define X(NUM, ENUM, NAME)
Definition ELF.h:853
static GCRegistry::Add< ErlangGC > A("erlang", "erlang-compatible garbage collector")
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static GCRegistry::Add< OcamlGC > B("ocaml", "ocaml 3.10-compatible GC")
static Constant * FoldBitCast(Constant *V, Type *DestTy)
static ConstantFP * flushDenormalConstant(Type *Ty, const APFloat &APF, DenormalMode::DenormalModeKind Mode)
Constant * getConstantAtOffset(Constant *Base, APInt Offset, const DataLayout &DL)
If this Offset points exactly to the start of an aggregate element, return that element,...
static cl::opt< bool > DisableFPCallFolding("disable-fp-call-folding", cl::desc("Disable constant-folding of FP intrinsics and libcalls."), cl::init(false), cl::Hidden)
static ConstantFP * flushDenormalConstantFP(ConstantFP *CFP, const Instruction *Inst, bool IsOutput)
static DenormalMode getInstrDenormalMode(const Instruction *CtxI, Type *Ty)
Return the denormal mode that can be assumed when executing a floating point operation at CtxI.
This file contains the declarations for the subclasses of Constant, which represent the different fla...
This file defines the DenseMap class.
Hexagon Common GEP
amode Optimize addressing mode
static constexpr Value * getValue(Ty &ValueOrUse)
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
static bool InRange(int64_t Value, unsigned short Shift, int LBound, int HBound)
This file contains the definitions of the enumerations and flags associated with NVVM Intrinsics,...
if(PassOpts->AAPipeline)
const SmallVectorImpl< MachineOperand > & Cond
static cl::opt< RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode > Mode("regalloc-enable-advisor", cl::Hidden, cl::init(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default), cl::desc("Enable regalloc advisor mode"), cl::values(clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Default, "default", "Default"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Release, "release", "precompiled"), clEnumValN(RegAllocEvictionAdvisorAnalysisLegacy::AdvisorMode::Development, "development", "for training")))
This file contains some templates that are useful if you are working with the STL at all.
This file implements the SmallBitVector class.
This file defines the SmallVector class.
static SymbolRef::Type getType(const Symbol *Sym)
Definition TapiFile.cpp:39
The Input class is used to parse a yaml document into in-memory structs and vectors.
cmpResult
IEEE-754R 5.11: Floating Point Comparison Relations.
Definition APFloat.h:335
static constexpr roundingMode rmTowardZero
Definition APFloat.h:349
llvm::RoundingMode roundingMode
IEEE-754R 4.3: Rounding-direction attributes.
Definition APFloat.h:343
static const fltSemantics & IEEEdouble()
Definition APFloat.h:298
static constexpr roundingMode rmTowardNegative
Definition APFloat.h:348
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:345
static constexpr roundingMode rmTowardPositive
Definition APFloat.h:347
static const fltSemantics & IEEEhalf()
Definition APFloat.h:295
static constexpr roundingMode rmNearestTiesToAway
Definition APFloat.h:350
opStatus
IEEE-754R 7: Default exception handling.
Definition APFloat.h:361
static APFloat getQNaN(const fltSemantics &Sem, bool Negative=false, const APInt *payload=nullptr)
Factory for QNaN values.
Definition APFloat.h:1185
opStatus divide(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1273
void copySign(const APFloat &RHS)
Definition APFloat.h:1367
LLVM_ABI opStatus convert(const fltSemantics &ToSemantics, roundingMode RM, bool *losesInfo)
Definition APFloat.cpp:5901
opStatus subtract(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1255
bool isNegative() const
Definition APFloat.h:1544
LLVM_ABI double convertToDouble() const
Converts this APFloat to host double value.
Definition APFloat.cpp:5960
bool isPosInfinity() const
Definition APFloat.h:1557
bool isNormal() const
Definition APFloat.h:1548
bool isDenormal() const
Definition APFloat.h:1545
opStatus add(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1246
const fltSemantics & getSemantics() const
Definition APFloat.h:1552
bool isNonZero() const
Definition APFloat.h:1553
bool isFinite() const
Definition APFloat.h:1549
bool isNaN() const
Definition APFloat.h:1542
static APFloat getOne(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative One.
Definition APFloat.h:1153
opStatus multiply(const APFloat &RHS, roundingMode RM)
Definition APFloat.h:1264
LLVM_ABI float convertToFloat() const
Converts this APFloat to host float value.
Definition APFloat.cpp:5988
bool isSignaling() const
Definition APFloat.h:1546
opStatus fusedMultiplyAdd(const APFloat &Multiplicand, const APFloat &Addend, roundingMode RM)
Definition APFloat.h:1300
bool isZero() const
Definition APFloat.h:1540
opStatus convertToInteger(MutableArrayRef< integerPart > Input, unsigned int Width, bool IsSigned, roundingMode RM, bool *IsExact) const
Definition APFloat.h:1397
opStatus mod(const APFloat &RHS)
Definition APFloat.h:1291
bool isNegInfinity() const
Definition APFloat.h:1558
opStatus roundToIntegral(roundingMode RM)
Definition APFloat.h:1313
void changeSign()
Definition APFloat.h:1362
static APFloat getZero(const fltSemantics &Sem, bool Negative=false)
Factory for Positive and Negative Zero.
Definition APFloat.h:1144
bool isInfinity() const
Definition APFloat.h:1541
Class for arbitrary precision integers.
Definition APInt.h:78
LLVM_ABI APInt umul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:2006
LLVM_ABI APInt usub_sat(const APInt &RHS) const
Definition APInt.cpp:2090
bool isMinSignedValue() const
Determine if this is the smallest signed value.
Definition APInt.h:424
uint64_t getZExtValue() const
Get zero extended value.
Definition APInt.h:1563
LLVM_ABI uint64_t extractBitsAsZExtValue(unsigned numBits, unsigned bitPosition) const
Definition APInt.cpp:521
LLVM_ABI APInt zextOrTrunc(unsigned width) const
Zero extend or truncate to width.
Definition APInt.cpp:1076
static APInt getMaxValue(unsigned numBits)
Gets maximum unsigned value of APInt for specific bit width.
Definition APInt.h:207
APInt abs() const
Get the absolute value.
Definition APInt.h:1818
LLVM_ABI APInt sadd_sat(const APInt &RHS) const
Definition APInt.cpp:2061
bool sgt(const APInt &RHS) const
Signed greater than comparison.
Definition APInt.h:1208
LLVM_ABI APInt usub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1983
bool ugt(const APInt &RHS) const
Unsigned greater than comparison.
Definition APInt.h:1189
bool isZero() const
Determine if this value is zero, i.e. all bits are clear.
Definition APInt.h:381
LLVM_ABI APInt urem(const APInt &RHS) const
Unsigned remainder operation.
Definition APInt.cpp:1692
unsigned getBitWidth() const
Return the number of bits in the APInt.
Definition APInt.h:1511
bool ult(const APInt &RHS) const
Unsigned less than comparison.
Definition APInt.h:1118
static APInt getSignedMaxValue(unsigned numBits)
Gets maximum signed value of APInt for a specific bit width.
Definition APInt.h:210
LLVM_ABI APInt sadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1963
LLVM_ABI APInt uadd_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1970
unsigned countr_zero() const
Count the number of trailing zero bits.
Definition APInt.h:1662
unsigned countl_zero() const
The APInt version of std::countl_zero.
Definition APInt.h:1621
static APInt getSignedMinValue(unsigned numBits)
Gets minimum signed value of APInt for a specific bit width.
Definition APInt.h:220
LLVM_ABI APInt sextOrTrunc(unsigned width) const
Sign extend or truncate to width.
Definition APInt.cpp:1084
LLVM_ABI APInt uadd_sat(const APInt &RHS) const
Definition APInt.cpp:2071
APInt ashr(unsigned ShiftAmt) const
Arithmetic right-shift function.
Definition APInt.h:834
LLVM_ABI APInt smul_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1995
LLVM_ABI APInt sext(unsigned width) const
Sign extend to a new width.
Definition APInt.cpp:1028
APInt shl(unsigned shiftAmt) const
Left-shift function.
Definition APInt.h:880
bool slt(const APInt &RHS) const
Signed less than comparison.
Definition APInt.h:1137
static APInt getZero(unsigned numBits)
Get the '0' value for the specified bit-width.
Definition APInt.h:201
LLVM_ABI APInt extractBits(unsigned numBits, unsigned bitPosition) const
Return an APInt with the extracted bits [bitPosition,bitPosition+numBits).
Definition APInt.cpp:483
LLVM_ABI APInt ssub_ov(const APInt &RHS, bool &Overflow) const
Definition APInt.cpp:1976
bool isOne() const
Determine if this is a value of 1.
Definition APInt.h:390
APInt lshr(unsigned shiftAmt) const
Logical right-shift function.
Definition APInt.h:858
LLVM_ABI APInt ssub_sat(const APInt &RHS) const
Definition APInt.cpp:2080
An arbitrary precision integer that knows its signedness.
Definition APSInt.h:24
This class represents an incoming formal argument to a Function.
Definition Argument.h:32
Represent a constant reference to an array (0 or more elements consecutively in memory),...
Definition ArrayRef.h:40
size_t size() const
Get the array size.
Definition ArrayRef.h:141
Base class for all callable instructions (InvokeInst and CallInst) Holds everything related to callin...
static LLVM_ABI Instruction::CastOps getCastOpcode(const Value *Val, bool SrcIsSigned, Type *Ty, bool DstIsSigned)
Returns the opcode necessary to cast Val into Ty using usual casting rules.
static LLVM_ABI unsigned isEliminableCastPair(Instruction::CastOps firstOpcode, Instruction::CastOps secondOpcode, Type *SrcTy, Type *MidTy, Type *DstTy, const DataLayout *DL)
Determine how a pair of casts can be eliminated, if they can be at all.
static LLVM_ABI bool castIsValid(Instruction::CastOps op, Type *SrcTy, Type *DstTy)
This method can be used to determine if a cast from SrcTy to DstTy using Opcode op is valid or not.
Predicate
This enumeration lists the possible predicates for CmpInst subclasses.
Definition InstrTypes.h:740
bool isSigned() const
Definition InstrTypes.h:993
Predicate getSwappedPredicate() const
For example, EQ->EQ, SLE->SGE, ULT->UGT, OEQ->OEQ, ULE->UGE, OLT->OGT, etc.
Definition InstrTypes.h:890
static bool isFPPredicate(Predicate P)
Definition InstrTypes.h:833
static Constant * get(LLVMContext &Context, ArrayRef< ElementTy > Elts)
get() constructor - Return a constant with array type with an element count and element type matching...
Definition Constants.h:872
static LLVM_ABI Constant * getIntToPtr(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getExtractElement(Constant *Vec, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI bool isDesirableCastOp(unsigned Opcode)
Whether creating a constant expression for this cast is desirable.
static LLVM_ABI Constant * getCast(unsigned ops, Constant *C, Type *Ty, bool OnlyIfReduced=false)
Convenience function for getting a Cast operation.
static LLVM_ABI Constant * getSub(Constant *C1, Constant *C2, bool HasNUW=false, bool HasNSW=false)
static Constant * getPtrAdd(Constant *Ptr, Constant *Offset, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReduced=nullptr)
Create a getelementptr i8, ptr, offset constant expression.
Definition Constants.h:1491
static LLVM_ABI Constant * getInsertElement(Constant *Vec, Constant *Elt, Constant *Idx, Type *OnlyIfReducedTy=nullptr)
static LLVM_ABI Constant * getShuffleVector(Constant *V1, Constant *V2, ArrayRef< int > Mask, Type *OnlyIfReducedTy=nullptr)
static bool isSupportedGetElementPtr(const Type *SrcElemTy)
Whether creating a constant expression for this getelementptr type is supported.
Definition Constants.h:1592
static LLVM_ABI Constant * get(unsigned Opcode, Constant *C1, Constant *C2, unsigned Flags=0, Type *OnlyIfReducedTy=nullptr)
get - Return a binary or shift operator constant expression, folding if possible.
static LLVM_ABI bool isDesirableBinOp(unsigned Opcode)
Whether creating a constant expression for this binary operator is desirable.
static Constant * getGetElementPtr(Type *Ty, Constant *C, ArrayRef< Constant * > IdxList, GEPNoWrapFlags NW=GEPNoWrapFlags::none(), std::optional< ConstantRange > InRange=std::nullopt, Type *OnlyIfReducedTy=nullptr)
Getelementptr form.
Definition Constants.h:1464
static LLVM_ABI Constant * getBitCast(Constant *C, Type *Ty, bool OnlyIfReduced=false)
static LLVM_ABI Constant * getTrunc(Constant *C, Type *Ty, bool OnlyIfReduced=false)
ConstantFP - Floating Point Values [float, double].
Definition Constants.h:420
const APFloat & getValueAPF() const
Definition Constants.h:463
static LLVM_ABI ConstantFP * getZero(Type *Ty, bool Negative=false)
static LLVM_ABI ConstantFP * getNaN(Type *Ty, bool Negative=false, uint64_t Payload=0)
static LLVM_ABI ConstantFP * getInfinity(Type *Ty, bool Negative=false)
This is the shared class of boolean and integer constants.
Definition Constants.h:87
static LLVM_ABI ConstantInt * getTrue(LLVMContext &Context)
static ConstantInt * getSigned(IntegerType *Ty, int64_t V, bool ImplicitTrunc=false)
Return a ConstantInt with the specified value for the specified type.
Definition Constants.h:135
static LLVM_ABI ConstantInt * getFalse(LLVMContext &Context)
int64_t getSExtValue() const
Return the constant as a 64-bit integer value after it has been sign extended as appropriate for the ...
Definition Constants.h:174
static LLVM_ABI ConstantInt * getBool(LLVMContext &Context, bool V)
static LLVM_ABI Constant * get(StructType *T, ArrayRef< Constant * > V)
static LLVM_ABI Constant * getSplat(ElementCount EC, Constant *Elt)
Return a ConstantVector with the specified constant in each element.
static LLVM_ABI Constant * get(ArrayRef< Constant * > V)
This is an important base class in LLVM.
Definition Constant.h:43
LLVM_ABI Constant * getSplatValue(bool AllowPoison=false) const
If all elements of the vector constant have the same value, return that value.
bool isNullValue() const
Return true if this is the value that would be returned by getNullValue.
Definition Constant.h:64
static LLVM_ABI Constant * getAllOnesValue(Type *Ty)
static LLVM_ABI Constant * getNullValue(Type *Ty)
Constructor to create a '0' constant of arbitrary type.
LLVM_ABI Constant * getAggregateElement(unsigned Elt) const
For aggregates (struct/array/vector) return the constant that corresponds to the specified element if...
Constrained floating point compare intrinsics.
This is the common base class for constrained floating point intrinsics.
LLVM_ABI std::optional< fp::ExceptionBehavior > getExceptionBehavior() const
LLVM_ABI std::optional< RoundingMode > getRoundingMode() const
Wrapper for a function that represents a value that functionally represents the original function.
Definition Constants.h:1137
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
iterator find(const_arg_type_t< KeyT > Val)
Definition DenseMap.h:225
iterator end()
Definition DenseMap.h:143
std::pair< iterator, bool > insert(const std::pair< KeyT, ValueT > &KV)
Definition DenseMap.h:286
static LLVM_ABI bool compare(const APFloat &LHS, const APFloat &RHS, FCmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
Class to represent fixed width SIMD vectors.
unsigned getNumElements() const
static LLVM_ABI FixedVectorType * get(Type *ElementType, unsigned NumElts)
Definition Type.cpp:869
DenormalMode getDenormalMode(const fltSemantics &FPType) const
Returns the denormal handling type for the default rounding mode of the function.
Definition Function.cpp:800
Represents flags for the getelementptr instruction/expression.
static GEPNoWrapFlags inBounds()
GEPNoWrapFlags withoutNoUnsignedSignedWrap() const
static GEPNoWrapFlags noUnsignedWrap()
bool hasNoUnsignedSignedWrap() const
bool isInBounds() const
static LLVM_ABI Type * getIndexedType(Type *Ty, ArrayRef< Value * > IdxList)
Returns the result type of a getelementptr with the given source element type and indexes.
PointerType * getType() const
Global values are always pointers.
LLVM_ABI const DataLayout & getDataLayout() const
Get the data layout of the module this global belongs to.
Definition Globals.cpp:141
const Constant * getInitializer() const
getInitializer - Return the initializer for this global variable.
bool isConstant() const
If the value is a global constant, its value is immutable throughout the runtime execution of the pro...
bool hasDefinitiveInitializer() const
hasDefinitiveInitializer - Whether the global variable has an initializer, and any other instances of...
static LLVM_ABI bool compare(const APInt &LHS, const APInt &RHS, ICmpInst::Predicate Pred)
Return result of LHS Pred RHS comparison.
Predicate getSignedPredicate() const
For example, EQ->EQ, SLE->SLE, UGT->SGT, etc.
bool isEquality() const
Return true if this predicate is either EQ or NE.
bool isCast() const
bool isBinaryOp() const
LLVM_ABI const Function * getFunction() const
Return the function this instruction belongs to.
bool isUnaryOp() const
static LLVM_ABI IntegerType * get(LLVMContext &C, unsigned NumBits)
This static method is the primary way of constructing an IntegerType.
Definition Type.cpp:350
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
static APInt getSaturationPoint(Intrinsic::ID ID, unsigned numBits)
Min/max intrinsics are monotonic, they operate on a fixed-bitwidth values, so there is a certain thre...
static ICmpInst::Predicate getPredicate(Intrinsic::ID ID)
Returns the comparison predicate underlying the intrinsic.
static LLVM_ABI PoisonValue * get(Type *T)
Static factory methods - Return an 'poison' object of the specified type.
Class to represent scalable SIMD vectors.
This is a 'bitvector' (really, a variable-sized bit array), optimized for the case when the array is ...
SmallBitVector & set()
iterator_range< const_set_bits_iterator > set_bits() const
void push_back(const T &Elt)
pointer data()
Return a pointer to the vector's buffer, even if empty().
This is a 'vector' (really, a variable-sized array), optimized for the case when the array is small.
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
Used to lazily calculate structure layout information for a target machine, based on the DataLayout s...
Definition DataLayout.h:743
LLVM_ABI unsigned getElementContainingOffset(uint64_t FixedOffset) const
Given a valid byte offset into the structure, returns the structure index that contains it.
TypeSize getElementOffset(unsigned Idx) const
Definition DataLayout.h:774
Class to represent struct types.
unsigned getNumElements() const
Random access to the elements.
Provides information about what library functions are available for the current target.
bool has(LibFunc F) const
Tests whether a library function is available.
bool getLibFunc(StringRef funcName, LibFunc &F) const
Searches for a particular function name.
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI IntegerType * getInt64Ty(LLVMContext &C)
Definition Type.cpp:310
bool isByteTy() const
True if this is an instance of ByteType.
Definition Type.h:242
bool isVectorTy() const
True if this is an instance of VectorType.
Definition Type.h:288
static LLVM_ABI IntegerType * getInt32Ty(LLVMContext &C)
Definition Type.cpp:309
bool isPointerTy() const
True if this is an instance of PointerType.
Definition Type.h:282
LLVM_ABI unsigned getPointerAddressSpace() const
Get the address space of this pointer or pointer vector type.
@ HalfTyID
16-bit floating point type
Definition Type.h:57
@ FloatTyID
32-bit floating point type
Definition Type.h:59
@ DoubleTyID
64-bit floating point type
Definition Type.h:60
Type * getScalarType() const
If this is a vector type, return the element type, otherwise return 'this'.
Definition Type.h:368
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:197
bool isByteOrByteVectorTy() const
Return true if this is a byte type or a vector of byte types.
Definition Type.h:248
static LLVM_ABI IntegerType * getInt16Ty(LLVMContext &C)
Definition Type.cpp:308
bool isSized(SmallPtrSetImpl< Type * > *Visited=nullptr) const
Return true if it makes sense to take the size of this type.
Definition Type.h:326
LLVMContext & getContext() const
Return the LLVMContext in which this type was uniqued.
Definition Type.h:130
LLVM_ABI unsigned getScalarSizeInBits() const LLVM_READONLY
If this is a vector type, return the getPrimitiveSizeInBits value for the element type.
Definition Type.cpp:232
static LLVM_ABI IntegerType * getInt1Ty(LLVMContext &C)
Definition Type.cpp:306
bool isFloatingPointTy() const
Return true if this is one of the floating-point types.
Definition Type.h:186
bool isPtrOrPtrVectorTy() const
Return true if this is a pointer type or a vector of pointer types.
Definition Type.h:285
bool isX86_AMXTy() const
Return true if this is X86 AMX.
Definition Type.h:202
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257
static LLVM_ABI IntegerType * getIntNTy(LLVMContext &C, unsigned N)
Definition Type.cpp:313
Type * getContainedType(unsigned i) const
This method is used to implement the type iterator (defined at the end of the file).
Definition Type.h:397
LLVM_ABI const fltSemantics & getFltSemantics() const
Definition Type.cpp:106
static LLVM_ABI UndefValue * get(Type *T)
Static factory methods - Return an 'undef' object of the specified type.
A Use represents the edge between a Value definition and its users.
Definition Use.h:35
LLVM Value Representation.
Definition Value.h:75
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
LLVMContext & getContext() const
All values hold a context through their type.
Definition Value.h:258
LLVM_ABI const Value * stripAndAccumulateConstantOffsets(const DataLayout &DL, APInt &Offset, bool AllowNonInbounds, bool AllowInvariantGroup=false, function_ref< bool(Value &Value, APInt &Offset)> ExternalAnalysis=nullptr, bool LookThroughIntToPtr=false) const
Accumulate the constant offset this value has compared to a base pointer.
LLVM_ABI uint64_t getPointerDereferenceableBytes(const DataLayout &DL, bool &CanBeNull, bool *CanBeFreed) const
Returns the number of bytes known to be dereferenceable for the pointer value.
Definition Value.cpp:909
Base class of all SIMD vector types.
ElementCount getElementCount() const
Return an ElementCount instance to represent the (possibly scalable) number of elements in the vector...
Type * getElementType() const
constexpr ScalarTy getFixedValue() const
Definition TypeSize.h:200
constexpr bool isScalable() const
Returns whether the quantity is scaled by a runtime quantity (vscale).
Definition TypeSize.h:168
constexpr bool isFixed() const
Returns true if the quantity is not scaled by vscale.
Definition TypeSize.h:171
constexpr LeafTy divideCoefficientBy(ScalarTy RHS) const
We do not provide the '/' operator here because division for polynomial types does not work in the sa...
Definition TypeSize.h:252
static constexpr bool isKnownGE(const FixedOrScalableQuantity &LHS, const FixedOrScalableQuantity &RHS)
Definition TypeSize.h:237
const ParentTy * getParent() const
Definition ilist_node.h:34
CallInst * Call
#define llvm_unreachable(msg)
Marks that the current location is not supposed to be reachable.
LLVM_ABI APInt compressBits(const APInt &Val, const APInt &Mask)
Perform a "compress" operation, also known as pext or bext.
Definition APInt.cpp:3242
const APInt & smin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be signed.
Definition APInt.h:2277
const APInt & smax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be signed.
Definition APInt.h:2282
LLVM_ABI APInt clmul(const APInt &LHS, const APInt &RHS)
Perform a carry-less multiply, also known as XOR multiplication, and return low-bits.
Definition APInt.cpp:3222
const APInt & umin(const APInt &A, const APInt &B)
Determine the smaller of two APInts considered to be unsigned.
Definition APInt.h:2287
LLVM_ABI APInt expandBits(const APInt &Val, const APInt &Mask)
Perform an "expand" operation, also known as pdep or bdep.
Definition APInt.cpp:3252
const APInt & umax(const APInt &A, const APInt &B)
Determine the larger of two APInts considered to be unsigned.
Definition APInt.h:2292
constexpr std::underlying_type_t< E > Mask()
Get a bitmask with 1s in all places up to the high-order bit of E's largest value.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ CE
Windows NT (Windows on ARM)
Definition MCAsmInfo.h:50
initializer< Ty > init(const Ty &Val)
static constexpr roundingMode rmNearestTiesToEven
Definition APFloat.h:432
static constexpr cmpResult cmpEqual
Definition APFloat.h:440
@ ebStrict
This corresponds to "fpexcept.strict".
Definition FPEnv.h:42
@ ebIgnore
This corresponds to "fpexcept.ignore".
Definition FPEnv.h:40
constexpr double pi
APFloat::roundingMode GetFMARoundingMode(Intrinsic::ID IntrinsicID)
DenormalMode GetNVVMDenormMode(bool ShouldFTZ)
bool FPToIntegerIntrinsicNaNZero(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFDivRoundingMode(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicResultIsSigned(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFPToIntegerRoundingMode(Intrinsic::ID IntrinsicID)
bool RCPShouldFTZ(Intrinsic::ID IntrinsicID)
bool FPToIntegerIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FDivShouldFTZ(Intrinsic::ID IntrinsicID)
bool FAddShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxIsXorSignAbs(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFMulRoundingMode(Intrinsic::ID IntrinsicID)
bool UnaryMathIntrinsicShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMinFMaxShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetFAddRoundingMode(Intrinsic::ID IntrinsicID)
bool FMAShouldFTZ(Intrinsic::ID IntrinsicID)
bool FMulShouldFTZ(Intrinsic::ID IntrinsicID)
APFloat::roundingMode GetRCPRoundingMode(Intrinsic::ID IntrinsicID)
bool FMinFMaxPropagatesNaNs(Intrinsic::ID IntrinsicID)
NodeAddr< FuncNode * > Func
Definition RDFGraph.h:393
LLVM_ABI std::error_code status(const Twine &path, file_status &result, bool follow=true)
Get file status as if by POSIX stat().
This is an optimization pass for GlobalISel generic memory operations.
auto drop_begin(T &&RangeOrContainer, size_t N=1)
Return a range covering RangeOrContainer with the first N elements excluded.
Definition STLExtras.h:315
@ Offset
Definition DWP.cpp:558
bool all_of(R &&range, UnaryPredicate P)
Provide wrappers to std::all_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1738
LLVM_ABI Constant * ConstantFoldLoadThroughBitcast(Constant *C, Type *DestTy, const DataLayout &DL)
ConstantFoldLoadThroughBitcast - try to cast constant to destination type returning null if unsuccess...
static double log2(double V)
LLVM_ABI Constant * ConstantFoldSelectInstruction(Constant *Cond, Constant *V1, Constant *V2)
Attempt to constant fold a select instruction with the specified operands.
LLVM_ABI Constant * ConstantFoldFPInstOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL, const Instruction *I, bool AllowNonDeterministic=true)
Attempt to constant fold a floating point binary operation with the specified operands,...
auto enumerate(FirstRange &&First, RestRanges &&...Rest)
Given two or more input ranges, returns a new range whose values are tuples (A, B,...
Definition STLExtras.h:2553
LLVM_ABI bool canConstantFoldCallTo(const CallBase *Call, const Function *F)
canConstantFoldCallTo - Return true if its even possible to fold a call to the specified function.
unsigned getPointerAddressSpace(const Type *T)
Definition SPIRVUtils.h:389
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
LLVM_ABI Constant * ConstantFoldInstruction(const Instruction *I, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldInstruction - Try to constant fold the specified instruction.
APFloat abs(APFloat X)
Returns the absolute value of the argument.
Definition APFloat.h:1666
LLVM_ABI Constant * ConstantFoldUnaryIntrinsic(Intrinsic::ID ID, Constant *Op, Type *Ty)
LLVM_ABI Constant * ConstantFoldCompareInstruction(CmpInst::Predicate Predicate, Constant *C1, Constant *C2)
LLVM_ABI Constant * ConstantFoldUnaryInstruction(unsigned Opcode, Constant *V)
LLVM_ABI bool IsConstantOffsetFromGlobal(Constant *C, GlobalValue *&GV, APInt &Offset, const DataLayout &DL, DSOLocalEquivalent **DSOEquiv=nullptr)
If this constant is a constant offset from a global, return the global and the constant.
LLVM_ABI bool isMathLibCallNoop(const CallBase *Call, const TargetLibraryInfo *TLI)
Check whether the given call has no side-effects.
LLVM_ABI Constant * ReadByteArrayFromGlobal(const GlobalVariable *GV, uint64_t Offset)
auto dyn_cast_if_present(const Y &Val)
dyn_cast_if_present<X> - Functionally identical to dyn_cast, except that a null (or none in the case ...
Definition Casting.h:732
LLVM_READONLY APFloat maximum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximum semantics.
Definition APFloat.h:1746
LLVM_ABI Constant * ConstantFoldCompareInstOperands(unsigned Predicate, Constant *LHS, Constant *RHS, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, const Instruction *I=nullptr)
Attempt to constant fold a compare instruction (icmp/fcmp) with the specified operands.
int ilogb(const APFloat &Arg)
Returns the exponent of the internal representation of the APFloat.
Definition APFloat.h:1637
bool isa_and_nonnull(const Y &Val)
Definition Casting.h:676
LLVM_ABI Constant * ConstantFoldCall(const CallBase *Call, Function *F, ArrayRef< Constant * > Operands, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldCall - Attempt to constant fold a call to the specified function with the specified argum...
APFloat frexp(const APFloat &X, int &Exp, APFloat::roundingMode RM)
Equivalent of C standard library function.
Definition APFloat.h:1658
LLVM_ABI Constant * ConstantFoldExtractValueInstruction(Constant *Agg, ArrayRef< unsigned > Idxs)
Attempt to constant fold an extractvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldConstant(const Constant *C, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr)
ConstantFoldConstant - Fold the constant using the specified DataLayout.
auto dyn_cast_or_null(const Y &Val)
Definition Casting.h:753
bool any_of(R &&range, UnaryPredicate P)
Provide wrappers to std::any_of which take ranges instead of having to pass begin/end explicitly.
Definition STLExtras.h:1745
LLVM_READONLY APFloat maxnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 maxNum semantics.
Definition APFloat.h:1701
LLVM_ABI Constant * ConstantFoldLoadFromUniformValue(Constant *C, Type *Ty, const DataLayout &DL)
If C is a uniform value where all bits are the same (either all zero, all ones, all undef or all pois...
LLVM_ABI Constant * ConstantFoldUnaryOpOperand(unsigned Opcode, Constant *Op, const DataLayout &DL)
Attempt to constant fold a unary operation with the specified operand.
LLVM_ABI Constant * FlushFPConstant(Constant *Operand, const Instruction *I, bool IsOutput)
Attempt to flush float point constant according to denormal mode set in the instruction's parent func...
LLVM_ABI Constant * getLosslessUnsignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
LLVM_READONLY LLVM_ABI std::optional< APFloat > exp(const APFloat &X, RoundingMode RM=APFloat::rmNearestTiesToEven, APFloat::opStatus *Status=nullptr)
Implement IEEE 754-2019 exp functions.
Definition APFloat.cpp:6106
decltype(auto) get(const PointerIntPair< PointerTy, IntBits, IntType, PtrTraits, Info > &Pair)
LLVM_READONLY APFloat minimumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimumNumber semantics.
Definition APFloat.h:1732
FPClassTest
Floating-point class tests, supported by 'is_fpclass' intrinsic.
APFloat scalbn(APFloat X, int Exp, APFloat::roundingMode RM)
Returns: X * 2^Exp for integral exponents.
Definition APFloat.h:1646
LLVM_ABI void computeKnownBits(const Value *V, KnownBits &Known, const DataLayout &DL, AssumptionCache *AC=nullptr, const Instruction *CxtI=nullptr, const DominatorTree *DT=nullptr, bool UseInstrInfo=true, unsigned Depth=0)
Determine which bits of V are known to be either zero or one and return them in the KnownZero/KnownOn...
LLVM_ABI bool NullPointerIsDefined(const Function *F, unsigned AS=0)
Check whether null pointer dereferencing is considered undefined behavior for a given function or an ...
LLVM_ABI Constant * getLosslessSignedTrunc(Constant *C, Type *DestTy, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
LLVM_ABI Constant * ConstantFoldBinaryIntrinsic(Intrinsic::ID ID, Constant *LHS, Constant *RHS, Type *Ty)
LLVM_ABI Constant * ConstantFoldCastOperand(unsigned Opcode, Constant *C, Type *DestTy, const DataLayout &DL)
Attempt to constant fold a cast with the specified operand.
LLVM_ABI Constant * ConstantFoldLoadFromConst(Constant *C, Type *Ty, const APInt &Offset, const DataLayout &DL)
Extract value of C at the given Offset reinterpreted as Ty.
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
LLVM_ABI bool intrinsicPropagatesPoison(Intrinsic::ID IID)
Return whether this intrinsic propagates poison for all operands.
LLVM_ABI Constant * ConstantFoldBinaryOpOperands(unsigned Opcode, Constant *LHS, Constant *RHS, const DataLayout &DL)
Attempt to constant fold a binary operation with the specified operands.
MutableArrayRef(T &OneElt) -> MutableArrayRef< T >
LLVM_READONLY APFloat minnum(const APFloat &A, const APFloat &B)
Implements IEEE-754 2008 minNum semantics.
Definition APFloat.h:1682
@ Sub
Subtraction of integers.
LLVM_ABI bool isVectorIntrinsicWithScalarOpAtArg(Intrinsic::ID ID, unsigned ScalarOpdIdx, const TargetTransformInfo *TTI)
Identifies if the vector form of the intrinsic has a scalar operand.
FunctionAddr VTableAddr Next
Definition InstrProf.h:141
DWARFExpression::Operation Op
RoundingMode
Rounding mode.
@ NearestTiesToEven
roundTiesToEven.
@ Dynamic
Denotes mode unknown at compile time.
LLVM_ABI bool isGuaranteedNotToBeUndefOrPoison(const Value *V, AssumptionCache *AC=nullptr, const Instruction *CtxI=nullptr, const DominatorTree *DT=nullptr, unsigned Depth=0)
Return true if this function can prove that V does not have undef bits and is never poison.
constexpr unsigned BitWidth
LLVM_ABI Constant * getLosslessInvCast(Constant *C, Type *InvCastTo, unsigned CastOp, const DataLayout &DL, PreservedCastFlags *Flags=nullptr)
Try to cast C to InvC losslessly, satisfying CastOp(InvC) equals C, or CastOp(InvC) is a refined valu...
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
bool all_equal(std::initializer_list< T > Values)
Returns true if all Values in the initializer lists are equal or the list.
Definition STLExtras.h:2165
LLVM_ABI Constant * ConstantFoldCastInstruction(unsigned opcode, Constant *V, Type *DestTy)
LLVM_ABI Constant * ConstantFoldInsertValueInstruction(Constant *Agg, Constant *Val, ArrayRef< unsigned > Idxs)
Attempt to constant fold an insertvalue instruction with the specified operands and indices.
LLVM_ABI Constant * ConstantFoldLoadFromConstPtr(Constant *C, Type *Ty, APInt Offset, const DataLayout &DL)
Return the value that a load from C with offset Offset would produce if it is constant and determinab...
LLVM_ABI Constant * ConstantFoldInstOperands(const Instruction *I, ArrayRef< Constant * > Ops, const DataLayout &DL, const TargetLibraryInfo *TLI=nullptr, bool AllowNonDeterministic=true)
ConstantFoldInstOperands - Attempt to constant fold an instruction with the specified operands.
LLVM_READONLY APFloat minimum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 minimum semantics.
Definition APFloat.h:1719
LLVM_READONLY APFloat maximumnum(const APFloat &A, const APFloat &B)
Implements IEEE 754-2019 maximumNumber semantics.
Definition APFloat.h:1759
LLVM_ABI const Value * getUnderlyingObject(const Value *V, unsigned MaxLookup=MaxLookupSearchDepth)
This method strips off any GEP address adjustments, pointer casts or llvm.threadlocal....
LLVM_ABI Constant * ConstantFoldIntegerCast(Constant *C, Type *DestTy, bool IsSigned, const DataLayout &DL)
Constant fold a zext, sext or trunc, depending on IsSigned and whether the DestTy is wider or narrowe...
LLVM_ABI bool isTriviallyVectorizable(Intrinsic::ID ID)
Identify if the intrinsic is trivially vectorizable.
constexpr detail::IsaCheckPredicate< Types... > IsaPred
Function object wrapper for the llvm::isa type check.
Definition Casting.h:866
LLVM_ABI Constant * ConstantFoldBinaryInstruction(unsigned Opcode, Constant *V1, Constant *V2)
Represent subnormal handling kind for floating point instruction inputs and outputs.
DenormalModeKind Input
Denormal treatment kind for floating point instruction inputs in the default floating-point environme...
DenormalModeKind
Represent handled modes for denormal (aka subnormal) modes in the floating point environment.
@ PreserveSign
The sign of a flushed-to-zero number is preserved in the sign of 0.
@ PositiveZero
Denormals are flushed to positive zero.
@ Dynamic
Denormals have unknown treatment.
@ IEEE
IEEE-754 denormal numbers preserved.
DenormalModeKind Output
Denormal flushing mode for floating point instruction results in the default floating point environme...
static constexpr DenormalMode getDynamic()
static constexpr DenormalMode getIEEE()
bool isConstant() const
Returns true if we know the value of all bits.
Definition KnownBits.h:54
const APInt & getConstant() const
Returns the value when all bits have a known value.
Definition KnownBits.h:58