LLVM 23.0.0git
BPFISelLowering.cpp
Go to the documentation of this file.
1//===-- BPFISelLowering.cpp - BPF DAG Lowering Implementation ------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file defines the interfaces that BPF uses to lower LLVM code into a
10// selection DAG.
11//
12//===----------------------------------------------------------------------===//
13
14#include "BPFISelLowering.h"
15#include "BPF.h"
16#include "BPFSubtarget.h"
25#include "llvm/IR/DIBuilder.h"
28#include "llvm/IR/Module.h"
29#include "llvm/Support/Debug.h"
33
34using namespace llvm;
35
36#define DEBUG_TYPE "bpf-lower"
37
38static cl::opt<bool> BPFExpandMemcpyInOrder("bpf-expand-memcpy-in-order",
39 cl::Hidden, cl::init(false),
40 cl::desc("Expand memcpy into load/store pairs in order"));
41
43 "bpf-min-jump-table-entries", cl::init(13), cl::Hidden,
44 cl::desc("Set minimum number of entries to use a jump table on BPF"));
45
47 "bpf-allows-libcalls", cl::Hidden, cl::init(false),
48 cl::desc("Allow libcalls instead of rejecting unsupported built-in "
49 "functions"));
50
51static void fail(const SDLoc &DL, SelectionDAG &DAG, const Twine &Msg,
52 SDValue Val = {}) {
53 std::string Str;
54 if (Val) {
55 raw_string_ostream OS(Str);
56 Val->print(OS);
57 OS << ' ';
58 }
61 MF.getFunction(), Twine(Str).concat(Msg), DL.getDebugLoc()));
62}
63
65 const BPFSubtarget &STI)
66 : TargetLowering(TM, STI) {
67
68 // Set up the register classes.
69 addRegisterClass(MVT::i64, &BPF::GPRRegClass);
70 if (STI.getHasAlu32())
71 addRegisterClass(MVT::i32, &BPF::GPR32RegClass);
72
73 // Compute derived properties from the register classes
75
77
81
82 if (!STI.hasGotox())
84
86
88 if (STI.hasGotox())
90
94
95 // Set unsupported atomic operations as Custom so
96 // we can emit better error messages than fatal error
97 // from selectiondag.
98 for (auto VT : {MVT::i8, MVT::i16, MVT::i32}) {
99 if (VT == MVT::i32) {
100 if (STI.getHasAlu32())
101 continue;
102 } else {
104 }
105
111 }
112
113 for (auto VT : {MVT::i32, MVT::i64}) {
116 }
117
119
120 for (auto VT : { MVT::i32, MVT::i64 }) {
121 if (VT == MVT::i32 && !STI.getHasAlu32())
122 continue;
123
126 if (!STI.hasSdivSmod()) {
129 }
144
148 }
149
150 if (STI.getHasAlu32()) {
153 STI.getHasJmp32() ? Custom : Promote);
154 }
155
157 if (!STI.hasMovsx()) {
161 }
162
163 // Extended load operations for i1 types must be promoted
164 for (MVT VT : MVT::integer_valuetypes()) {
168
169 if (!STI.hasLdsx()) {
171 setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i16, Expand);
172 setLoadExtAction(ISD::SEXTLOAD, VT, MVT::i32, Expand);
173 }
174 }
175
179
180 // Function alignments
183
185 // LLVM generic code will try to expand memcpy into load/store pairs at this
186 // stage which is before quite a few IR optimization passes, therefore the
187 // loads and stores could potentially be moved apart from each other which
188 // will cause trouble to memcpy pattern matcher inside kernel eBPF JIT
189 // compilers.
190 //
191 // When -bpf-expand-memcpy-in-order specified, we want to defer the expand
192 // of memcpy to later stage in IR optimization pipeline so those load/store
193 // pairs won't be touched and could be kept in order. Hence, we set
194 // MaxStoresPerMem* to zero to disable the generic getMemcpyLoadsAndStores
195 // code path, and ask LLVM to use target expander EmitTargetCodeForMemcpy.
200 } else {
201 // inline memcpy() for kernel to see explicit copy
202 unsigned CommonMaxStores =
204
209 }
210
211 // CPU/Feature control
212 HasAlu32 = STI.getHasAlu32();
213 HasJmp32 = STI.getHasJmp32();
214 HasJmpExt = STI.getHasJmpExt();
215 HasMovsx = STI.hasMovsx();
216
217 AllowsMisalignedMemAccess = STI.getAllowsMisalignedMemAccess();
218}
219
222 unsigned *Fast) const {
223 // allows-misaligned-mem-access is disabled
224 if (!AllowsMisalignedMemAccess)
225 return false;
226
227 // only allow misalignment for simple value types
228 if (!VT.isSimple())
229 return false;
230
231 // always assume fast mode when misalignment is allowed
232 if (Fast)
233 *Fast = true;
234
235 return true;
236}
237
239 return false;
240}
241
242bool BPFTargetLowering::isTruncateFree(Type *Ty1, Type *Ty2) const {
243 if (!Ty1->isIntegerTy() || !Ty2->isIntegerTy())
244 return false;
245 unsigned NumBits1 = Ty1->getPrimitiveSizeInBits();
246 unsigned NumBits2 = Ty2->getPrimitiveSizeInBits();
247 return NumBits1 > NumBits2;
248}
249
250bool BPFTargetLowering::isTruncateFree(EVT VT1, EVT VT2) const {
251 if (!VT1.isInteger() || !VT2.isInteger())
252 return false;
253 unsigned NumBits1 = VT1.getSizeInBits();
254 unsigned NumBits2 = VT2.getSizeInBits();
255 return NumBits1 > NumBits2;
256}
257
258bool BPFTargetLowering::isZExtFree(Type *Ty1, Type *Ty2) const {
259 if (!getHasAlu32() || !Ty1->isIntegerTy() || !Ty2->isIntegerTy())
260 return false;
261 unsigned NumBits1 = Ty1->getPrimitiveSizeInBits();
262 unsigned NumBits2 = Ty2->getPrimitiveSizeInBits();
263 return NumBits1 == 32 && NumBits2 == 64;
264}
265
266bool BPFTargetLowering::isZExtFree(EVT VT1, EVT VT2) const {
267 if (!getHasAlu32() || !VT1.isInteger() || !VT2.isInteger())
268 return false;
269 unsigned NumBits1 = VT1.getSizeInBits();
270 unsigned NumBits2 = VT2.getSizeInBits();
271 return NumBits1 == 32 && NumBits2 == 64;
272}
273
274bool BPFTargetLowering::isZExtFree(SDValue Val, EVT VT2) const {
275 EVT VT1 = Val.getValueType();
276 if (Val.getOpcode() == ISD::LOAD && VT1.isSimple() && VT2.isSimple()) {
277 MVT MT1 = VT1.getSimpleVT().SimpleTy;
278 MVT MT2 = VT2.getSimpleVT().SimpleTy;
279 if ((MT1 == MVT::i8 || MT1 == MVT::i16 || MT1 == MVT::i32) &&
280 (MT2 == MVT::i32 || MT2 == MVT::i64))
281 return true;
282 }
283 return TargetLoweringBase::isZExtFree(Val, VT2);
284}
285
289
292 if (Constraint.size() == 1) {
293 switch (Constraint[0]) {
294 default:
295 break;
296 case 'w':
297 return C_RegisterClass;
298 }
299 }
300
301 return TargetLowering::getConstraintType(Constraint);
302}
303
304std::pair<unsigned, const TargetRegisterClass *>
306 StringRef Constraint,
307 MVT VT) const {
308 if (Constraint.size() == 1) {
309 // GCC Constraint Letters
310 switch (Constraint[0]) {
311 case 'r': // GENERAL_REGS
312 return std::make_pair(0U, &BPF::GPRRegClass);
313 case 'w':
314 if (HasAlu32)
315 return std::make_pair(0U, &BPF::GPR32RegClass);
316 break;
317 default:
318 break;
319 }
320 }
321
323}
324
325void BPFTargetLowering::ReplaceNodeResults(
327 const char *Msg;
328 uint32_t Opcode = N->getOpcode();
329 switch (Opcode) {
330 default:
331 report_fatal_error("unhandled custom legalization: " + Twine(Opcode));
336 case ISD::ATOMIC_SWAP:
338 if (HasAlu32 || Opcode == ISD::ATOMIC_LOAD_ADD)
339 Msg = "unsupported atomic operation, please use 32/64 bit version";
340 else
341 Msg = "unsupported atomic operation, please use 64 bit version";
342 break;
343 case ISD::ATOMIC_LOAD:
345 return;
346 }
347
348 SDLoc DL(N);
349 // We'll still produce a fatal error downstream, but this diagnostic is more
350 // user-friendly.
351 fail(DL, DAG, Msg);
352}
353
355 switch (Op.getOpcode()) {
356 default:
357 report_fatal_error("unimplemented opcode: " + Twine(Op.getOpcode()));
358 case ISD::BR_CC:
359 return LowerBR_CC(Op, DAG);
360 case ISD::JumpTable:
361 return LowerJumpTable(Op, DAG);
363 return LowerGlobalAddress(Op, DAG);
365 return LowerConstantPool(Op, DAG);
367 return LowerBlockAddress(Op, DAG);
368 case ISD::SELECT_CC:
369 return LowerSELECT_CC(Op, DAG);
370 case ISD::SDIV:
371 case ISD::SREM:
372 return LowerSDIVSREM(Op, DAG);
373 case ISD::SHL_PARTS:
374 case ISD::SRL_PARTS:
375 case ISD::SRA_PARTS:
376 return LowerShiftParts(Op, DAG);
378 return LowerDYNAMIC_STACKALLOC(Op, DAG);
379 case ISD::ATOMIC_LOAD:
381 return LowerATOMIC_LOAD_STORE(Op, DAG);
383 return LowerATOMIC_FENCE(Op, DAG);
384 case ISD::TRAP:
385 return LowerTRAP(Op, DAG);
386 }
387}
388
389// Calling Convention Implementation
390#include "BPFGenCallingConv.inc"
391
392// Apply AssertSext/AssertZext and truncate based on VA's LocInfo.
394 const CCValAssign &VA, EVT RegVT,
395 SDValue ArgValue) {
396 if (VA.getLocInfo() == CCValAssign::SExt)
397 ArgValue = DAG.getNode(ISD::AssertSext, DL, RegVT, ArgValue,
398 DAG.getValueType(VA.getValVT()));
399 else if (VA.getLocInfo() == CCValAssign::ZExt)
400 ArgValue = DAG.getNode(ISD::AssertZext, DL, RegVT, ArgValue,
401 DAG.getValueType(VA.getValVT()));
402 if (VA.getLocInfo() != CCValAssign::Full)
403 ArgValue = DAG.getNode(ISD::TRUNCATE, DL, VA.getValVT(), ArgValue);
404 return ArgValue;
405}
406
407SDValue BPFTargetLowering::LowerFormalArguments(
408 SDValue Chain, CallingConv::ID CallConv, bool IsVarArg,
409 const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
410 SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {
411 switch (CallConv) {
412 default:
413 report_fatal_error("unimplemented calling convention: " + Twine(CallConv));
414 case CallingConv::C:
416 break;
417 }
418
419 MachineFunction &MF = DAG.getMachineFunction();
420 MachineRegisterInfo &RegInfo = MF.getRegInfo();
421
422 // Assign locations to all of the incoming arguments.
424 CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());
425 CCInfo.AnalyzeFormalArguments(Ins, getHasAlu32() ? CC_BPF32 : CC_BPF64);
426
427 for (size_t I = 0; I < ArgLocs.size(); ++I) {
428 auto &VA = ArgLocs[I];
429 EVT RegVT = VA.getLocVT();
430
431 if (VA.isRegLoc()) {
432 // Arguments passed in registers
433 MVT::SimpleValueType SimpleTy = RegVT.getSimpleVT().SimpleTy;
434 switch (SimpleTy) {
435 default: {
436 std::string Str;
437 {
438 raw_string_ostream OS(Str);
439 RegVT.print(OS);
440 }
441 report_fatal_error("unhandled argument type: " + Twine(Str));
442 }
443 case MVT::i32:
444 case MVT::i64:
445 Register VReg = RegInfo.createVirtualRegister(
446 SimpleTy == MVT::i64 ? &BPF::GPRRegClass : &BPF::GPR32RegClass);
447 RegInfo.addLiveIn(VA.getLocReg(), VReg);
448 SDValue ArgValue = DAG.getCopyFromReg(Chain, DL, VReg, RegVT);
449 InVals.push_back(convertLocValType(DAG, DL, VA, RegVT, ArgValue));
450 break;
451 }
452 continue;
453 }
454
455 if (VA.isMemLoc()) {
456 // For example, two stack arguments,
457 // arg1: Off = 8
458 // arg2: off = 16
459 int Off = VA.getLocMemOffset() + 8;
460 if (Off > INT16_MAX) {
461 fail(DL, DAG, "extra parameter stack depth exceeded limit");
462 break;
463 }
464
465 // Physical extra argument slot is always 64-bit.
466 SDValue StackVal = DAG.getNode(BPFISD::LOAD_STACK_ARG, DL,
467 DAG.getVTList(MVT::i64, MVT::Other), Chain,
468 DAG.getConstant(Off, DL, MVT::i64));
469 SDValue ArgValue = StackVal.getValue(0);
470 Chain = StackVal.getValue(1);
471 InVals.push_back(convertLocValType(DAG, DL, VA, MVT::i64, ArgValue));
472 continue;
473 }
474 }
475
476 if (IsVarArg)
477 fail(DL, DAG, "variadic functions are not supported");
478 return Chain;
479}
480
481static void resetRegMaskBit(const TargetRegisterInfo *TRI, uint32_t *RegMask,
482 MCRegister Reg) {
483 for (MCPhysReg SubReg : TRI->subregs_inclusive(Reg))
484 RegMask[SubReg / 32] &= ~(1u << (SubReg % 32));
485}
486
488 MachineFunction &MF,
489 const uint32_t *BaseRegMask) {
490 uint32_t *RegMask = MF.allocateRegMask();
491 unsigned RegMaskSize = MachineOperand::getRegMaskSize(TRI->getNumRegs());
492 memcpy(RegMask, BaseRegMask, sizeof(RegMask[0]) * RegMaskSize);
493 return RegMask;
494}
495
496SDValue BPFTargetLowering::LowerCall(TargetLowering::CallLoweringInfo &CLI,
497 SmallVectorImpl<SDValue> &InVals) const {
498 SelectionDAG &DAG = CLI.DAG;
499 auto &Outs = CLI.Outs;
500 auto &OutVals = CLI.OutVals;
501 auto &Ins = CLI.Ins;
502 SDValue Chain = CLI.Chain;
503 SDValue Callee = CLI.Callee;
504 bool &IsTailCall = CLI.IsTailCall;
505 CallingConv::ID CallConv = CLI.CallConv;
506 bool IsVarArg = CLI.IsVarArg;
507 MachineFunction &MF = DAG.getMachineFunction();
508
509 // BPF target does not support tail call optimization.
510 IsTailCall = false;
511
512 switch (CallConv) {
513 default:
514 report_fatal_error("unsupported calling convention: " + Twine(CallConv));
516 case CallingConv::C:
517 break;
518 }
519
520 // Analyze operands of the call, assigning locations to each operand.
522 CCState CCInfo(CallConv, IsVarArg, MF, ArgLocs, *DAG.getContext());
523
524 CCInfo.AnalyzeCallOperands(Outs, getHasAlu32() ? CC_BPF32 : CC_BPF64);
525
526 unsigned NumBytes = CCInfo.getStackSize();
527
528 for (auto &Arg : Outs) {
529 ISD::ArgFlagsTy Flags = Arg.Flags;
530 if (!Flags.isByVal())
531 continue;
532 fail(CLI.DL, DAG, "pass by value not supported", Callee);
533 break;
534 }
535
536 auto PtrVT = getPointerTy(MF.getDataLayout());
537 Chain = DAG.getCALLSEQ_START(Chain, NumBytes, 0, CLI.DL);
538
540
541 // Walk arg assignments
542 for (size_t i = 0; i < OutVals.size(); ++i) {
543 CCValAssign &VA = ArgLocs[i];
544 SDValue &Arg = OutVals[i];
545
546 // Promote the value if needed.
547 switch (VA.getLocInfo()) {
548 default:
549 report_fatal_error("unhandled location info: " + Twine(VA.getLocInfo()));
551 break;
553 Arg = DAG.getNode(ISD::SIGN_EXTEND, CLI.DL, VA.getLocVT(), Arg);
554 break;
556 Arg = DAG.getNode(ISD::ZERO_EXTEND, CLI.DL, VA.getLocVT(), Arg);
557 break;
559 Arg = DAG.getNode(ISD::ANY_EXTEND, CLI.DL, VA.getLocVT(), Arg);
560 break;
561 }
562
563 // Push arguments into RegsToPass vector
564 if (VA.isRegLoc()) {
565 RegsToPass.push_back(std::make_pair(VA.getLocReg(), Arg));
566 continue;
567 }
568
569 if (VA.isMemLoc()) {
570 int Off = -8 - VA.getLocMemOffset();
571 if (Off < INT16_MIN) {
572 fail(CLI.DL, DAG, "extra parameter stack depth exceeded limit");
573 break;
574 }
575
576 // STORE_STACK_ARG requires i64 operands. With ALU32 mode, the CC
577 // promotion may only extend to i32, so extend to i64 if needed.
578 if (Arg.getValueType() != MVT::i64)
579 Arg = DAG.getNode(ISD::ANY_EXTEND, CLI.DL, MVT::i64, Arg);
580
581 SDValue OffVal = DAG.getConstant(Off, CLI.DL, MVT::i64);
582 Chain = DAG.getNode(BPFISD::STORE_STACK_ARG, CLI.DL, MVT::Other, Chain,
583 OffVal, Arg);
584 continue;
585 }
586
587 report_fatal_error("unhandled argument location");
588 }
589
590 SDValue InGlue;
591
592 // Build a sequence of copy-to-reg nodes chained together with token chain and
593 // flag operands which copy the outgoing args into registers. The InGlue in
594 // necessary since all emitted instructions must be stuck together.
595 for (auto &Reg : RegsToPass) {
596 Chain = DAG.getCopyToReg(Chain, CLI.DL, Reg.first, Reg.second, InGlue);
597 InGlue = Chain.getValue(1);
598 }
599
600 // If the callee is a GlobalAddress node (quite common, every direct call is)
601 // turn it into a TargetGlobalAddress node so that legalize doesn't hack it.
602 // Likewise ExternalSymbol -> TargetExternalSymbol.
603 if (GlobalAddressSDNode *G = dyn_cast<GlobalAddressSDNode>(Callee)) {
604 Callee = DAG.getTargetGlobalAddress(G->getGlobal(), CLI.DL, PtrVT,
605 G->getOffset(), 0);
606 } else if (ExternalSymbolSDNode *E = dyn_cast<ExternalSymbolSDNode>(Callee)) {
607 Callee = DAG.getTargetExternalSymbol(E->getSymbol(), PtrVT, 0);
608 StringRef Sym = E->getSymbol();
609 if (!BPFAllowsLibcalls && Sym != BPF_TRAP && Sym != "__multi3" &&
610 Sym != "__divti3" && Sym != "__modti3" && Sym != "__udivti3" &&
611 Sym != "__umodti3" && Sym != "memcpy" && Sym != "memset" &&
612 Sym != "memmove")
613 fail(
614 CLI.DL, DAG,
615 Twine("A call to built-in function '" + Sym + "' is not supported."));
616 }
617
618 // Returns a chain & a flag for retval copy to use.
619 SDVTList NodeTys = DAG.getVTList(MVT::Other, MVT::Glue);
621 Ops.push_back(Chain);
622 Ops.push_back(Callee);
623
624 // Add argument registers to the end of the list so that they are
625 // known live into the call.
626 for (auto &Reg : RegsToPass)
627 Ops.push_back(DAG.getRegister(Reg.first, Reg.second.getValueType()));
628
629 bool HasFastCall =
630 (CLI.CB && isa<CallInst>(CLI.CB) && CLI.CB->hasFnAttr("bpf_fastcall"));
631 const TargetRegisterInfo *TRI = MF.getSubtarget().getRegisterInfo();
632 if (HasFastCall) {
633 uint32_t *RegMask = regMaskFromTemplate(
634 TRI, MF, TRI->getCallPreservedMask(MF, CallingConv::PreserveAll));
635 for (auto const &RegPair : RegsToPass)
636 resetRegMaskBit(TRI, RegMask, RegPair.first);
637 if (!CLI.CB->getType()->isVoidTy())
638 resetRegMaskBit(TRI, RegMask, BPF::R0);
639 Ops.push_back(DAG.getRegisterMask(RegMask));
640 } else {
641 Ops.push_back(
642 DAG.getRegisterMask(TRI->getCallPreservedMask(MF, CLI.CallConv)));
643 }
644
645 if (InGlue.getNode())
646 Ops.push_back(InGlue);
647
648 Chain = DAG.getNode(BPFISD::CALL, CLI.DL, NodeTys, Ops);
649 InGlue = Chain.getValue(1);
650
651 DAG.addNoMergeSiteInfo(Chain.getNode(), CLI.NoMerge);
652
653 // Create the CALLSEQ_END node.
654 Chain = DAG.getCALLSEQ_END(Chain, NumBytes, 0, InGlue, CLI.DL);
655 InGlue = Chain.getValue(1);
656
657 // Handle result values, copying them out of physregs into vregs that we
658 // return.
659 return LowerCallResult(Chain, InGlue, CallConv, IsVarArg, Ins, CLI.DL, DAG,
660 InVals);
661}
662
664BPFTargetLowering::LowerReturn(SDValue Chain, CallingConv::ID CallConv,
665 bool IsVarArg,
667 const SmallVectorImpl<SDValue> &OutVals,
668 const SDLoc &DL, SelectionDAG &DAG) const {
669 unsigned Opc = BPFISD::RET_GLUE;
670
671 // CCValAssign - represent the assignment of the return value to a location
673 MachineFunction &MF = DAG.getMachineFunction();
674
675 // CCState - Info about the registers and stack slot.
676 CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());
677
678 // Analize return values.
679 CCInfo.AnalyzeReturn(Outs, getHasAlu32() ? RetCC_BPF32 : RetCC_BPF64);
680
681 SDValue Glue;
682 SmallVector<SDValue, 4> RetOps(1, Chain);
683
684 // Copy the result values into the output registers.
685 for (size_t i = 0; i != RVLocs.size(); ++i) {
686 CCValAssign &VA = RVLocs[i];
687 if (!VA.isRegLoc())
688 report_fatal_error("stack return values are not supported");
689
690 Chain = DAG.getCopyToReg(Chain, DL, VA.getLocReg(), OutVals[i], Glue);
691
692 // Guarantee that all emitted copies are stuck together,
693 // avoiding something bad.
694 Glue = Chain.getValue(1);
695 RetOps.push_back(DAG.getRegister(VA.getLocReg(), VA.getLocVT()));
696 }
697
698 RetOps[0] = Chain; // Update chain.
699
700 // Add the glue if we have it.
701 if (Glue.getNode())
702 RetOps.push_back(Glue);
703
704 return DAG.getNode(Opc, DL, MVT::Other, RetOps);
705}
706
707SDValue BPFTargetLowering::LowerCallResult(
708 SDValue Chain, SDValue InGlue, CallingConv::ID CallConv, bool IsVarArg,
709 const SmallVectorImpl<ISD::InputArg> &Ins, const SDLoc &DL,
710 SelectionDAG &DAG, SmallVectorImpl<SDValue> &InVals) const {
711
712 MachineFunction &MF = DAG.getMachineFunction();
713 // Assign locations to each value returned by this call.
715 CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, *DAG.getContext());
716
717 CCInfo.AnalyzeCallResult(Ins, getHasAlu32() ? RetCC_BPF32 : RetCC_BPF64);
718
719 // Copy all of the result registers out of their specified physreg.
720 for (auto &Val : RVLocs) {
721 Chain = DAG.getCopyFromReg(Chain, DL, Val.getLocReg(),
722 Val.getValVT(), InGlue).getValue(1);
723 InGlue = Chain.getValue(2);
724 InVals.push_back(Chain.getValue(0));
725 }
726
727 return Chain;
728}
729
731 switch (CC) {
732 default:
733 break;
734 case ISD::SETULT:
735 case ISD::SETULE:
736 case ISD::SETLT:
737 case ISD::SETLE:
739 std::swap(LHS, RHS);
740 break;
741 }
742}
743
744SDValue BPFTargetLowering::LowerSDIVSREM(SDValue Op, SelectionDAG &DAG) const {
745 SDLoc DL(Op);
746 fail(DL, DAG,
747 "unsupported signed division, please convert to unsigned div/mod.");
748 return DAG.getUNDEF(Op->getValueType(0));
749}
750
751SDValue BPFTargetLowering::LowerShiftParts(SDValue Op,
752 SelectionDAG &DAG) const {
753 SDValue Lo, Hi;
754 expandShiftParts(Op.getNode(), Lo, Hi, DAG);
755 return DAG.getMergeValues({Lo, Hi}, SDLoc(Op));
756}
757
758SDValue BPFTargetLowering::LowerDYNAMIC_STACKALLOC(SDValue Op,
759 SelectionDAG &DAG) const {
760 SDLoc DL(Op);
761 fail(DL, DAG, "unsupported dynamic stack allocation");
762 auto Ops = {DAG.getConstant(0, SDLoc(), Op.getValueType()), Op.getOperand(0)};
763 return DAG.getMergeValues(Ops, SDLoc());
764}
765
766SDValue BPFTargetLowering::LowerBR_CC(SDValue Op, SelectionDAG &DAG) const {
767 SDValue Chain = Op.getOperand(0);
768 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(1))->get();
769 SDValue LHS = Op.getOperand(2);
770 SDValue RHS = Op.getOperand(3);
771 SDValue Dest = Op.getOperand(4);
772 SDLoc DL(Op);
773
774 if (!getHasJmpExt())
775 NegateCC(LHS, RHS, CC);
776
777 return DAG.getNode(BPFISD::BR_CC, DL, Op.getValueType(), Chain, LHS, RHS,
778 DAG.getConstant(CC, DL, LHS.getValueType()), Dest);
779}
780
781SDValue BPFTargetLowering::LowerSELECT_CC(SDValue Op, SelectionDAG &DAG) const {
782 SDValue LHS = Op.getOperand(0);
783 SDValue RHS = Op.getOperand(1);
784 SDValue TrueV = Op.getOperand(2);
785 SDValue FalseV = Op.getOperand(3);
786 ISD::CondCode CC = cast<CondCodeSDNode>(Op.getOperand(4))->get();
787 SDLoc DL(Op);
788
789 if (!getHasJmpExt())
790 NegateCC(LHS, RHS, CC);
791
792 SDValue TargetCC = DAG.getConstant(CC, DL, LHS.getValueType());
793 SDValue Ops[] = {LHS, RHS, TargetCC, TrueV, FalseV};
794
795 return DAG.getNode(BPFISD::SELECT_CC, DL, Op.getValueType(), Ops);
796}
797
798SDValue BPFTargetLowering::LowerATOMIC_LOAD_STORE(SDValue Op,
799 SelectionDAG &DAG) const {
800 SDNode *N = Op.getNode();
801 SDLoc DL(N);
802
803 if (cast<AtomicSDNode>(N)->getMergedOrdering() ==
805 fail(DL, DAG,
806 "sequentially consistent (seq_cst) "
807 "atomic load/store is not supported");
808
809 return Op;
810}
811
812SDValue BPFTargetLowering::LowerATOMIC_FENCE(SDValue Op,
813 SelectionDAG &DAG) const {
814 SDLoc DL(Op);
815 SyncScope::ID FenceSSID =
816 static_cast<SyncScope::ID>(Op.getConstantOperandVal(2));
817
818 if (FenceSSID == SyncScope::SingleThread)
819 // MEMBARRIER is a compiler barrier; it codegens to a no-op.
820 return DAG.getNode(ISD::MEMBARRIER, DL, MVT::Other, Op.getOperand(0));
821
822 report_fatal_error("Runtime fence is not supported at the moment");
823}
824
826 if (auto *Fn = M->getFunction(BPF_TRAP))
827 return Fn;
828
829 FunctionType *FT = FunctionType::get(Type::getVoidTy(M->getContext()), false);
830 Function *NewF =
832 NewF->setDSOLocal(true);
834 NewF->setSection(".ksyms");
835
836 if (M->debug_compile_units().empty())
837 return NewF;
838
839 DIBuilder DBuilder(*M);
840 DITypeArray ParamTypes =
841 DBuilder.getOrCreateTypeArray({nullptr /*void return*/});
842 DISubroutineType *FuncType = DBuilder.createSubroutineType(ParamTypes);
843 DICompileUnit *CU = *M->debug_compile_units_begin();
844 DISubprogram *SP =
845 DBuilder.createFunction(CU, BPF_TRAP, BPF_TRAP, nullptr, 0, FuncType, 0,
846 DINode::FlagZero, DISubprogram::SPFlagZero);
847 NewF->setSubprogram(SP);
848 return NewF;
849}
850
851SDValue BPFTargetLowering::LowerTRAP(SDValue Op, SelectionDAG &DAG) const {
852 MachineFunction &MF = DAG.getMachineFunction();
853 TargetLowering::CallLoweringInfo CLI(DAG);
855 SDNode *N = Op.getNode();
856 SDLoc DL(N);
857
859 auto PtrVT = getPointerTy(MF.getDataLayout());
860 CLI.Callee = DAG.getTargetGlobalAddress(Fn, DL, PtrVT);
861 CLI.Chain = N->getOperand(0);
862 CLI.IsTailCall = false;
864 CLI.IsVarArg = false;
865 CLI.DL = std::move(DL);
866 CLI.NoMerge = false;
867 CLI.DoesNotReturn = true;
868 return LowerCall(CLI, InVals);
869}
870
871SDValue BPFTargetLowering::LowerJumpTable(SDValue Op, SelectionDAG &DAG) const {
872 JumpTableSDNode *N = cast<JumpTableSDNode>(Op);
873 return getAddr(N, DAG);
874}
875
877 SelectionDAG &DAG, unsigned Flags) {
878 return DAG.getTargetConstantPool(N->getConstVal(), Ty, N->getAlign(),
879 N->getOffset(), Flags);
880}
881
883 SelectionDAG &DAG, unsigned Flags) {
884 return DAG.getTargetJumpTable(N->getIndex(), Ty, Flags);
885}
886
887template <class NodeTy>
888SDValue BPFTargetLowering::getAddr(NodeTy *N, SelectionDAG &DAG,
889 unsigned Flags) const {
890 SDLoc DL(N);
891
892 SDValue GA = getTargetNode(N, DL, MVT::i64, DAG, Flags);
893
894 return DAG.getNode(BPFISD::Wrapper, DL, MVT::i64, GA);
895}
896
897SDValue BPFTargetLowering::LowerGlobalAddress(SDValue Op,
898 SelectionDAG &DAG) const {
899 GlobalAddressSDNode *N = cast<GlobalAddressSDNode>(Op);
900 if (N->getOffset() != 0)
901 report_fatal_error("invalid offset for global address: " +
902 Twine(N->getOffset()));
903
904 const GlobalValue *GVal = N->getGlobal();
905 SDLoc DL(Op);
906
907 // Wrap it in a TargetGlobalAddress
908 SDValue Addr = DAG.getTargetGlobalAddress(GVal, DL, MVT::i64);
909
910 // Emit pseudo instruction
911 return SDValue(DAG.getMachineNode(BPF::LDIMM64, DL, MVT::i64, Addr), 0);
912}
913
914SDValue BPFTargetLowering::LowerConstantPool(SDValue Op,
915 SelectionDAG &DAG) const {
916 ConstantPoolSDNode *N = cast<ConstantPoolSDNode>(Op);
917
918 return getAddr(N, DAG);
919}
920
921SDValue BPFTargetLowering::LowerBlockAddress(SDValue Op,
922 SelectionDAG &DAG) const {
923 const BlockAddress *BA = cast<BlockAddressSDNode>(Op)->getBlockAddress();
924 SDLoc DL(Op);
925
926 // Wrap it in a TargetBlockAddress
927 SDValue Addr = DAG.getTargetBlockAddress(BA, MVT::i64);
928
929 // Emit pseudo instruction
930 return SDValue(DAG.getMachineNode(BPF::LDIMM64, DL, MVT::i64, Addr), 0);
931}
932
933unsigned
934BPFTargetLowering::EmitSubregExt(MachineInstr &MI, MachineBasicBlock *BB,
935 unsigned Reg, bool isSigned) const {
936 const TargetInstrInfo &TII = *BB->getParent()->getSubtarget().getInstrInfo();
937 const TargetRegisterClass *RC = getRegClassFor(MVT::i64);
938 int RShiftOp = isSigned ? BPF::SRA_ri : BPF::SRL_ri;
939 MachineFunction *F = BB->getParent();
940 DebugLoc DL = MI.getDebugLoc();
941
942 MachineRegisterInfo &RegInfo = F->getRegInfo();
943
944 if (!isSigned) {
945 Register PromotedReg0 = RegInfo.createVirtualRegister(RC);
946 BuildMI(BB, DL, TII.get(BPF::MOV_32_64), PromotedReg0).addReg(Reg);
947 return PromotedReg0;
948 }
949 Register PromotedReg0 = RegInfo.createVirtualRegister(RC);
950 Register PromotedReg1 = RegInfo.createVirtualRegister(RC);
951 Register PromotedReg2 = RegInfo.createVirtualRegister(RC);
952 if (HasMovsx) {
953 BuildMI(BB, DL, TII.get(BPF::MOVSX_rr_32), PromotedReg0).addReg(Reg);
954 } else {
955 BuildMI(BB, DL, TII.get(BPF::MOV_32_64), PromotedReg0).addReg(Reg);
956 BuildMI(BB, DL, TII.get(BPF::SLL_ri), PromotedReg1)
957 .addReg(PromotedReg0).addImm(32);
958 BuildMI(BB, DL, TII.get(RShiftOp), PromotedReg2)
959 .addReg(PromotedReg1).addImm(32);
960 }
961
962 return PromotedReg2;
963}
964
966BPFTargetLowering::EmitInstrWithCustomInserterMemcpy(MachineInstr &MI,
968 const {
969 MachineFunction *MF = MI.getParent()->getParent();
970 MachineRegisterInfo &MRI = MF->getRegInfo();
971 MachineInstrBuilder MIB(*MF, MI);
972 unsigned ScratchReg;
973
974 // This function does custom insertion during lowering BPFISD::MEMCPY which
975 // only has two register operands from memcpy semantics, the copy source
976 // address and the copy destination address.
977 //
978 // Because we will expand BPFISD::MEMCPY into load/store pairs, we will need
979 // a third scratch register to serve as the destination register of load and
980 // source register of store.
981 //
982 // The scratch register here is with the Define | Dead | EarlyClobber flags.
983 // The EarlyClobber flag has the semantic property that the operand it is
984 // attached to is clobbered before the rest of the inputs are read. Hence it
985 // must be unique among the operands to the instruction. The Define flag is
986 // needed to coerce the machine verifier that an Undef value isn't a problem
987 // as we anyway is loading memory into it. The Dead flag is needed as the
988 // value in scratch isn't supposed to be used by any other instruction.
989 ScratchReg = MRI.createVirtualRegister(&BPF::GPRRegClass);
990 MIB.addReg(ScratchReg,
992
993 return BB;
994}
995
996MachineBasicBlock *BPFTargetLowering::EmitInstrWithCustomInserterLDimm64(
997 MachineInstr &MI, MachineBasicBlock *BB) const {
998 MachineFunction *MF = BB->getParent();
999 const BPFInstrInfo *TII = MF->getSubtarget<BPFSubtarget>().getInstrInfo();
1000 const TargetRegisterClass *RC = getRegClassFor(MVT::i64);
1001 MachineRegisterInfo &RegInfo = MF->getRegInfo();
1002 DebugLoc DL = MI.getDebugLoc();
1003
1004 // Build address taken map for Global Varaibles and BlockAddresses
1005 DenseMap<const BasicBlock *, MachineBasicBlock *> AddressTakenBBs;
1006 for (MachineBasicBlock &MBB : *MF) {
1007 if (const BasicBlock *BB = MBB.getBasicBlock())
1008 if (BB->hasAddressTaken())
1009 AddressTakenBBs[BB] = &MBB;
1010 }
1011
1012 MachineOperand &MO = MI.getOperand(1);
1013 assert(MO.isBlockAddress() || MO.isGlobal());
1014
1015 Register ResultReg = MI.getOperand(0).getReg();
1016 Register TmpReg = RegInfo.createVirtualRegister(RC);
1017
1018 std::vector<MachineBasicBlock *> Targets;
1019 unsigned JTI;
1020
1021 if (MO.isBlockAddress()) {
1022 auto *BA = MO.getBlockAddress();
1023 MachineBasicBlock *TgtMBB = AddressTakenBBs[BA->getBasicBlock()];
1024 assert(TgtMBB);
1025
1026 Targets.push_back(TgtMBB);
1027 JTI = MF->getOrCreateJumpTableInfo(getJumpTableEncoding())
1028 ->createJumpTableIndex(Targets);
1029
1030 BuildMI(*BB, MI, DL, TII->get(BPF::LD_imm64), TmpReg)
1031 .addJumpTableIndex(JTI);
1032 BuildMI(*BB, MI, DL, TII->get(BPF::LDD), ResultReg)
1033 .addReg(TmpReg)
1034 .addImm(0);
1035 MI.eraseFromParent();
1036 return BB;
1037 }
1038
1039 // Helper: emit LD_imm64 with operand GlobalAddress or JumpTable
1040 auto emitLDImm64 = [&](const GlobalValue *GV = nullptr, unsigned JTI = -1) {
1041 auto MIB = BuildMI(*BB, MI, DL, TII->get(BPF::LD_imm64), ResultReg);
1042 if (GV)
1043 MIB.addGlobalAddress(GV);
1044 else
1045 MIB.addJumpTableIndex(JTI);
1046 MI.eraseFromParent();
1047 return BB;
1048 };
1049
1050 // Must be a global at this point
1051 const GlobalValue *GVal = MO.getGlobal();
1052 const auto *GV = dyn_cast<GlobalVariable>(GVal);
1053
1054 if (!GV || GV->getLinkage() != GlobalValue::PrivateLinkage ||
1055 !GV->isConstant() || !GV->hasInitializer())
1056 return emitLDImm64(GVal);
1057
1058 const auto *CA = dyn_cast<ConstantArray>(GV->getInitializer());
1059 if (!CA)
1060 return emitLDImm64(GVal);
1061
1062 for (const Use &Op : CA->operands()) {
1063 if (!isa<BlockAddress>(Op))
1064 return emitLDImm64(GVal);
1065 auto *BA = cast<BlockAddress>(Op);
1066 MachineBasicBlock *TgtMBB = AddressTakenBBs[BA->getBasicBlock()];
1067 assert(TgtMBB);
1068 Targets.push_back(TgtMBB);
1069 }
1070
1071 JTI = MF->getOrCreateJumpTableInfo(getJumpTableEncoding())
1072 ->createJumpTableIndex(Targets);
1073 return emitLDImm64(nullptr, JTI);
1074}
1075
1078 MachineBasicBlock *BB) const {
1080 DebugLoc DL = MI.getDebugLoc();
1081 unsigned Opc = MI.getOpcode();
1082 bool isSelectRROp = (Opc == BPF::Select ||
1083 Opc == BPF::Select_64_32 ||
1084 Opc == BPF::Select_32 ||
1085 Opc == BPF::Select_32_64);
1086
1087 bool isMemcpyOp = Opc == BPF::MEMCPY;
1088 bool isLDimm64Op = Opc == BPF::LDIMM64;
1089
1090#ifndef NDEBUG
1091 bool isSelectRIOp = (Opc == BPF::Select_Ri ||
1092 Opc == BPF::Select_Ri_64_32 ||
1093 Opc == BPF::Select_Ri_32 ||
1094 Opc == BPF::Select_Ri_32_64);
1095
1096 if (!(isSelectRROp || isSelectRIOp || isMemcpyOp || isLDimm64Op))
1097 report_fatal_error("unhandled instruction type: " + Twine(Opc));
1098#endif
1099
1100 if (isMemcpyOp)
1101 return EmitInstrWithCustomInserterMemcpy(MI, BB);
1102
1103 if (isLDimm64Op)
1104 return EmitInstrWithCustomInserterLDimm64(MI, BB);
1105
1106 bool is32BitCmp = (Opc == BPF::Select_32 ||
1107 Opc == BPF::Select_32_64 ||
1108 Opc == BPF::Select_Ri_32 ||
1109 Opc == BPF::Select_Ri_32_64);
1110
1111 // To "insert" a SELECT instruction, we actually have to insert the diamond
1112 // control-flow pattern. The incoming instruction knows the destination vreg
1113 // to set, the condition code register to branch on, the true/false values to
1114 // select between, and a branch opcode to use.
1115 const BasicBlock *LLVM_BB = BB->getBasicBlock();
1117
1118 // ThisMBB:
1119 // ...
1120 // TrueVal = ...
1121 // jmp_XX r1, r2 goto Copy1MBB
1122 // fallthrough --> Copy0MBB
1123 MachineBasicBlock *ThisMBB = BB;
1124 MachineFunction *F = BB->getParent();
1125 MachineBasicBlock *Copy0MBB = F->CreateMachineBasicBlock(LLVM_BB);
1126 MachineBasicBlock *Copy1MBB = F->CreateMachineBasicBlock(LLVM_BB);
1127
1128 F->insert(I, Copy0MBB);
1129 F->insert(I, Copy1MBB);
1130 // Update machine-CFG edges by transferring all successors of the current
1131 // block to the new block which will contain the Phi node for the select.
1132 Copy1MBB->splice(Copy1MBB->begin(), BB,
1133 std::next(MachineBasicBlock::iterator(MI)), BB->end());
1134 Copy1MBB->transferSuccessorsAndUpdatePHIs(BB);
1135 // Next, add the true and fallthrough blocks as its successors.
1136 BB->addSuccessor(Copy0MBB);
1137 BB->addSuccessor(Copy1MBB);
1138
1139 // Insert Branch if Flag
1140 int CC = MI.getOperand(3).getImm();
1141 int NewCC;
1142 switch (CC) {
1143#define SET_NEWCC(X, Y) \
1144 case ISD::X: \
1145 if (is32BitCmp && HasJmp32) \
1146 NewCC = isSelectRROp ? BPF::Y##_rr_32 : BPF::Y##_ri_32; \
1147 else \
1148 NewCC = isSelectRROp ? BPF::Y##_rr : BPF::Y##_ri; \
1149 break
1150 SET_NEWCC(SETGT, JSGT);
1151 SET_NEWCC(SETUGT, JUGT);
1152 SET_NEWCC(SETGE, JSGE);
1153 SET_NEWCC(SETUGE, JUGE);
1154 SET_NEWCC(SETEQ, JEQ);
1155 SET_NEWCC(SETNE, JNE);
1156 SET_NEWCC(SETLT, JSLT);
1157 SET_NEWCC(SETULT, JULT);
1158 SET_NEWCC(SETLE, JSLE);
1159 SET_NEWCC(SETULE, JULE);
1160 default:
1161 report_fatal_error("unimplemented select CondCode " + Twine(CC));
1162 }
1163
1164 Register LHS = MI.getOperand(1).getReg();
1165 bool isSignedCmp = (CC == ISD::SETGT ||
1166 CC == ISD::SETGE ||
1167 CC == ISD::SETLT ||
1168 CC == ISD::SETLE);
1169
1170 // eBPF at the moment only has 64-bit comparison. Any 32-bit comparison need
1171 // to be promoted, however if the 32-bit comparison operands are destination
1172 // registers then they are implicitly zero-extended already, there is no
1173 // need of explicit zero-extend sequence for them.
1174 //
1175 // We simply do extension for all situations in this method, but we will
1176 // try to remove those unnecessary in BPFMIPeephole pass.
1177 if (is32BitCmp && !HasJmp32)
1178 LHS = EmitSubregExt(MI, BB, LHS, isSignedCmp);
1179
1180 if (isSelectRROp) {
1181 Register RHS = MI.getOperand(2).getReg();
1182
1183 if (is32BitCmp && !HasJmp32)
1184 RHS = EmitSubregExt(MI, BB, RHS, isSignedCmp);
1185
1186 BuildMI(BB, DL, TII.get(NewCC)).addReg(LHS).addReg(RHS).addMBB(Copy1MBB);
1187 } else {
1188 int64_t imm32 = MI.getOperand(2).getImm();
1189 // Check before we build J*_ri instruction.
1190 if (!isInt<32>(imm32))
1191 report_fatal_error("immediate overflows 32 bits: " + Twine(imm32));
1192 BuildMI(BB, DL, TII.get(NewCC))
1193 .addReg(LHS).addImm(imm32).addMBB(Copy1MBB);
1194 }
1195
1196 // Copy0MBB:
1197 // %FalseValue = ...
1198 // # fallthrough to Copy1MBB
1199 BB = Copy0MBB;
1200
1201 // Update machine-CFG edges
1202 BB->addSuccessor(Copy1MBB);
1203
1204 // Copy1MBB:
1205 // %Result = phi [ %FalseValue, Copy0MBB ], [ %TrueValue, ThisMBB ]
1206 // ...
1207 BB = Copy1MBB;
1208 BuildMI(*BB, BB->begin(), DL, TII.get(BPF::PHI), MI.getOperand(0).getReg())
1209 .addReg(MI.getOperand(5).getReg())
1210 .addMBB(Copy0MBB)
1211 .addReg(MI.getOperand(4).getReg())
1212 .addMBB(ThisMBB);
1213
1214 MI.eraseFromParent(); // The pseudo instruction is gone now.
1215 return BB;
1216}
1217
1219 EVT VT) const {
1220 return getHasAlu32() ? MVT::i32 : MVT::i64;
1221}
1222
1224 EVT VT) const {
1225 return (getHasAlu32() && VT == MVT::i32) ? MVT::i32 : MVT::i64;
1226}
1227
1228bool BPFTargetLowering::isLegalAddressingMode(const DataLayout &DL,
1229 const AddrMode &AM, Type *Ty,
1230 unsigned AS,
1231 Instruction *I) const {
1232 // No global is ever allowed as a base.
1233 if (AM.BaseGV)
1234 return false;
1235
1236 switch (AM.Scale) {
1237 case 0: // "r+i" or just "i", depending on HasBaseReg.
1238 break;
1239 case 1:
1240 if (!AM.HasBaseReg) // allow "r+i".
1241 break;
1242 return false; // disallow "r+r" or "r+r+i".
1243 default:
1244 return false;
1245 }
1246
1247 return true;
1248}
1249
1250bool BPFTargetLowering::CanLowerReturn(
1251 CallingConv::ID CallConv, MachineFunction &MF, bool IsVarArg,
1253 const Type *RetTy) const {
1255 CCState CCInfo(CallConv, IsVarArg, MF, RVLocs, Context);
1256 return CCInfo.CheckReturn(Outs, getHasAlu32() ? RetCC_BPF32 : RetCC_BPF64);
1257}
return SDValue()
assert(UImm &&(UImm !=~static_cast< T >(0)) &&"Invalid immediate!")
MachineBasicBlock & MBB
MachineBasicBlock MachineBasicBlock::iterator DebugLoc DL
Function Alias Analysis Results
static uint32_t * regMaskFromTemplate(const TargetRegisterInfo *TRI, MachineFunction &MF, const uint32_t *BaseRegMask)
static Function * createBPFUnreachable(Module *M)
static cl::opt< bool > BPFAllowsLibcalls("bpf-allows-libcalls", cl::Hidden, cl::init(false), cl::desc("Allow libcalls instead of rejecting unsupported built-in " "functions"))
static SDValue getTargetNode(ConstantPoolSDNode *N, const SDLoc &DL, EVT Ty, SelectionDAG &DAG, unsigned Flags)
static cl::opt< bool > BPFExpandMemcpyInOrder("bpf-expand-memcpy-in-order", cl::Hidden, cl::init(false), cl::desc("Expand memcpy into load/store pairs in order"))
static SDValue convertLocValType(SelectionDAG &DAG, const SDLoc &DL, const CCValAssign &VA, EVT RegVT, SDValue ArgValue)
static void fail(const SDLoc &DL, SelectionDAG &DAG, const Twine &Msg, SDValue Val={})
static cl::opt< unsigned > BPFMinimumJumpTableEntries("bpf-min-jump-table-entries", cl::init(13), cl::Hidden, cl::desc("Set minimum number of entries to use a jump table on BPF"))
static void resetRegMaskBit(const TargetRegisterInfo *TRI, uint32_t *RegMask, MCRegister Reg)
static void NegateCC(SDValue &LHS, SDValue &RHS, ISD::CondCode &CC)
#define SET_NEWCC(X, Y)
#define BPF_TRAP
Definition BPF.h:25
static GCRegistry::Add< CoreCLRGC > E("coreclr", "CoreCLR-compatible GC")
static bool isSigned(unsigned Opcode)
const HexagonInstrInfo * TII
IRTranslator LLVM IR MI
Module.h This file contains the declarations for the Module class.
const AbstractManglingParser< Derived, Alloc >::OperatorInfo AbstractManglingParser< Derived, Alloc >::Ops[]
#define F(x, y, z)
Definition MD5.cpp:54
#define I(x, y, z)
Definition MD5.cpp:57
#define G(x, y, z)
Definition MD5.cpp:55
Register Reg
Register const TargetRegisterInfo * TRI
Promote Memory to Register
Definition Mem2Reg.cpp:110
Value * RHS
Value * LHS
unsigned getCommonMaxStoresPerMemFunc() const
bool hasSdivSmod() const
bool getAllowsMisalignedMemAccess() const
bool getHasJmpExt() const
const BPFSelectionDAGInfo * getSelectionDAGInfo() const override
bool hasLdsx() const
bool hasGotox() const
bool hasMovsx() const
bool getHasJmp32() const
const BPFRegisterInfo * getRegisterInfo() const override
bool getHasAlu32() const
BPFTargetLowering::ConstraintType getConstraintType(StringRef Constraint) const override
Given a constraint, return the type of constraint it is for this target.
unsigned getJumpTableEncoding() const override
Return the entry encoding for a jump table in the current function.
bool isOffsetFoldingLegal(const GlobalAddressSDNode *GA) const override
Return true if folding a constant offset with the given GlobalAddress is legal.
bool allowsMisalignedMemoryAccesses(EVT VT, unsigned, Align, MachineMemOperand::Flags, unsigned *) const override
Determine if the target supports unaligned memory accesses.
EVT getSetCCResultType(const DataLayout &DL, LLVMContext &Context, EVT VT) const override
Return the ValueType of the result of SETCC operations.
BPFTargetLowering(const TargetMachine &TM, const BPFSubtarget &STI)
SDValue LowerOperation(SDValue Op, SelectionDAG &DAG) const override
This callback is invoked for operations that are unsupported by the target, which are registered to u...
MachineBasicBlock * EmitInstrWithCustomInserter(MachineInstr &MI, MachineBasicBlock *BB) const override
This method should be implemented by targets that mark instructions with the 'usesCustomInserter' fla...
MVT getScalarShiftAmountTy(const DataLayout &, EVT) const override
Return the type to use for a scalar shift opcode, given the shifted amount type.
std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const override
Given a physical register constraint (e.g.
LLVM Basic Block Representation.
Definition BasicBlock.h:62
BasicBlock * getBasicBlock() const
Definition Constants.h:1117
CCValAssign - Represent assignment of one arg/retval to a location.
Register getLocReg() const
LocInfo getLocInfo() const
int64_t getLocMemOffset() const
bool hasFnAttr(Attribute::AttrKind Kind) const
Determine whether this call has the given attribute.
LLVM_ABI DISubroutineType * createSubroutineType(DITypeArray ParameterTypes, DINode::DIFlags Flags=DINode::FlagZero, unsigned CC=0)
Create subroutine type.
LLVM_ABI DISubprogram * createFunction(DIScope *Scope, StringRef Name, StringRef LinkageName, DIFile *File, unsigned LineNo, DISubroutineType *Ty, unsigned ScopeLine, DINode::DIFlags Flags=DINode::FlagZero, DISubprogram::DISPFlags SPFlags=DISubprogram::SPFlagZero, DITemplateParameterArray TParams=nullptr, DISubprogram *Decl=nullptr, DITypeArray ThrownTypes=nullptr, DINodeArray Annotations=nullptr, StringRef TargetFuncName="", bool UseKeyInstructions=false)
Create a new descriptor for the specified subprogram.
LLVM_ABI DITypeArray getOrCreateTypeArray(ArrayRef< Metadata * > Elements)
Get a DITypeArray, create one if required.
Subprogram description. Uses SubclassData1.
Type array for a subprogram.
A parsed version of the target data layout string in and methods for querying it.
Definition DataLayout.h:64
A debug info location.
Definition DebugLoc.h:123
Diagnostic information for unsupported feature in backend.
static LLVM_ABI FunctionType * get(Type *Result, ArrayRef< Type * > Params, bool isVarArg)
This static method is the primary way of constructing a FunctionType.
void setSubprogram(DISubprogram *SP)
Set the attached subprogram.
static Function * Create(FunctionType *Ty, LinkageTypes Linkage, unsigned AddrSpace, const Twine &N="", Module *M=nullptr)
Definition Function.h:168
void setCallingConv(CallingConv::ID CC)
Definition Function.h:276
LLVM_ABI void setSection(StringRef S)
Change the section for this global.
Definition Globals.cpp:339
LinkageTypes getLinkage() const
Module * getParent()
Get the module that this global value is contained inside of...
void setDSOLocal(bool Local)
@ PrivateLinkage
Like Internal, but omit from symbol table.
Definition GlobalValue.h:61
@ ExternalWeakLinkage
ExternalWeak linkage description.
Definition GlobalValue.h:62
This is an important class for using LLVM in a threaded context.
Definition LLVMContext.h:68
LLVM_ABI void diagnose(const DiagnosticInfo &DI)
Report a message to the currently installed diagnostic handler.
Wrapper class representing physical registers. Should be passed by value.
Definition MCRegister.h:41
Machine Value Type.
SimpleValueType SimpleTy
static auto integer_valuetypes()
LLVM_ABI void transferSuccessorsAndUpdatePHIs(MachineBasicBlock *FromMBB)
Transfers all the successors, as in transferSuccessors, and update PHI operands in the successor bloc...
const BasicBlock * getBasicBlock() const
Return the LLVM basic block that this instance corresponded to originally.
bool hasAddressTaken() const
Test whether this block is used as something other than the target of a terminator,...
LLVM_ABI void addSuccessor(MachineBasicBlock *Succ, BranchProbability Prob=BranchProbability::getUnknown())
Add Succ as a successor of this MachineBasicBlock.
const MachineFunction * getParent() const
Return the MachineFunction containing this basic block.
void splice(iterator Where, MachineBasicBlock *Other, iterator From)
Take an instruction from MBB 'Other' at the position From, and insert it into this MBB right before '...
MachineInstrBundleIterator< MachineInstr > iterator
const TargetSubtargetInfo & getSubtarget() const
getSubtarget - Return the subtarget for which this machine code is being compiled.
uint32_t * allocateRegMask()
Allocate and initialize a register mask with NumRegister bits.
MachineRegisterInfo & getRegInfo()
getRegInfo - Return information about the registers currently in use.
const DataLayout & getDataLayout() const
Return the DataLayout attached to the Module associated to this MF.
Function & getFunction()
Return the LLVM function that this machine code represents.
BasicBlockListType::iterator iterator
const MachineInstrBuilder & addReg(Register RegNo, RegState Flags={}, unsigned SubReg=0) const
Add a new virtual register operand.
const MachineInstrBuilder & addImm(int64_t Val) const
Add a new immediate operand.
const MachineInstrBuilder & addJumpTableIndex(unsigned Idx, unsigned TargetFlags=0) const
const MachineInstrBuilder & addMBB(MachineBasicBlock *MBB, unsigned TargetFlags=0) const
Representation of each machine instruction.
@ EK_BlockAddress
EK_BlockAddress - Each entry is a plain address of block, e.g.: .word LBB123.
Flags
Flags values. These may be or'd together.
const GlobalValue * getGlobal() const
const BlockAddress * getBlockAddress() const
static unsigned getRegMaskSize(unsigned NumRegs)
Returns number of elements needed for a regmask array.
bool isGlobal() const
isGlobal - Tests if this is a MO_GlobalAddress operand.
bool isBlockAddress() const
isBlockAddress - Tests if this is a MO_BlockAddress operand.
LLVM_ABI Register createVirtualRegister(const TargetRegisterClass *RegClass, StringRef Name="")
createVirtualRegister - Create and return a new virtual register in the function with the specified r...
void addLiveIn(MCRegister Reg, Register vreg=Register())
addLiveIn - Add the specified register as a live-in.
A Module instance is used to store all the information related to an LLVM module.
Definition Module.h:68
Wrapper class representing virtual and physical registers.
Definition Register.h:20
Wrapper class for IR location info (IR ordering and DebugLoc) to be passed into SDNode creation funct...
Represents one node in the SelectionDAG.
const SDValue & getOperand(unsigned Num) const
Unlike LLVM values, Selection DAG nodes may return multiple values as the result of a computation.
SDNode * getNode() const
get the SDNode which holds the desired result
SDValue getValue(unsigned R) const
EVT getValueType() const
Return the ValueType of the referenced return value.
unsigned getOpcode() const
This is used to represent a portion of an LLVM function in a low-level Data Dependence DAG representa...
SDValue getTargetGlobalAddress(const GlobalValue *GV, const SDLoc &DL, EVT VT, int64_t offset=0, unsigned TargetFlags=0)
SDValue getCopyToReg(SDValue Chain, const SDLoc &dl, Register Reg, SDValue N)
LLVM_ABI SDValue getMergeValues(ArrayRef< SDValue > Ops, const SDLoc &dl)
Create a MERGE_VALUES node from the given operands.
LLVM_ABI SDVTList getVTList(EVT VT)
Return an SDVTList that represents the list of values specified.
LLVM_ABI MachineSDNode * getMachineNode(unsigned Opcode, const SDLoc &dl, EVT VT)
These are used for target selectors to create a new node with specified return type(s),...
LLVM_ABI SDValue getRegister(Register Reg, EVT VT)
void addNoMergeSiteInfo(const SDNode *Node, bool NoMerge)
Set NoMergeSiteInfo to be associated with Node if NoMerge is true.
SDValue getTargetJumpTable(int JTI, EVT VT, unsigned TargetFlags=0)
SDValue getUNDEF(EVT VT)
Return an UNDEF node. UNDEF does not have a useful SDLoc.
SDValue getCALLSEQ_END(SDValue Chain, SDValue Op1, SDValue Op2, SDValue InGlue, const SDLoc &DL)
Return a new CALLSEQ_END node, which always must have a glue result (to ensure it's not CSE'd).
SDValue getCopyFromReg(SDValue Chain, const SDLoc &dl, Register Reg, EVT VT)
LLVM_ABI SDValue getConstant(uint64_t Val, const SDLoc &DL, EVT VT, bool isTarget=false, bool isOpaque=false)
Create a ConstantSDNode wrapping a constant value.
SDValue getCALLSEQ_START(SDValue Chain, uint64_t InSize, uint64_t OutSize, const SDLoc &DL)
Return a new CALLSEQ_START node, that starts new call frame, in which InSize bytes are set up inside ...
LLVM_ABI SDValue getValueType(EVT)
LLVM_ABI SDValue getNode(unsigned Opcode, const SDLoc &DL, EVT VT, ArrayRef< SDUse > Ops)
Gets or creates the specified node.
SDValue getTargetBlockAddress(const BlockAddress *BA, EVT VT, int64_t Offset=0, unsigned TargetFlags=0)
MachineFunction & getMachineFunction() const
LLVM_ABI SDValue getRegisterMask(const uint32_t *RegMask)
LLVMContext * getContext() const
LLVM_ABI SDValue getTargetExternalSymbol(const char *Sym, EVT VT, unsigned TargetFlags=0)
SDValue getTargetConstantPool(const Constant *C, EVT VT, MaybeAlign Align=std::nullopt, int Offset=0, unsigned TargetFlags=0)
This class consists of common code factored out of the SmallVector class to reduce code duplication b...
void push_back(const T &Elt)
Represent a constant reference to a string, i.e.
Definition StringRef.h:56
constexpr size_t size() const
Get the string size.
Definition StringRef.h:144
TargetInstrInfo - Interface to description of machine instruction set.
void setOperationAction(unsigned Op, MVT VT, LegalizeAction Action)
Indicate that the specified operation does not work with the specified type and indicate what to do a...
unsigned MaxStoresPerMemcpyOptSize
Likewise for functions with the OptSize attribute.
virtual const TargetRegisterClass * getRegClassFor(MVT VT, bool isDivergent=false) const
Return the register class that should be used for the specified value type.
unsigned MaxLoadsPerMemcmp
Specify maximum number of load instructions per memcmp call.
virtual bool isZExtFree(Type *FromTy, Type *ToTy) const
Return true if any actual instruction that defines a value of type FromTy implicitly zero-extends the...
void setMaxAtomicSizeInBitsSupported(unsigned SizeInBits)
Set the maximum atomic operation size supported by the backend.
void setMinFunctionAlignment(Align Alignment)
Set the target's minimum function alignment.
unsigned MaxStoresPerMemsetOptSize
Likewise for functions with the OptSize attribute.
void setBooleanContents(BooleanContent Ty)
Specify how the target extends the result of integer and floating point boolean values from i1 to a w...
unsigned MaxStoresPerMemmove
Specify maximum number of store instructions per memmove call.
void computeRegisterProperties(const TargetRegisterInfo *TRI)
Once all of the register classes are added, this allows us to compute derived properties we expose.
unsigned MaxStoresPerMemmoveOptSize
Likewise for functions with the OptSize attribute.
void addRegisterClass(MVT VT, const TargetRegisterClass *RC)
Add the specified register class as an available regclass for the specified value type.
virtual MVT getPointerTy(const DataLayout &DL, uint32_t AS=0) const
Return the pointer type for the given address space, defaults to the pointer type from the data layou...
void setPrefFunctionAlignment(Align Alignment)
Set the target's preferred function alignment.
unsigned MaxStoresPerMemset
Specify maximum number of store instructions per memset call.
void setMinimumJumpTableEntries(unsigned Val)
Indicate the minimum number of blocks to generate jump tables.
unsigned MaxLoadsPerMemcmpOptSize
Likewise for functions with the OptSize attribute.
void setStackPointerRegisterToSaveRestore(Register R)
If set to a physical register, this specifies the register that llvm.savestack/llvm....
void setLoadExtAction(unsigned ExtType, MVT ValVT, MVT MemVT, LegalizeAction Action)
Indicate that the specified load with extension does not work with the specified type and indicate wh...
unsigned MaxStoresPerMemcpy
Specify maximum number of store instructions per memcpy call.
virtual ConstraintType getConstraintType(StringRef Constraint) const
Given a constraint, return the type of constraint it is for this target.
virtual std::pair< unsigned, const TargetRegisterClass * > getRegForInlineAsmConstraint(const TargetRegisterInfo *TRI, StringRef Constraint, MVT VT) const
Given a physical register constraint (e.g.
TargetLowering(const TargetLowering &)=delete
void expandShiftParts(SDNode *N, SDValue &Lo, SDValue &Hi, SelectionDAG &DAG) const
Expand shift-by-parts.
Primary interface to the complete machine description for the target machine.
TargetRegisterInfo base class - We assume that the target defines a static array of TargetRegisterDes...
virtual const TargetInstrInfo * getInstrInfo() const
virtual const TargetRegisterInfo * getRegisterInfo() const =0
Return the target's register information.
Twine - A lightweight data structure for efficiently representing the concatenation of temporary valu...
Definition Twine.h:82
The instances of the Type class are immutable: once they are created, they are never changed.
Definition Type.h:46
static LLVM_ABI Type * getVoidTy(LLVMContext &C)
Definition Type.cpp:282
LLVM_ABI TypeSize getPrimitiveSizeInBits() const LLVM_READONLY
Return the basic size of this type if it is a primitive type.
Definition Type.cpp:197
bool isIntegerTy() const
True if this is an instance of IntegerType.
Definition Type.h:257
bool isVoidTy() const
Return true if this is 'void'.
Definition Type.h:141
Type * getType() const
All values are typed, get the type of this value.
Definition Value.h:255
self_iterator getIterator()
Definition ilist_node.h:123
A raw_ostream that writes to an std::string.
unsigned ID
LLVM IR allows to use arbitrary numbers as calling convention identifiers.
Definition CallingConv.h:24
@ PreserveAll
Used for runtime calls that preserves (almost) all registers.
Definition CallingConv.h:66
@ Fast
Attempts to make calls as fast as possible (e.g.
Definition CallingConv.h:41
@ C
The default llvm calling convention, compatible with C.
Definition CallingConv.h:34
@ SETCC
SetCC operator - This evaluates to a true value iff the condition is true.
Definition ISDOpcodes.h:823
@ STACKRESTORE
STACKRESTORE has two operands, an input chain and a pointer to restore to it returns an output chain.
@ STACKSAVE
STACKSAVE - STACKSAVE has one operand, an input chain.
@ SMUL_LOHI
SMUL_LOHI/UMUL_LOHI - Multiply two integers of type iN, producing a signed/unsigned value of type i[2...
Definition ISDOpcodes.h:275
@ BSWAP
Byte Swap and Counting operators.
Definition ISDOpcodes.h:783
@ ATOMIC_STORE
OUTCHAIN = ATOMIC_STORE(INCHAIN, val, ptr) This corresponds to "store atomic" instruction.
@ LOAD
LOAD and STORE have token chains as their first operand, then the same operands as an LLVM load/store...
@ ANY_EXTEND
ANY_EXTEND - Used for integer types. The high bits are undefined.
Definition ISDOpcodes.h:857
@ GlobalAddress
Definition ISDOpcodes.h:88
@ ATOMIC_CMP_SWAP_WITH_SUCCESS
Val, Success, OUTCHAIN = ATOMIC_CMP_SWAP_WITH_SUCCESS(INCHAIN, ptr, cmp, swap) N.b.
@ MEMBARRIER
MEMBARRIER - Compiler barrier only; generate a no-op.
@ ATOMIC_FENCE
OUTCHAIN = ATOMIC_FENCE(INCHAIN, ordering, scope) This corresponds to the fence instruction.
@ SDIVREM
SDIVREM/UDIVREM - Divide two integers and produce both a quotient and remainder result.
Definition ISDOpcodes.h:280
@ CTLZ_ZERO_POISON
Definition ISDOpcodes.h:792
@ SIGN_EXTEND
Conversion operators.
Definition ISDOpcodes.h:848
@ BR_CC
BR_CC - Conditional branch.
@ BRIND
BRIND - Indirect branch.
@ BR_JT
BR_JT - Jumptable branch.
@ SELECT
Select(COND, TRUEVAL, FALSEVAL).
Definition ISDOpcodes.h:800
@ ATOMIC_LOAD
Val, OUTCHAIN = ATOMIC_LOAD(INCHAIN, ptr) This corresponds to "load atomic" instruction.
@ MULHU
MULHU/MULHS - Multiply high - Multiply two integers of type iN, producing an unsigned/signed value of...
Definition ISDOpcodes.h:704
@ ZERO_EXTEND
ZERO_EXTEND - Used for integer types, zeroing the new bits.
Definition ISDOpcodes.h:854
@ SELECT_CC
Select with condition operator - This selects between a true value and a false value (ops #2 and #3) ...
Definition ISDOpcodes.h:815
@ DYNAMIC_STACKALLOC
DYNAMIC_STACKALLOC - Allocate some number of bytes on the stack aligned to a specified boundary.
@ SIGN_EXTEND_INREG
SIGN_EXTEND_INREG - This operator atomically performs a SHL/SRA pair to sign extend a small value in ...
Definition ISDOpcodes.h:892
@ TRAP
TRAP - Trapping instruction.
@ ATOMIC_SWAP
Val, OUTCHAIN = ATOMIC_SWAP(INCHAIN, ptr, amt) Val, OUTCHAIN = ATOMIC_LOAD_[OpName](INCHAIN,...
@ CTTZ_ZERO_POISON
Bit counting operators with a poisoned result for zero inputs.
Definition ISDOpcodes.h:791
@ TRUNCATE
TRUNCATE - Completely drop the high bits.
Definition ISDOpcodes.h:860
@ BRCOND
BRCOND - Conditional branch.
@ SHL_PARTS
SHL_PARTS/SRA_PARTS/SRL_PARTS - These operators are used for expanded integer shift operations.
Definition ISDOpcodes.h:837
@ AssertSext
AssertSext, AssertZext - These nodes record if a register contains a value that has already been zero...
Definition ISDOpcodes.h:62
LLVM_ABI CondCode getSetCCSwappedOperands(CondCode Operation)
Return the operation corresponding to (Y op X) when given the operation for (X op Y).
CondCode
ISD::CondCode enum - These are ordered carefully to make the bitfields below work out,...
@ SingleThread
Synchronized with respect to signal handlers executing in the same thread.
Definition LLVMContext.h:55
initializer< Ty > init(const Ty &Val)
This is an optimization pass for GlobalISel generic memory operations.
MachineInstrBuilder BuildMI(MachineFunction &MF, const MIMetadata &MIMD, const MCInstrDesc &MCID)
Builder interface. Specify how to create the initial instruction itself.
constexpr bool isInt(int64_t x)
Checks if an integer fits into the given bit width.
Definition MathExtras.h:165
@ Dead
Unused definition.
@ EarlyClobber
Register definition happens before uses.
@ Define
Register definition.
decltype(auto) dyn_cast(const From &Val)
dyn_cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:643
detail::concat_range< ValueT, RangeTs... > concat(RangeTs &&...Ranges)
Returns a concatenated range across two or more ranges.
Definition STLExtras.h:1151
LLVM_ABI void report_fatal_error(Error Err, bool gen_crash_diag=true)
Definition Error.cpp:163
class LLVM_GSL_OWNER SmallVector
Forward declaration of SmallVector so that calculateSmallVectorDefaultInlinedElements can reference s...
bool isa(const From &Val)
isa<X> - Return true if the parameter to the template is an instance of one of the template type argu...
Definition Casting.h:547
uint16_t MCPhysReg
An unsigned integer type large enough to represent all physical registers, but not necessarily virtua...
Definition MCRegister.h:21
DWARFExpression::Operation Op
decltype(auto) cast(const From &Val)
cast<X> - Return the argument parameter cast to the specified type.
Definition Casting.h:559
void swap(llvm::BitVector &LHS, llvm::BitVector &RHS)
Implement std::swap in terms of BitVector swap.
Definition BitVector.h:876
#define N
This struct is a compact representation of a valid (non-zero power of two) alignment.
Definition Alignment.h:39
Extended Value Type.
Definition ValueTypes.h:35
bool isSimple() const
Test if the given EVT is simple (as opposed to being extended).
Definition ValueTypes.h:145
TypeSize getSizeInBits() const
Return the size of the specified value type in bits.
Definition ValueTypes.h:396
MVT getSimpleVT() const
Return the SimpleValueType held in the specified simple EVT.
Definition ValueTypes.h:339
void print(raw_ostream &OS) const
Implement operator<<.
Definition ValueTypes.h:527
bool isInteger() const
Return true if this is an integer or a vector integer type.
Definition ValueTypes.h:160
This structure contains all information that is necessary for lowering calls.
SmallVector< ISD::InputArg, 32 > Ins
SmallVector< ISD::OutputArg, 32 > Outs