X86LegalizerInfo.cpp
1//===- X86LegalizerInfo.cpp --------------------------------------*- C++ -*-==//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8/// \file
9/// This file implements the targeting of the MachineLegalizer class for X86.
10/// \todo This should be generated by TableGen.
11//===----------------------------------------------------------------------===//
12
13#include "X86LegalizerInfo.h"
14#include "X86Subtarget.h"
15#include "X86TargetMachine.h"
24#include "llvm/IR/IntrinsicsX86.h"
25#include "llvm/IR/Type.h"
26
27using namespace llvm;
28using namespace TargetOpcode;
29using namespace LegalizeActions;
30using namespace LegalityPredicates;
31
32X86LegalizerInfo::X86LegalizerInfo(const X86Subtarget &STI,
33 const X86TargetMachine &TM)
34 : Subtarget(STI) {
35
36 bool Is64Bit = Subtarget.is64Bit();
37 bool HasCMOV = Subtarget.canUseCMOV();
38 bool HasSSE1 = Subtarget.hasSSE1();
39 bool HasSSE2 = Subtarget.hasSSE2();
40 bool HasSSE41 = Subtarget.hasSSE41();
41 bool HasAVX = Subtarget.hasAVX();
42 bool HasAVX2 = Subtarget.hasAVX2();
43 bool HasAVX512 = Subtarget.hasAVX512();
44 bool HasVLX = Subtarget.hasVLX();
45 bool HasDQI = Subtarget.hasAVX512() && Subtarget.hasDQI();
46 bool HasBWI = Subtarget.hasAVX512() && Subtarget.hasBWI();
47 bool UseX87 = !Subtarget.useSoftFloat() && Subtarget.hasX87();
48 bool HasPOPCNT = Subtarget.hasPOPCNT();
49 bool HasLZCNT = Subtarget.hasLZCNT();
50 bool HasBMI = Subtarget.hasBMI();
51
52 const LLT p0 = LLT::pointer(0, TM.getPointerSizeInBits(0));
53 const LLT s1 = LLT::scalar(1);
54 const LLT s8 = LLT::scalar(8);
55 const LLT s16 = LLT::scalar(16);
56 const LLT s32 = LLT::scalar(32);
57 const LLT s64 = LLT::scalar(64);
58 const LLT s80 = LLT::scalar(80);
59 const LLT s128 = LLT::scalar(128);
60 const LLT sMaxScalar = Subtarget.is64Bit() ? s64 : s32;
61 const LLT v2s32 = LLT::fixed_vector(2, 32);
62 const LLT v4s8 = LLT::fixed_vector(4, 8);
63
64 const LLT v16s8 = LLT::fixed_vector(16, 8);
65 const LLT v8s16 = LLT::fixed_vector(8, 16);
66 const LLT v4s32 = LLT::fixed_vector(4, 32);
67 const LLT v2s64 = LLT::fixed_vector(2, 64);
68 const LLT v2p0 = LLT::fixed_vector(2, p0);
69
70 const LLT v32s8 = LLT::fixed_vector(32, 8);
71 const LLT v16s16 = LLT::fixed_vector(16, 16);
72 const LLT v8s32 = LLT::fixed_vector(8, 32);
73 const LLT v4s64 = LLT::fixed_vector(4, 64);
74 const LLT v4p0 = LLT::fixed_vector(4, p0);
75
76 const LLT v64s8 = LLT::fixed_vector(64, 8);
77 const LLT v32s16 = LLT::fixed_vector(32, 16);
78 const LLT v16s32 = LLT::fixed_vector(16, 32);
79 const LLT v8s64 = LLT::fixed_vector(8, 64);
80
81 const LLT s8MaxVector = HasAVX512 ? v64s8 : HasAVX ? v32s8 : v16s8;
82 const LLT s16MaxVector = HasAVX512 ? v32s16 : HasAVX ? v16s16 : v8s16;
83 const LLT s32MaxVector = HasAVX512 ? v16s32 : HasAVX ? v8s32 : v4s32;
84 const LLT s64MaxVector = HasAVX512 ? v8s64 : HasAVX ? v4s64 : v2s64;
85
86 // todo: AVX512 bool vector predicate types
87
88 // implicit/constants
89 // 32/64-bit mode needs support for s64/s128 to handle cases:
90 // s64 = EXTEND (G_IMPLICIT_DEF s32) -> s64 = G_IMPLICIT_DEF
91 // s128 = EXTEND (G_IMPLICIT_DEF s32/s64) -> s128 = G_IMPLICIT_DEF
92 getActionDefinitionsBuilder(G_IMPLICIT_DEF)
93 .legalFor({p0, s1, s8, s16, s32, s64})
94 .legalFor(Is64Bit, {s128});
95
96 getActionDefinitionsBuilder(G_CONSTANT)
97 .legalFor({p0, s8, s16, s32})
98 .legalFor(Is64Bit, {s64})
99 .widenScalarToNextPow2(0, /*Min=*/8)
100 .clampScalar(0, s8, sMaxScalar);
101
102 getActionDefinitionsBuilder({G_LROUND, G_LLROUND, G_FCOS, G_FCOSH, G_FACOS,
103 G_FSIN, G_FSINH, G_FASIN, G_FTAN, G_FTANH,
104 G_FATAN, G_FATAN2, G_FPOW, G_FEXP, G_FEXP2,
105 G_FEXP10, G_FLOG, G_FLOG2, G_FLOG10, G_FPOWI,
106 G_FSINCOS, G_FCEIL, G_FFLOOR})
107 .libcall();
108
110 .legalFor(HasSSE1 || UseX87, {s32})
111 .legalFor(HasSSE2 || UseX87, {s64})
112 .legalFor(UseX87, {s80});
113
114 getActionDefinitionsBuilder({G_GET_ROUNDING, G_SET_ROUNDING})
115 .customFor({s32});
116
117 // merge/unmerge
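// Illustration: s128 = G_MERGE_VALUES s64, s64 and s32, s32 = G_UNMERGE_VALUES s64
// both satisfy the size predicate built in the loop below, while odd sizes such
// as s24 are first widened to the next power of two.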
118 for (unsigned Op : {G_MERGE_VALUES, G_UNMERGE_VALUES}) {
119 unsigned BigTyIdx = Op == G_MERGE_VALUES ? 0 : 1;
120 unsigned LitTyIdx = Op == G_MERGE_VALUES ? 1 : 0;
121 getActionDefinitionsBuilder(Op)
122 .widenScalarToNextPow2(LitTyIdx, /*Min=*/8)
123 .widenScalarToNextPow2(BigTyIdx, /*Min=*/16)
124 .minScalar(LitTyIdx, s8)
125 .minScalar(BigTyIdx, s32)
126 .legalIf([=](const LegalityQuery &Q) {
127 switch (Q.Types[BigTyIdx].getSizeInBits()) {
128 case 16:
129 case 32:
130 case 64:
131 case 128:
132 case 256:
133 case 512:
134 break;
135 default:
136 return false;
137 }
138 switch (Q.Types[LitTyIdx].getSizeInBits()) {
139 case 8:
140 case 16:
141 case 32:
142 case 64:
143 case 128:
144 case 256:
145 return true;
146 default:
147 return false;
148 }
149 });
150 }
151
152 // integer addition/subtraction
153 getActionDefinitionsBuilder({G_ADD, G_SUB})
154 .legalFor({s8, s16, s32})
155 .legalFor(Is64Bit, {s64})
156 .legalFor(HasSSE2, {v16s8, v8s16, v4s32, v2s64})
157 .legalFor(HasAVX2, {v32s8, v16s16, v8s32, v4s64})
158 .legalFor(HasAVX512, {v16s32, v8s64})
159 .legalFor(HasBWI, {v64s8, v32s16})
160 .clampMinNumElements(0, s8, 16)
161 .clampMinNumElements(0, s16, 8)
162 .clampMinNumElements(0, s32, 4)
163 .clampMinNumElements(0, s64, 2)
164 .clampMaxNumElements(0, s8, HasBWI ? 64 : (HasAVX2 ? 32 : 16))
165 .clampMaxNumElements(0, s16, HasBWI ? 32 : (HasAVX2 ? 16 : 8))
166 .clampMaxNumElements(0, s32, HasAVX512 ? 16 : (HasAVX2 ? 8 : 4))
167 .clampMaxNumElements(0, s64, HasAVX512 ? 8 : (HasAVX2 ? 4 : 2))
168 .widenScalarToNextPow2(0, /*Min=*/32)
169 .clampScalar(0, s8, sMaxScalar)
170 .scalarize(0);
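// Illustration: with SSE2 but no AVX2, a <32 x s8> G_ADD is broken into
// <16 x s8> pieces by clampMaxNumElements; an s3 add is widened to s32 by
// widenScalarToNextPow2 (Min=32) and an s128 add is narrowed to sMaxScalar
// chunks by clampScalar.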
171
172 getActionDefinitionsBuilder({G_UADDE, G_UADDO, G_USUBE, G_USUBO})
173 .legalFor({{s8, s1}, {s16, s1}, {s32, s1}})
174 .legalFor(Is64Bit, {{s64, s1}})
175 .widenScalarToNextPow2(0, /*Min=*/32)
176 .clampScalar(0, s8, sMaxScalar)
177 .clampScalar(1, s1, s1)
178 .scalarize(0);
179
180 // integer multiply
181 getActionDefinitionsBuilder(G_MUL)
182 .legalFor({s8, s16, s32})
183 .legalFor(Is64Bit, {s64})
184 .legalFor(HasSSE2, {v8s16})
185 .legalFor(HasSSE41, {v4s32})
186 .legalFor(HasAVX2, {v16s16, v8s32})
187 .legalFor(HasAVX512, {v16s32})
188 .legalFor(HasDQI, {v8s64})
189 .legalFor(HasDQI && HasVLX, {v2s64, v4s64})
190 .legalFor(HasBWI, {v32s16})
191 .clampMinNumElements(0, s16, 8)
192 .clampMinNumElements(0, s32, 4)
193 .clampMinNumElements(0, s64, HasVLX ? 2 : 8)
194 .clampMaxNumElements(0, s16, HasBWI ? 32 : (HasAVX2 ? 16 : 8))
195 .clampMaxNumElements(0, s32, HasAVX512 ? 16 : (HasAVX2 ? 8 : 4))
196 .clampMaxNumElements(0, s64, 8)
197 .widenScalarToNextPow2(0, /*Min=*/32)
198 .clampScalar(0, s8, sMaxScalar)
199 .scalarize(0);
200
201 getActionDefinitionsBuilder({G_SMULH, G_UMULH})
202 .legalFor({s8, s16, s32})
203 .legalFor(Is64Bit, {s64})
204 .widenScalarToNextPow2(0, /*Min=*/32)
205 .clampScalar(0, s8, sMaxScalar)
206 .scalarize(0);
207
208 // integer divisions
209 getActionDefinitionsBuilder({G_SDIV, G_SREM, G_UDIV, G_UREM})
210 .legalFor({s8, s16, s32})
211 .legalFor(Is64Bit, {s64})
212 .libcallFor({s64})
213 .clampScalar(0, s8, sMaxScalar);
214
215 // integer shifts
216 getActionDefinitionsBuilder({G_SHL, G_LSHR, G_ASHR})
217 .legalFor({{s8, s8}, {s16, s8}, {s32, s8}})
218 .legalFor(Is64Bit, {{s64, s8}})
219 .clampScalar(0, s8, sMaxScalar)
220 .clampScalar(1, s8, s8);
221
222 // integer logic
223 getActionDefinitionsBuilder({G_AND, G_OR, G_XOR})
224 .legalFor({s8, s16, s32})
225 .legalFor(Is64Bit, {s64})
226 .legalFor(HasSSE2, {v16s8, v8s16, v4s32, v2s64})
227 .legalFor(HasAVX, {v32s8, v16s16, v8s32, v4s64})
228 .legalFor(HasAVX512, {v64s8, v32s16, v16s32, v8s64})
229 .clampMinNumElements(0, s8, 16)
230 .clampMinNumElements(0, s16, 8)
231 .clampMinNumElements(0, s32, 4)
232 .clampMinNumElements(0, s64, 2)
233 .clampMaxNumElements(0, s8, HasAVX512 ? 64 : (HasAVX ? 32 : 16))
234 .clampMaxNumElements(0, s16, HasAVX512 ? 32 : (HasAVX ? 16 : 8))
235 .clampMaxNumElements(0, s32, HasAVX512 ? 16 : (HasAVX ? 8 : 4))
236 .clampMaxNumElements(0, s64, HasAVX512 ? 8 : (HasAVX ? 4 : 2))
237 .widenScalarToNextPow2(0, /*Min=*/32)
238 .clampScalar(0, s8, sMaxScalar)
239 .scalarize(0);
240
241 // integer comparison
242 const std::initializer_list<LLT> IntTypes32 = {s8, s16, s32, p0};
243 const std::initializer_list<LLT> IntTypes64 = {s8, s16, s32, s64, p0};
244
245 getActionDefinitionsBuilder(G_ICMP)
246 .legalForCartesianProduct({s8}, Is64Bit ? IntTypes64 : IntTypes32)
247 .clampScalar(0, s8, s8)
248 .clampScalar(1, s8, sMaxScalar);
249
250 // bswap
251 getActionDefinitionsBuilder(G_BSWAP)
252 .legalFor({s32})
253 .legalFor(Is64Bit, {s64})
254 .widenScalarToNextPow2(0, /*Min=*/32)
255 .clampScalar(0, s32, sMaxScalar);
256
257 // popcount
258 getActionDefinitionsBuilder(G_CTPOP)
259 .legalFor(HasPOPCNT, {{s16, s16}, {s32, s32}})
260 .legalFor(HasPOPCNT && Is64Bit, {{s64, s64}})
261 .widenScalarToNextPow2(1, /*Min=*/16)
262 .clampScalar(1, s16, sMaxScalar)
263 .scalarSameSizeAs(0, 1);
264
265 // count leading zeros (LZCNT)
266 getActionDefinitionsBuilder(G_CTLZ)
267 .legalFor(HasLZCNT, {{s16, s16}, {s32, s32}})
268 .legalFor(HasLZCNT && Is64Bit, {{s64, s64}})
269 .widenScalarToNextPow2(1, /*Min=*/16)
270 .clampScalar(1, s16, sMaxScalar)
271 .scalarSameSizeAs(0, 1);
272
273 // count trailing zeros
274 getActionDefinitionsBuilder(G_CTTZ_ZERO_UNDEF)
275 .legalFor({{s16, s16}, {s32, s32}})
276 .legalFor(Is64Bit, {{s64, s64}})
277 .widenScalarToNextPow2(1, /*Min=*/16)
278 .clampScalar(1, s16, sMaxScalar)
279 .scalarSameSizeAs(0, 1);
280
281 getActionDefinitionsBuilder(G_CTTZ)
282 .legalFor(HasBMI, {{s16, s16}, {s32, s32}})
283 .legalFor(HasBMI && Is64Bit, {{s64, s64}})
284 .widenScalarToNextPow2(1, /*Min=*/16)
285 .clampScalar(1, s16, sMaxScalar)
286 .scalarSameSizeAs(0, 1);
287
288 // control flow
289 getActionDefinitionsBuilder(G_PHI)
290 .legalFor({s8, s16, s32, p0})
291 .legalFor(UseX87, {s80})
292 .legalFor(Is64Bit, {s64})
293 .legalFor(HasSSE1, {v16s8, v8s16, v4s32, v2s64})
294 .legalFor(HasAVX, {v32s8, v16s16, v8s32, v4s64})
295 .legalFor(HasAVX512, {v64s8, v32s16, v16s32, v8s64})
296 .clampMinNumElements(0, s8, 16)
297 .clampMinNumElements(0, s16, 8)
298 .clampMinNumElements(0, s32, 4)
299 .clampMinNumElements(0, s64, 2)
300 .clampMaxNumElements(0, s8, HasAVX512 ? 64 : (HasAVX ? 32 : 16))
301 .clampMaxNumElements(0, s16, HasAVX512 ? 32 : (HasAVX ? 16 : 8))
302 .clampMaxNumElements(0, s32, HasAVX512 ? 16 : (HasAVX ? 8 : 4))
303 .clampMaxNumElements(0, s64, HasAVX512 ? 8 : (HasAVX ? 4 : 2))
304 .widenScalarToNextPow2(0, /*Min=*/32)
305 .clampScalar(0, s8, sMaxScalar)
306 .scalarize(0);
307
308 getActionDefinitionsBuilder(G_BRCOND).legalFor({s1});
309
310 // pointer handling
311 const std::initializer_list<LLT> PtrTypes32 = {s1, s8, s16, s32};
312 const std::initializer_list<LLT> PtrTypes64 = {s1, s8, s16, s32, s64};
313
314 getActionDefinitionsBuilder(G_PTRTOINT)
315 .legalForCartesianProduct(Is64Bit ? PtrTypes64 : PtrTypes32, {p0})
316 .maxScalar(0, sMaxScalar)
317 .widenScalarToNextPow2(0, /*Min*/ 8);
318
319 getActionDefinitionsBuilder(G_INTTOPTR).legalFor({{p0, sMaxScalar}});
320
321 getActionDefinitionsBuilder(G_CONSTANT_POOL).legalFor({p0});
322
323 getActionDefinitionsBuilder(G_PTR_ADD)
324 .legalFor({{p0, s32}})
325 .legalFor(Is64Bit, {{p0, s64}})
326 .widenScalarToNextPow2(1, /*Min*/ 32)
327 .clampScalar(1, s32, sMaxScalar);
328
329 getActionDefinitionsBuilder({G_FRAME_INDEX, G_GLOBAL_VALUE}).legalFor({p0});
330
331 // load/store: add more corner cases
332 for (unsigned Op : {G_LOAD, G_STORE}) {
333 auto &Action = getActionDefinitionsBuilder(Op);
334 Action.legalForTypesWithMemDesc({{s8, p0, s8, 1},
335 {s16, p0, s16, 1},
336 {s32, p0, s32, 1},
337 {s80, p0, s80, 1},
338 {p0, p0, p0, 1},
339 {v4s8, p0, v4s8, 1}});
340 if (Is64Bit)
341 Action.legalForTypesWithMemDesc(
342 {{s64, p0, s64, 1}, {v2s32, p0, v2s32, 1}});
343
344 if (HasSSE1)
345 Action.legalForTypesWithMemDesc({{v4s32, p0, v4s32, 1}});
346 if (HasSSE2)
347 Action.legalForTypesWithMemDesc({{v16s8, p0, v16s8, 1},
348 {v8s16, p0, v8s16, 1},
349 {v2s64, p0, v2s64, 1},
350 {v2p0, p0, v2p0, 1}});
351 if (HasAVX)
352 Action.legalForTypesWithMemDesc({{v32s8, p0, v32s8, 1},
353 {v16s16, p0, v16s16, 1},
354 {v8s32, p0, v8s32, 1},
355 {v4s64, p0, v4s64, 1},
356 {v4p0, p0, v4p0, 1}});
357 if (HasAVX512)
358 Action.legalForTypesWithMemDesc({{v64s8, p0, v64s8, 1},
359 {v32s16, p0, v32s16, 1},
360 {v16s32, p0, v16s32, 1},
361 {v8s64, p0, v8s64, 1}});
362
363 // X86 supports extending loads but not stores for GPRs
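    // e.g. an s32 G_LOAD with an s8 memory type is legal (an any-extending
    // load), whereas a G_STORE whose value type is wider than its memory type
    // is sent to the custom handler (legalizeNarrowingStore) below.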
364 if (Op == G_LOAD) {
365 Action.legalForTypesWithMemDesc({{s8, p0, s1, 1},
366 {s16, p0, s8, 1},
367 {s32, p0, s8, 1},
368 {s32, p0, s16, 1}});
369 if (Is64Bit)
370 Action.legalForTypesWithMemDesc(
371 {{s64, p0, s8, 1}, {s64, p0, s16, 1}, {s64, p0, s32, 1}});
372 } else {
373 Action.customIf([=](const LegalityQuery &Query) {
374 return Query.Types[0] != Query.MMODescrs[0].MemoryTy;
375 });
376 }
377 Action.widenScalarToNextPow2(0, /*Min=*/8)
378 .clampScalar(0, s8, sMaxScalar)
379 .scalarize(0);
380 }
381
382 for (unsigned Op : {G_SEXTLOAD, G_ZEXTLOAD}) {
383 auto &Action = getActionDefinitionsBuilder(Op);
384 Action.legalForTypesWithMemDesc(
385 {{s16, p0, s8, 1}, {s32, p0, s8, 1}, {s32, p0, s16, 1}});
386 if (Is64Bit)
387 Action.legalForTypesWithMemDesc(
388 {{s64, p0, s8, 1}, {s64, p0, s16, 1}, {s64, p0, s32, 1}});
389 // TODO - SSE41/AVX2/AVX512F/AVX512BW vector extensions
390 }
391
392 // sext, zext, and anyext
393 getActionDefinitionsBuilder(G_ANYEXT)
394 .legalFor({s8, s16, s32, s128})
395 .legalFor(Is64Bit, {s64})
396 .widenScalarToNextPow2(0, /*Min=*/8)
397 .clampScalar(0, s8, sMaxScalar)
398 .widenScalarToNextPow2(1, /*Min=*/8)
399 .clampScalar(1, s8, sMaxScalar)
400 .scalarize(0);
401
402 getActionDefinitionsBuilder({G_SEXT, G_ZEXT})
403 .legalFor({s8, s16, s32})
404 .legalFor(Is64Bit, {s64})
405 .widenScalarToNextPow2(0, /*Min=*/8)
406 .clampScalar(0, s8, sMaxScalar)
407 .widenScalarToNextPow2(1, /*Min=*/8)
408 .clampScalar(1, s8, sMaxScalar)
409 .scalarize(0);
410
411 getActionDefinitionsBuilder(G_SEXT_INREG).lower();
412
413 // fp constants
414 getActionDefinitionsBuilder(G_FCONSTANT)
415 .legalFor({s32, s64})
416 .legalFor(UseX87, {s80});
417
418 // fp arithmetic
419 getActionDefinitionsBuilder({G_FADD, G_FSUB, G_FMUL, G_FDIV})
420 .legalFor({s32, s64})
421 .legalFor(HasSSE1, {v4s32})
422 .legalFor(HasSSE2, {v2s64})
423 .legalFor(HasAVX, {v8s32, v4s64})
424 .legalFor(HasAVX512, {v16s32, v8s64})
425 .legalFor(UseX87, {s80});
426
428 .legalFor(UseX87, {s80})
429 .legalFor(UseX87 && !Is64Bit, {s64})
430 .lower();
431
432 // fp comparison
433 getActionDefinitionsBuilder(G_FCMP)
434 .legalFor(HasSSE1 || UseX87, {s8, s32})
435 .legalFor(HasSSE2 || UseX87, {s8, s64})
436 .legalFor(UseX87, {s8, s80})
437 .clampScalar(0, s8, s8)
438 .clampScalar(1, s32, HasSSE2 ? s64 : s32)
439 .widenScalarToNextPow2(1);
440
441 // fp conversions
442 getActionDefinitionsBuilder(G_FPEXT)
443 .legalFor(HasSSE2, {{s64, s32}})
444 .legalFor(HasAVX, {{v4s64, v4s32}})
445 .legalFor(HasAVX512, {{v8s64, v8s32}});
446
447 getActionDefinitionsBuilder(G_FPTRUNC)
448 .legalFor(HasSSE2, {{s32, s64}})
449 .legalFor(HasAVX, {{v4s32, v4s64}})
450 .legalFor(HasAVX512, {{v8s32, v8s64}});
451
452 getActionDefinitionsBuilder(G_SITOFP)
453 .legalFor(HasSSE1, {{s32, s32}})
454 .legalFor(HasSSE1 && Is64Bit, {{s32, s64}})
455 .legalFor(HasSSE2, {{s64, s32}})
456 .legalFor(HasSSE2 && Is64Bit, {{s64, s64}})
457 .clampScalar(1, (UseX87 && !HasSSE1) ? s16 : s32, sMaxScalar)
458 .widenScalarToNextPow2(1)
459 .customForCartesianProduct(UseX87, {s32, s64, s80}, {s16, s32, s64})
460 .clampScalar(0, s32, HasSSE2 ? s64 : s32)
461 .widenScalarToNextPow2(0);
462
463 getActionDefinitionsBuilder(G_FPTOSI)
464 .legalFor(HasSSE1, {{s32, s32}})
465 .legalFor(HasSSE1 && Is64Bit, {{s64, s32}})
466 .legalFor(HasSSE2, {{s32, s64}})
467 .legalFor(HasSSE2 && Is64Bit, {{s64, s64}})
468 .clampScalar(0, (UseX87 && !HasSSE1) ? s16 : s32, sMaxScalar)
469 .widenScalarToNextPow2(0)
470 .customForCartesianProduct(UseX87, {s16, s32, s64}, {s32, s64, s80})
471 .clampScalar(1, s32, HasSSE2 ? s64 : s32)
472 .widenScalarToNextPow2(1);
473
474 // For G_UITOFP and G_FPTOUI without AVX512, types <= s32 have to be custom
475 // legalized before they are widened. Otherwise the custom handler cannot
476 // tell whether an s32 is an original type that must be promoted to s64, or
477 // whether it was produced by widening and must not be widened to s64 again.
478 //
479 // With AVX512 we simply widen the types, since the opcodes map directly to
480 // machine instructions.
481 getActionDefinitionsBuilder(G_UITOFP)
482 .legalFor(HasAVX512, {{s32, s32}, {s32, s64}, {s64, s32}, {s64, s64}})
483 .customIf([=](const LegalityQuery &Query) {
484 return !HasAVX512 &&
485 ((HasSSE1 && typeIs(0, s32)(Query)) ||
486 (HasSSE2 && typeIs(0, s64)(Query))) &&
487 scalarNarrowerThan(1, Is64Bit ? 64 : 32)(Query);
488 })
489 .lowerIf([=](const LegalityQuery &Query) {
490 // Lower conversions from s64
491 return !HasAVX512 &&
492 ((HasSSE1 && typeIs(0, s32)(Query)) ||
493 (HasSSE2 && typeIs(0, s64)(Query))) &&
494 (Is64Bit && typeIs(1, s64)(Query));
495 })
496 .clampScalar(0, s32, HasSSE2 ? s64 : s32)
497 .widenScalarToNextPow2(0)
498 .clampScalar(1, s32, sMaxScalar)
499 .widenScalarToNextPow2(1);
500
501 getActionDefinitionsBuilder(G_FPTOUI)
502 .legalFor(HasAVX512, {{s32, s32}, {s32, s64}, {s64, s32}, {s64, s64}})
503 .customIf([=](const LegalityQuery &Query) {
504 return !HasAVX512 &&
505 ((HasSSE1 && typeIs(1, s32)(Query)) ||
506 (HasSSE2 && typeIs(1, s64)(Query))) &&
507 scalarNarrowerThan(0, Is64Bit ? 64 : 32)(Query);
508 })
509 // TODO: replace with customized legalization using
510 // specifics of cvttsd2si. The selection of this node requires
511 // a vector type. Either G_SCALAR_TO_VECTOR is needed or more advanced
512 // support of G_BUILD_VECTOR/G_INSERT_VECTOR_ELT is required beforehand.
513 .lowerIf([=](const LegalityQuery &Query) {
514 return !HasAVX512 &&
515 ((HasSSE1 && typeIs(1, s32)(Query)) ||
516 (HasSSE2 && typeIs(1, s64)(Query))) &&
517 (Is64Bit && typeIs(0, s64)(Query));
518 })
519 .clampScalar(0, s32, sMaxScalar)
520 .widenScalarToNextPow2(0)
521 .clampScalar(1, s32, HasSSE2 ? s64 : s32)
522 .widenScalarToNextPow2(1);
523
524 // vector ops
525 getActionDefinitionsBuilder(G_BUILD_VECTOR)
526 .customIf([=](const LegalityQuery &Query) {
527 return (HasSSE1 && typeInSet(0, {v4s32})(Query)) ||
528 (HasSSE2 && typeInSet(0, {v2s64, v8s16, v16s8})(Query)) ||
529 (HasAVX && typeInSet(0, {v4s64, v8s32, v16s16, v32s8})(Query)) ||
530 (HasAVX512 && typeInSet(0, {v8s64, v16s32, v32s16, v64s8})(Query));
531 })
532 .clampNumElements(0, v16s8, s8MaxVector)
533 .clampNumElements(0, v8s16, s16MaxVector)
534 .clampNumElements(0, v4s32, s32MaxVector)
535 .clampNumElements(0, v2s64, s64MaxVector)
536 .moreElementsToNextPow2(0);
537
538 getActionDefinitionsBuilder({G_EXTRACT, G_INSERT})
539 .legalIf([=](const LegalityQuery &Query) {
540 unsigned SubIdx = Query.Opcode == G_EXTRACT ? 0 : 1;
541 unsigned FullIdx = Query.Opcode == G_EXTRACT ? 1 : 0;
542 return (HasAVX && typePairInSet(SubIdx, FullIdx,
543 {{v16s8, v32s8},
544 {v8s16, v16s16},
545 {v4s32, v8s32},
546 {v2s64, v4s64}})(Query)) ||
547 (HasAVX512 && typePairInSet(SubIdx, FullIdx,
548 {{v16s8, v64s8},
549 {v32s8, v64s8},
550 {v8s16, v32s16},
551 {v16s16, v32s16},
552 {v4s32, v16s32},
553 {v8s32, v16s32},
554 {v2s64, v8s64},
555 {v4s64, v8s64}})(Query));
556 });
557
558 // todo: only permit dst types up to max legal vector register size?
559 getActionDefinitionsBuilder(G_CONCAT_VECTORS)
560 .legalFor(
561 HasSSE1,
562 {{v32s8, v16s8}, {v16s16, v8s16}, {v8s32, v4s32}, {v4s64, v2s64}})
563 .legalFor(HasAVX, {{v64s8, v16s8},
564 {v64s8, v32s8},
565 {v32s16, v8s16},
566 {v32s16, v16s16},
567 {v16s32, v4s32},
568 {v16s32, v8s32},
569 {v8s64, v2s64},
570 {v8s64, v4s64}});
571
572 // todo: vectors and address spaces
573 getActionDefinitionsBuilder(G_SELECT)
574 .legalFor({{s8, s32}, {s16, s32}, {s32, s32}, {s64, s32}, {p0, s32}})
575 .widenScalarToNextPow2(0, /*Min=*/8)
576 .clampScalar(0, HasCMOV ? s16 : s8, sMaxScalar)
577 .clampScalar(1, s32, s32);
578
579 // memory intrinsics
580 getActionDefinitionsBuilder({G_MEMCPY, G_MEMMOVE, G_MEMSET}).libcall();
581
582 getActionDefinitionsBuilder({G_DYN_STACKALLOC, G_STACKSAVE, G_STACKRESTORE})
583 .lower();
584
585 // fp intrinsics
586 getActionDefinitionsBuilder({G_INTRINSIC_ROUNDEVEN, G_INTRINSIC_TRUNC})
587 .scalarize(0)
588 .minScalar(0, LLT::scalar(32))
589 .libcall();
590
591 getActionDefinitionsBuilder({G_FREEZE, G_CONSTANT_FOLD_BARRIER})
592 .legalFor({s8, s16, s32, s64, p0})
593 .widenScalarToNextPow2(0, /*Min=*/8)
594 .clampScalar(0, s8, sMaxScalar);
595
596 getLegacyLegalizerInfo().computeTables();
597 verify(*STI.getInstrInfo());
598}
599
600bool X86LegalizerInfo::legalizeCustom(LegalizerHelper &Helper, MachineInstr &MI,
601 LostDebugLocObserver &LocObserver) const {
602 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
603 MachineRegisterInfo &MRI = *MIRBuilder.getMRI();
604 switch (MI.getOpcode()) {
605 default:
606 // No idea what to do.
607 return false;
608 case TargetOpcode::G_BUILD_VECTOR:
609 return legalizeBuildVector(MI, MRI, Helper);
610 case TargetOpcode::G_FPTOUI:
611 return legalizeFPTOUI(MI, MRI, Helper);
612 case TargetOpcode::G_UITOFP:
613 return legalizeUITOFP(MI, MRI, Helper);
614 case TargetOpcode::G_STORE:
615 return legalizeNarrowingStore(MI, MRI, Helper);
616 case TargetOpcode::G_SITOFP:
617 return legalizeSITOFP(MI, MRI, Helper);
618 case TargetOpcode::G_FPTOSI:
619 return legalizeFPTOSI(MI, MRI, Helper);
620 case TargetOpcode::G_GET_ROUNDING:
621 return legalizeGETROUNDING(MI, MRI, Helper);
622 case TargetOpcode::G_SET_ROUNDING:
623 return legalizeSETROUNDING(MI, MRI, Helper);
624 }
625 llvm_unreachable("expected switch to return");
626}
627
628bool X86LegalizerInfo::legalizeSITOFP(MachineInstr &MI,
629 MachineRegisterInfo &MRI,
630 LegalizerHelper &Helper) const {
631 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
632 MachineFunction &MF = *MI.getMF();
633 auto [Dst, DstTy, Src, SrcTy] = MI.getFirst2RegLLTs();
634
635 assert((SrcTy.getSizeInBits() == 16 || SrcTy.getSizeInBits() == 32 ||
636 SrcTy.getSizeInBits() == 64) &&
637 "Unexpected source type for SITOFP in X87 mode.");
638
639 TypeSize MemSize = SrcTy.getSizeInBytes();
640 MachinePointerInfo PtrInfo;
641 Align Alignmt = Helper.getStackTemporaryAlignment(SrcTy);
642 auto SlotPointer = Helper.createStackTemporary(MemSize, Alignmt, PtrInfo);
643 MachineMemOperand *StoreMMO = MF.getMachineMemOperand(
644 PtrInfo, MachineMemOperand::MOStore, MemSize, Align(MemSize));
645
646 // Store the integer value on the FPU stack.
647 MIRBuilder.buildStore(Src, SlotPointer, *StoreMMO);
648
649 MachineMemOperand *LoadMMO = MF.getMachineMemOperand(
650 PtrInfo, MachineMemOperand::MOLoad, MemSize, Align(MemSize));
651 MIRBuilder.buildInstr(X86::G_FILD)
652 .addDef(Dst)
653 .addUse(SlotPointer.getReg(0))
654 .addMemOperand(LoadMMO);
655
656 MI.eraseFromParent();
657 return true;
658}
659
660bool X86LegalizerInfo::legalizeFPTOSI(MachineInstr &MI,
661 MachineRegisterInfo &MRI,
662 LegalizerHelper &Helper) const {
663 MachineFunction &MF = *MI.getMF();
664 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
665 auto [Dst, DstTy, Src, SrcTy] = MI.getFirst2RegLLTs();
666
667 TypeSize MemSize = DstTy.getSizeInBytes();
668 MachinePointerInfo PtrInfo;
669 Align Alignmt = Helper.getStackTemporaryAlignment(DstTy);
670 auto SlotPointer = Helper.createStackTemporary(MemSize, Alignmt, PtrInfo);
671 MachineMemOperand *StoreMMO = MF.getMachineMemOperand(
672 PtrInfo, MachineMemOperand::MOStore, MemSize, Align(MemSize));
673
674 MIRBuilder.buildInstr(X86::G_FIST)
675 .addUse(Src)
676 .addUse(SlotPointer.getReg(0))
677 .addMemOperand(StoreMMO);
678
679 MIRBuilder.buildLoad(Dst, SlotPointer, PtrInfo, Align(MemSize));
680 MI.eraseFromParent();
681 return true;
682}
683
684bool X86LegalizerInfo::legalizeBuildVector(MachineInstr &MI,
685 MachineRegisterInfo &MRI,
686 LegalizerHelper &Helper) const {
687 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
688 const auto &BuildVector = cast<GBuildVector>(MI);
689 Register Dst = BuildVector.getReg(0);
690 LLT DstTy = MRI.getType(Dst);
691 MachineFunction &MF = MIRBuilder.getMF();
692 LLVMContext &Ctx = MF.getFunction().getContext();
693 uint64_t DstTySize = DstTy.getScalarSizeInBits();
694
695 SmallVector<Constant *, 16> CstIdxs;
696 for (unsigned i = 0; i < BuildVector.getNumSources(); ++i) {
697 Register Source = BuildVector.getSourceReg(i);
698
699 auto ValueAndReg = getIConstantVRegValWithLookThrough(Source, MRI);
700 if (ValueAndReg) {
701 CstIdxs.emplace_back(ConstantInt::get(Ctx, ValueAndReg->Value));
702 continue;
703 }
704
705 auto FPValueAndReg = getFConstantVRegValWithLookThrough(Source, MRI);
706 if (FPValueAndReg) {
707 CstIdxs.emplace_back(ConstantFP::get(Ctx, FPValueAndReg->Value));
708 continue;
709 }
710
711 if (getOpcodeDef<GImplicitDef>(Source, MRI)) {
712 CstIdxs.emplace_back(UndefValue::get(Type::getIntNTy(Ctx, DstTySize)));
713 continue;
714 }
715 return false;
716 }
717
718 Constant *ConstVal = ConstantVector::get(CstIdxs);
719
720 const DataLayout &DL = MIRBuilder.getDataLayout();
721 unsigned AddrSpace = DL.getDefaultGlobalsAddressSpace();
722 Align Alignment(DL.getABITypeAlign(ConstVal->getType()));
723 auto Addr = MIRBuilder.buildConstantPool(
724 LLT::pointer(AddrSpace, DL.getPointerSizeInBits(AddrSpace)),
725 MF.getConstantPool()->getConstantPoolIndex(ConstVal, Alignment));
726 MachineMemOperand *MMO =
727 MF.getMachineMemOperand(MachinePointerInfo::getConstantPool(MF),
728 MachineMemOperand::MOLoad, DstTy, Alignment);
729
730 MIRBuilder.buildLoad(Dst, Addr, *MMO);
731 MI.eraseFromParent();
732 return true;
733}
734
735bool X86LegalizerInfo::legalizeFPTOUI(MachineInstr &MI,
736 MachineRegisterInfo &MRI,
737 LegalizerHelper &Helper) const {
738 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
739 auto [Dst, DstTy, Src, SrcTy] = MI.getFirst2RegLLTs();
740 unsigned DstSizeInBits = DstTy.getScalarSizeInBits();
741 const LLT s32 = LLT::scalar(32);
742 const LLT s64 = LLT::scalar(64);
743
744 // Simply reuse FPTOSI when it is possible to widen the type
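  // e.g. for an s16 result, G_FPTOSI to s32 covers the whole unsigned 16-bit
  // range (0..65535 fits in a signed 32-bit value), so truncating the wider
  // signed conversion yields the correct unsigned result.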
745 if (DstSizeInBits <= 32) {
746 auto Casted = MIRBuilder.buildFPTOSI(DstTy == s32 ? s64 : s32, Src);
747 MIRBuilder.buildTrunc(Dst, Casted);
748 MI.eraseFromParent();
749 return true;
750 }
751
752 return false;
753}
754
755bool X86LegalizerInfo::legalizeUITOFP(MachineInstr &MI,
756 MachineRegisterInfo &MRI,
757 LegalizerHelper &Helper) const {
758 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
759 auto [Dst, DstTy, Src, SrcTy] = MI.getFirst2RegLLTs();
760 const LLT s32 = LLT::scalar(32);
761 const LLT s64 = LLT::scalar(64);
762
763 // Simply reuse SITOFP when it is possible to widen the type
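  // e.g. a u32 value zero extended to s64 is always non-negative, so the
  // signed s64 -> fp conversion produces exactly the unsigned value.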
764 if (SrcTy.getSizeInBits() <= 32) {
765 auto Ext = MIRBuilder.buildZExt(SrcTy == s32 ? s64 : s32, Src);
766 MIRBuilder.buildSITOFP(Dst, Ext);
767 MI.eraseFromParent();
768 return true;
769 }
770
771 return false;
772}
773
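// A G_STORE whose value type is wider than its memory type (e.g. an s8 value
// stored with an s1 MMO) is legalized by widening the MMO to the value type,
// so the whole value is written.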
774bool X86LegalizerInfo::legalizeNarrowingStore(MachineInstr &MI,
775 MachineRegisterInfo &MRI,
776 LegalizerHelper &Helper) const {
777 auto &Store = cast<GStore>(MI);
778 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
779 MachineMemOperand &MMO = **Store.memoperands_begin();
780 MachineFunction &MF = MIRBuilder.getMF();
781 LLT ValTy = MRI.getType(Store.getValueReg());
782 auto *NewMMO = MF.getMachineMemOperand(&MMO, MMO.getPointerInfo(), ValTy);
783
784 Helper.Observer.changingInstr(Store);
785 Store.setMemRefs(MF, {NewMMO});
786 Helper.Observer.changedInstr(Store);
787 return true;
788}
789
790bool X86LegalizerInfo::legalizeGETROUNDING(MachineInstr &MI,
791 MachineRegisterInfo &MRI,
792 LegalizerHelper &Helper) const {
793 /*
794 The rounding mode is in bits 11:10 of FPSR, and has the following
795 settings:
796 00 Round to nearest
797 01 Round to -inf
798 10 Round to +inf
799 11 Round to 0
800
801 GET_ROUNDING, on the other hand, expects the following:
802 -1 Undefined
803 0 Round to 0
804 1 Round to nearest
805 2 Round to +inf
806 3 Round to -inf
807
808 To perform the conversion, we use a packed lookup table of the four 2-bit
809 values that we can index by FPSR[11:10]
810 0x2d --> (0b00,10,11,01) --> (0,2,3,1) >> FPSR[11:10]
811
812 (0x2d >> ((FPSR >> 9) & 6)) & 3
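  For example, with FPSR[11:10] = 10 (round to +inf): (FPSR >> 9) & 6 = 4,
  and (0x2d >> 4) & 3 = 2, which is the GET_ROUNDING value for +inf.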
813 */
814
815 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
816 MachineFunction &MF = MIRBuilder.getMF();
817 Register Dst = MI.getOperand(0).getReg();
818 LLT DstTy = MRI.getType(Dst);
819 const LLT s8 = LLT::scalar(8);
820 const LLT s16 = LLT::scalar(16);
821 const LLT s32 = LLT::scalar(32);
822
823 // Save FP Control Word to stack slot
824 int MemSize = 2;
825 Align Alignment = Align(2);
826 MachinePointerInfo PtrInfo;
827 auto StackTemp = Helper.createStackTemporary(TypeSize::getFixed(MemSize),
828 Alignment, PtrInfo);
829 Register StackPtr = StackTemp.getReg(0);
830
831 auto StoreMMO = MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOStore,
832 MemSize, Alignment);
833
834 // Store FP Control Word to stack slot using G_FNSTCW16
835 MIRBuilder.buildInstr(X86::G_FNSTCW16)
836 .addUse(StackPtr)
837 .addMemOperand(StoreMMO);
838
839 // Load FP Control Word from stack slot
840 auto LoadMMO = MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOLoad,
841 MemSize, Alignment);
842
843 auto CWD32 =
844 MIRBuilder.buildZExt(s32, MIRBuilder.buildLoad(s16, StackPtr, *LoadMMO));
845 auto Shifted8 = MIRBuilder.buildTrunc(
846 s8, MIRBuilder.buildLShr(s32, CWD32, MIRBuilder.buildConstant(s8, 9)));
847 auto Masked32 = MIRBuilder.buildZExt(
848 s32, MIRBuilder.buildAnd(s8, Shifted8, MIRBuilder.buildConstant(s8, 6)));
849
850 // LUT is a packed lookup table (0x2d) used to map the 2-bit x87 FPU rounding
851 // mode (from bits 11:10 of the control word) to the values expected by
852 // GET_ROUNDING. The mapping is performed by shifting LUT right by the
853 // extracted rounding mode and masking the result with 3 to obtain the final value.
854 auto LUT = MIRBuilder.buildConstant(s32, 0x2d);
855 auto LUTShifted = MIRBuilder.buildLShr(s32, LUT, Masked32);
856 auto RetVal =
857 MIRBuilder.buildAnd(s32, LUTShifted, MIRBuilder.buildConstant(s32, 3));
858 auto RetValTrunc = MIRBuilder.buildZExtOrTrunc(DstTy, RetVal);
859
860 MIRBuilder.buildCopy(Dst, RetValTrunc);
861
862 MI.eraseFromParent();
863 return true;
864}
865
866bool X86LegalizerInfo::legalizeSETROUNDING(MachineInstr &MI,
867 MachineRegisterInfo &MRI,
868 LegalizerHelper &Helper) const {
869 MachineIRBuilder &MIRBuilder = Helper.MIRBuilder;
870 MachineFunction &MF = MIRBuilder.getMF();
871 Register Src = MI.getOperand(0).getReg();
872 const LLT s8 = LLT::scalar(8);
873 const LLT s16 = LLT::scalar(16);
874 const LLT s32 = LLT::scalar(32);
875
876 // Allocate stack slot for control word and MXCSR (4 bytes).
877 int MemSize = 4;
878 Align Alignment = Align(4);
879 MachinePointerInfo PtrInfo;
880 auto StackTemp = Helper.createStackTemporary(TypeSize::getFixed(MemSize),
881 Alignment, PtrInfo);
882 Register StackPtr = StackTemp.getReg(0);
883
884 auto StoreMMO =
885 MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOStore, 2, Align(2));
886 MIRBuilder.buildInstr(X86::G_FNSTCW16)
887 .addUse(StackPtr)
888 .addMemOperand(StoreMMO);
889
890 auto LoadMMO =
891 MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOLoad, 2, Align(2));
892 auto CWD16 = MIRBuilder.buildLoad(s16, StackPtr, *LoadMMO);
893
894 // Clear RM field (bits 11:10)
895 auto ClearedCWD =
896 MIRBuilder.buildAnd(s16, CWD16, MIRBuilder.buildConstant(s16, 0xf3ff));
897
898 // Check if Src is a constant
899 auto *SrcDef = MRI.getVRegDef(Src);
900 Register RMBits;
901 Register MXCSRRMBits;
902
903 if (SrcDef && SrcDef->getOpcode() == TargetOpcode::G_CONSTANT) {
904 uint64_t RM = getIConstantFromReg(Src, MRI).getZExtValue();
905 int FieldVal = X86::getRoundingModeX86(RM);
906
907 if (FieldVal == X86::rmInvalid) {
908 FieldVal = X86::rmToNearest;
909 LLVMContext &C = MF.getFunction().getContext();
910 C.diagnose(DiagnosticInfoUnsupported(
911 MF.getFunction(), "rounding mode is not supported by X86 hardware",
912 DiagnosticLocation(MI.getDebugLoc()), DS_Error));
913 return false;
914 }
915
916 FieldVal = FieldVal << 3;
917 RMBits = MIRBuilder.buildConstant(s16, FieldVal).getReg(0);
918 MXCSRRMBits = MIRBuilder.buildConstant(s32, FieldVal).getReg(0);
919 } else {
920 // Convert Src (rounding mode) to bits for control word
921 // (0xc9 << (2 * Src + 4)) & 0xc00
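    // e.g. Src = 2 (round to +inf): shift amount = 2*2 + 4 = 8,
    // 0xc9 << 8 = 0xc900, and 0xc900 & 0xc00 = 0x800, i.e. control-word
    // rounding bits 11:10 = 10b.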
922 auto Src32 = MIRBuilder.buildZExtOrTrunc(s32, Src);
923 auto ShiftAmt = MIRBuilder.buildAdd(
924 s32, MIRBuilder.buildShl(s32, Src32, MIRBuilder.buildConstant(s32, 1)),
925 MIRBuilder.buildConstant(s32, 4));
926 auto ShiftAmt8 = MIRBuilder.buildTrunc(s8, ShiftAmt);
927 auto Shifted = MIRBuilder.buildShl(s16, MIRBuilder.buildConstant(s16, 0xc9),
928 ShiftAmt8);
929 RMBits =
930 MIRBuilder.buildAnd(s16, Shifted, MIRBuilder.buildConstant(s16, 0xc00))
931 .getReg(0);
932
933 // For non-constant case, we still need to compute MXCSR bits dynamically
934 auto RMBits32 = MIRBuilder.buildZExt(s32, RMBits);
935 MXCSRRMBits =
936 MIRBuilder.buildShl(s32, RMBits32, MIRBuilder.buildConstant(s32, 3))
937 .getReg(0);
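    // Shifting the control-word RM field (bits 11:10) left by 3 moves it to
    // bits 14:13, which is where MXCSR keeps its rounding-mode field.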
938 }
939 // Update rounding mode bits
940 auto NewCWD =
941 MIRBuilder.buildOr(s16, ClearedCWD, RMBits, MachineInstr::Disjoint);
942
943 // Store new FP Control Word to stack
944 auto StoreNewMMO =
945 MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOStore, 2, Align(2));
946 MIRBuilder.buildStore(NewCWD, StackPtr, *StoreNewMMO);
947
948 // Load FP control word from the slot using G_FLDCW16
949 auto LoadNewMMO =
950 MF.getMachineMemOperand(PtrInfo, MachineMemOperand::MOLoad, 2, Align(2));
951 MIRBuilder.buildInstr(X86::G_FLDCW16)
952 .addUse(StackPtr)
953 .addMemOperand(LoadNewMMO);
954
955 if (Subtarget.hasSSE1()) {
956 // Store MXCSR to stack (use STMXCSR)
957 auto StoreMXCSRMMO = MF.getMachineMemOperand(
958 PtrInfo, MachineMemOperand::MOStore, 4, Align(4));
959 MIRBuilder.buildInstr(TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS)
960 .addIntrinsicID(Intrinsic::x86_sse_stmxcsr)
961 .addUse(StackPtr)
962 .addMemOperand(StoreMXCSRMMO);
963
964 // Load MXCSR from stack
965 auto LoadMXCSRMMO = MF.getMachineMemOperand(
966 PtrInfo, MachineMemOperand::MOLoad, 4, Align(4));
967 auto MXCSR = MIRBuilder.buildLoad(s32, StackPtr, *LoadMXCSRMMO);
968
969 // Clear RM field (bits 14:13)
970 auto ClearedMXCSR = MIRBuilder.buildAnd(
971 s32, MXCSR, MIRBuilder.buildConstant(s32, 0xffff9fff));
972
973 // Update rounding mode bits
974 auto NewMXCSR = MIRBuilder.buildOr(s32, ClearedMXCSR, MXCSRRMBits);
975
976 // Store new MXCSR to stack
977 auto StoreNewMXCSRMMO = MF.getMachineMemOperand(
978 PtrInfo, MachineMemOperand::MOStore, 4, Align(4));
979 MIRBuilder.buildStore(NewMXCSR, StackPtr, *StoreNewMXCSRMMO);
980
981 // Load MXCSR from stack (use LDMXCSR)
982 auto LoadNewMXCSRMMO = MF.getMachineMemOperand(
983 PtrInfo, MachineMemOperand::MOLoad, 4, Align(4));
984 MIRBuilder.buildInstr(TargetOpcode::G_INTRINSIC_W_SIDE_EFFECTS)
985 .addIntrinsicID(Intrinsic::x86_sse_ldmxcsr)
986 .addUse(StackPtr)
987 .addMemOperand(LoadNewMXCSRMMO);
988 }
989
990 MI.eraseFromParent();
991 return true;
992}
993
994bool X86LegalizerInfo::legalizeIntrinsic(LegalizerHelper &Helper,
995 MachineInstr &MI) const {
996 return true;
997}