Target/ARM/ARMLegalizerInfo.cpp

311116Sdim//===- ARMLegalizerInfo.cpp --------------------------------------*- C++ -*-==//
311116Sdim//
353358Sdim// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
353358Sdim// See https://llvm.org/LICENSE.txt for license information.
353358Sdim// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
311116Sdim//
311116Sdim//===----------------------------------------------------------------------===//
311116Sdim/// \file
311116Sdim/// This file implements the targeting of the MachineLegalizer class for ARM.
311116Sdim/// \todo This should be generated by TableGen.
311116Sdim//===----------------------------------------------------------------------===//
311116Sdim
311116Sdim#include "ARMLegalizerInfo.h"
321369Sdim#include "ARMCallLowering.h"
321369Sdim#include "ARMSubtarget.h"
321369Sdim#include "llvm/CodeGen/GlobalISel/LegalizerHelper.h"
321369Sdim#include "llvm/CodeGen/LowLevelType.h"
321369Sdim#include "llvm/CodeGen/MachineRegisterInfo.h"
327952Sdim#include "llvm/CodeGen/TargetOpcodes.h"
311116Sdim#include "llvm/CodeGen/ValueTypes.h"
311116Sdim#include "llvm/IR/DerivedTypes.h"
311116Sdim#include "llvm/IR/Type.h"
311116Sdim
311116Sdimusing namespace llvm;
341825Sdimusing namespace LegalizeActions;
311116Sdim
327952Sdim/// FIXME: The following static functions are SizeChangeStrategy functions
327952Sdim/// that are meant to temporarily mimic the behaviour of the old legalization
327952Sdim/// based on doubling/halving non-legal types as closely as possible. This is
327952Sdim/// not entirely possible as only legalizing the types that are exactly a power
327952Sdim/// of 2 times the size of the legal types would require specifying all those
327952Sdim/// sizes explicitly.
327952Sdim/// In practice, not specifying those isn't a problem, and the below functions
327952Sdim/// should disappear quickly as we add support for legalizing non-power-of-2
327952Sdim/// sized types further.
///
/// Appends every entry of \p v to \p result, in order. After an entry, an
/// extra {first + 1, Unsupported} entry is appended as well, but only when
/// \p v has a following entry and that following entry does not already start
/// at first + 1. Nothing is appended after the last entry of \p v.
///
/// \param result vector that receives the copied and the filler entries.
/// \param v      entries to copy; going by the SizeAndActionsVec name, the
///               `first` member of each entry is presumably a bit size.
327952Sdimstatic void
327952SdimaddAndInterleaveWithUnsupported(LegalizerInfo::SizeAndActionsVec &result,
327952Sdim                                const LegalizerInfo::SizeAndActionsVec &v) {
327952Sdim  for (unsigned i = 0; i < v.size(); ++i) {
327952Sdim    result.push_back(v[i]);
    // Add the Unsupported filler only if there is a successor and it leaves a
    // gap after this entry.
    // NOTE(review): the first clause compares the index (i + 1) with the
    // entry's `first` value rather than with another index - confirm that this
    // is intended.
327952Sdim    if (i + 1 < v[i].first && i + 1 < v.size() &&
327952Sdim        v[i + 1].first != v[i].first + 1)
341825Sdim      result.push_back({v[i].first + 1, Unsupported});
327952Sdim  }
327952Sdim}
311116Sdim
/// Size-change strategy that the constructor in this file installs for type
/// index 0 of G_SREM and G_UREM.
///
/// The returned vector starts with a fixed prefix that marks 8 and 16 as
/// WidenScalar and 1, 9 and 17 as Unsupported, continues with the entries of
/// \p v (interleaved with Unsupported fillers by
/// addAndInterleaveWithUnsupported), and ends with one more Unsupported entry
/// placed right after the largest `first` value seen.
///
/// \param v existing entries; must be non-empty and its first entry must have
///          `first` greater than 17 (both are asserted).
/// \returns the combined vector described above.
327952Sdimstatic LegalizerInfo::SizeAndActionsVec
327952Sdimwiden_8_16(const LegalizerInfo::SizeAndActionsVec &v) {
327952Sdim  assert(v.size() >= 1);
  // The fixed prefix below ends at 17, so the caller's entries must start
  // after it.
327952Sdim  assert(v[0].first > 17);
341825Sdim  LegalizerInfo::SizeAndActionsVec result = {{1, Unsupported},
341825Sdim                                             {8, WidenScalar},
341825Sdim                                             {9, Unsupported},
341825Sdim                                             {16, WidenScalar},
341825Sdim                                             {17, Unsupported}};
327952Sdim  addAndInterleaveWithUnsupported(result, v);
  // Close the table with an Unsupported entry just past the last one added.
327952Sdim  auto Largest = result.back().first;
341825Sdim  result.push_back({Largest + 1, Unsupported});
327952Sdim  return result;
327952Sdim}
327952Sdim
/// Returns true when \p ST reports any of the three AEABI target flavours
/// checked below (AEABI, GNU AEABI or Musl AEABI). Used in this file to pick
/// between the AEABI and the GNU libcall handling.
321369Sdimstatic bool AEABI(const ARMSubtarget &ST) {
321369Sdim  return ST.isTargetAEABI() || ST.isTargetGNUAEABI() || ST.isTargetMuslAEABI();
321369Sdim}
321369Sdim
/// Registers the legalization rules for ARM, selected by the features that
/// \p ST reports (NEON, hardware divide, VFP2/VFP4, soft-float, V5T, AEABI).
/// For Thumb1-only subtargets no rules are added here; the tables are only
/// computed and verified before returning.
321369SdimARMLegalizerInfo::ARMLegalizerInfo(const ARMSubtarget &ST) {
311116Sdim  using namespace TargetOpcode;
311116Sdim
  // Short names for the low-level types used by the rules below: a 32-bit
  // pointer in address space 0 and scalars of 1, 8, 16, 32 and 64 bits.
311116Sdim  const LLT p0 = LLT::pointer(0, 32);
311116Sdim
321369Sdim  const LLT s1 = LLT::scalar(1);
311116Sdim  const LLT s8 = LLT::scalar(8);
311116Sdim  const LLT s16 = LLT::scalar(16);
311116Sdim  const LLT s32 = LLT::scalar(32);
321369Sdim  const LLT s64 = LLT::scalar(64);
311116Sdim
344779Sdim  if (ST.isThumb1Only()) {
344779Sdim    // Thumb1 is not supported yet.
344779Sdim    computeTables();
344779Sdim    verify(*ST.getInstrInfo());
344779Sdim    return;
344779Sdim  }
311116Sdim
  // Integer extensions: every pairing of the first type list with the second
  // one is legal.
344779Sdim  getActionDefinitionsBuilder({G_SEXT, G_ZEXT, G_ANYEXT})
353358Sdim      .legalForCartesianProduct({s8, s16, s32}, {s1, s8, s16});
344779Sdim
360784Sdim  getActionDefinitionsBuilder(G_SEXT_INREG).lower();
360784Sdim
  // Integer arithmetic and bitwise operations are legal on s32 only.
353358Sdim  getActionDefinitionsBuilder({G_MUL, G_AND, G_OR, G_XOR})
341825Sdim      .legalFor({s32})
341825Sdim      .minScalar(0, s32);
311116Sdim
  // G_ADD/G_SUB additionally accept s64 when NEON is available.
353358Sdim  if (ST.hasNEON())
353358Sdim    getActionDefinitionsBuilder({G_ADD, G_SUB})
353358Sdim        .legalFor({s32, s64})
353358Sdim        .minScalar(0, s32);
353358Sdim  else
353358Sdim    getActionDefinitionsBuilder({G_ADD, G_SUB})
353358Sdim        .legalFor({s32})
353358Sdim        .minScalar(0, s32);
344779Sdim
  // Shifts: legal for the {s32, s32} type pair; type index 1 is clamped to
  // exactly s32.
353358Sdim  getActionDefinitionsBuilder({G_ASHR, G_LSHR, G_SHL})
353358Sdim    .legalFor({{s32, s32}})
353358Sdim    .minScalar(0, s32)
353358Sdim    .clampScalar(1, s32, s32);
344779Sdim
  // Hardware divide is queried for the mode in use: the ARM-mode flag when
  // not in Thumb, the Thumb-mode flag otherwise.
353358Sdim  bool HasHWDivide = (!ST.isThumb() && ST.hasDivideInARMMode()) ||
353358Sdim                     (ST.isThumb() && ST.hasDivideInThumbMode());
  // s32 division is legal with hardware divide and a libcall without it.
353358Sdim  if (HasHWDivide)
341825Sdim    getActionDefinitionsBuilder({G_SDIV, G_UDIV})
341825Sdim        .legalFor({s32})
341825Sdim        .clampScalar(0, s32, s32);
341825Sdim  else
341825Sdim    getActionDefinitionsBuilder({G_SDIV, G_UDIV})
341825Sdim        .libcallFor({s32})
341825Sdim        .clampScalar(0, s32, s32);
311116Sdim
  // s32 remainder: lowered when hardware divide exists, custom-legalized on
  // AEABI targets (handled by legalizeCustom in this file), and a plain
  // libcall otherwise. Other scalar sizes go through widen_8_16.
321369Sdim  for (unsigned Op : {G_SREM, G_UREM}) {
327952Sdim    setLegalizeScalarToDifferentSizeStrategy(Op, 0, widen_8_16);
353358Sdim    if (HasHWDivide)
321369Sdim      setAction({Op, s32}, Lower);
321369Sdim    else if (AEABI(ST))
321369Sdim      setAction({Op, s32}, Custom);
321369Sdim    else
321369Sdim      setAction({Op, s32}, Libcall);
321369Sdim  }
321369Sdim
  // Pointer <-> integer conversions between p0 and s32.
353358Sdim  getActionDefinitionsBuilder(G_INTTOPTR)
353358Sdim      .legalFor({{p0, s32}})
353358Sdim      .minScalar(1, s32);
353358Sdim  getActionDefinitionsBuilder(G_PTRTOINT)
353358Sdim      .legalFor({{s32, p0}})
353358Sdim      .minScalar(0, s32);
321369Sdim
353358Sdim  getActionDefinitionsBuilder(G_CONSTANT)
353358Sdim      .legalFor({s32, p0})
353358Sdim      .clampScalar(0, s32, s32);
327952Sdim
  // Integer compare: s1 paired with s32 or p0.
341825Sdim  getActionDefinitionsBuilder(G_ICMP)
341825Sdim      .legalForCartesianProduct({s1}, {s32, p0})
341825Sdim      .minScalar(1, s32);
321369Sdim
  // Select: s32 or p0 paired with s1.
353358Sdim  getActionDefinitionsBuilder(G_SELECT)
353358Sdim      .legalForCartesianProduct({s32, p0}, {s1})
353358Sdim      .minScalar(0, s32);
353358Sdim
341825Sdim  // We're keeping these builders around because we'll want to add support for
341825Sdim  // floating point to them.
353358Sdim  auto &LoadStoreBuilder = getActionDefinitionsBuilder({G_LOAD, G_STORE})
353358Sdim                               .legalForTypesWithMemDesc({{s1, p0, 8, 8},
353358Sdim                                                          {s8, p0, 8, 8},
353358Sdim                                                          {s16, p0, 16, 8},
353358Sdim                                                          {s32, p0, 32, 8},
353358Sdim                                                          {p0, p0, 32, 8}})
353358Sdim                               .unsupportedIfMemSizeNotPow2();
353358Sdim
353358Sdim  getActionDefinitionsBuilder(G_FRAME_INDEX).legalFor({p0});
353358Sdim  getActionDefinitionsBuilder(G_GLOBAL_VALUE).legalFor({p0});
353358Sdim
341825Sdim  auto &PhiBuilder =
353358Sdim      getActionDefinitionsBuilder(G_PHI)
353358Sdim          .legalFor({s32, p0})
353358Sdim          .minScalar(0, s32);
341825Sdim
360784Sdim  getActionDefinitionsBuilder(G_PTR_ADD)
353358Sdim      .legalFor({{p0, s32}})
353358Sdim      .minScalar(1, s32);
353358Sdim
353358Sdim  getActionDefinitionsBuilder(G_BRCOND).legalFor({s1});
353358Sdim
  // Floating point. When soft-float is off and VFP2 is available, the FP
  // operations are legal on s32/s64; otherwise they become libcalls, custom
  // actions or lowerings.
353358Sdim  if (!ST.useSoftFloat() && ST.hasVFP2Base()) {
341825Sdim    getActionDefinitionsBuilder(
341825Sdim        {G_FADD, G_FSUB, G_FMUL, G_FDIV, G_FCONSTANT, G_FNEG})
341825Sdim        .legalFor({s32, s64});
321369Sdim
    // Extend the load/store and phi rules created above with s64.
353358Sdim    LoadStoreBuilder
353358Sdim        .legalForTypesWithMemDesc({{s64, p0, 64, 32}})
353358Sdim        .maxScalar(0, s32);
341825Sdim    PhiBuilder.legalFor({s64});
321369Sdim
341825Sdim    getActionDefinitionsBuilder(G_FCMP).legalForCartesianProduct({s1},
341825Sdim                                                                 {s32, s64});
327952Sdim
341825Sdim    getActionDefinitionsBuilder(G_MERGE_VALUES).legalFor({{s64, s32}});
341825Sdim    getActionDefinitionsBuilder(G_UNMERGE_VALUES).legalFor({{s32, s64}});
341825Sdim
341825Sdim    getActionDefinitionsBuilder(G_FPEXT).legalFor({{s64, s32}});
341825Sdim    getActionDefinitionsBuilder(G_FPTRUNC).legalFor({{s32, s64}});
341825Sdim
341825Sdim    getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
341825Sdim        .legalForCartesianProduct({s32}, {s32, s64});
341825Sdim    getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
341825Sdim        .legalForCartesianProduct({s32, s64}, {s32});
321369Sdim  } else {
341825Sdim    getActionDefinitionsBuilder({G_FADD, G_FSUB, G_FMUL, G_FDIV})
341825Sdim        .libcallFor({s32, s64});
321369Sdim
341825Sdim    LoadStoreBuilder.maxScalar(0, s32);
321369Sdim
341825Sdim    for (auto Ty : {s32, s64})
341825Sdim      setAction({G_FNEG, Ty}, Lower);
341825Sdim
    // G_FCONSTANT and G_FCMP are handled by legalizeCustom in this file.
341825Sdim    getActionDefinitionsBuilder(G_FCONSTANT).customFor({s32, s64});
341825Sdim
341825Sdim    getActionDefinitionsBuilder(G_FCMP).customForCartesianProduct({s1},
341825Sdim                                                                  {s32, s64});
341825Sdim
    // Fill the per-predicate libcall tables that the custom G_FCMP
    // legalization reads.
321369Sdim    if (AEABI(ST))
321369Sdim      setFCmpLibcallsAEABI();
321369Sdim    else
321369Sdim      setFCmpLibcallsGNU();
341825Sdim
341825Sdim    getActionDefinitionsBuilder(G_FPEXT).libcallFor({{s64, s32}});
341825Sdim    getActionDefinitionsBuilder(G_FPTRUNC).libcallFor({{s32, s64}});
341825Sdim
341825Sdim    getActionDefinitionsBuilder({G_FPTOSI, G_FPTOUI})
341825Sdim        .libcallForCartesianProduct({s32}, {s32, s64});
341825Sdim    getActionDefinitionsBuilder({G_SITOFP, G_UITOFP})
341825Sdim        .libcallForCartesianProduct({s32, s64}, {s32});
321369Sdim  }
321369Sdim
  // G_FMA is legal only when soft-float is off and VFP4 is available.
353358Sdim  if (!ST.useSoftFloat() && ST.hasVFP4Base())
341825Sdim    getActionDefinitionsBuilder(G_FMA).legalFor({s32, s64});
341825Sdim  else
341825Sdim    getActionDefinitionsBuilder(G_FMA).libcallFor({s32, s64});
321369Sdim
  // G_FREM and G_FPOW are libcalls regardless of the FP features.
341825Sdim  getActionDefinitionsBuilder({G_FREM, G_FPOW}).libcallFor({s32, s64});
341825Sdim
  // Count-leading-zeros. With V5T ops G_CTLZ is legal and the ZERO_UNDEF
  // variant is lowered; without them the ZERO_UNDEF variant is a libcall and
  // G_CTLZ is lowered.
  // NOTE(review): `{s32, s32}` below lists the same type twice; other rules in
  // this function spell a type pair as `{{s32, s32}}` - confirm which one is
  // intended.
353358Sdim  if (ST.hasV5TOps()) {
353358Sdim    getActionDefinitionsBuilder(G_CTLZ)
353358Sdim        .legalFor({s32, s32})
353358Sdim        .clampScalar(1, s32, s32)
353358Sdim        .clampScalar(0, s32, s32);
353358Sdim    getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)
353358Sdim        .lowerFor({s32, s32})
353358Sdim        .clampScalar(1, s32, s32)
353358Sdim        .clampScalar(0, s32, s32);
353358Sdim  } else {
353358Sdim    getActionDefinitionsBuilder(G_CTLZ_ZERO_UNDEF)
353358Sdim        .libcallFor({s32, s32})
353358Sdim        .clampScalar(1, s32, s32)
353358Sdim        .clampScalar(0, s32, s32);
353358Sdim    getActionDefinitionsBuilder(G_CTLZ)
353358Sdim        .lowerFor({s32, s32})
353358Sdim        .clampScalar(1, s32, s32)
353358Sdim        .clampScalar(0, s32, s32);
353358Sdim  }
353358Sdim
311116Sdim  computeTables();
341825Sdim  verify(*ST.getInstrInfo());
311116Sdim}
321369Sdim
/// Fills FCmp32Libcalls and FCmp64Libcalls for AEABI targets.
///
/// Both tables are indexed by floating-point predicate. Each slot holds one or
/// two {libcall, integer predicate} entries that legalizeCustom in this file
/// consumes: BAD_ICMP_PREDICATE makes it truncate the libcall result as is,
/// any other predicate makes it compare the libcall result against zero with
/// that predicate, and the results of a two-entry slot are OR-ed together.
///
/// In this variant the ordered predicates use the libcall result directly,
/// while FCMP_ORD, FCMP_UNE and the unordered-or-relational predicates test
/// the result of the opposite libcall for equality with zero.
321369Sdimvoid ARMLegalizerInfo::setFCmpLibcallsAEABI() {
321369Sdim  // FCMP_TRUE and FCMP_FALSE don't need libcalls, they should be
321369Sdim  // default-initialized.
  // 32-bit operands.
321369Sdim  FCmp32Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OEQ] = {
321369Sdim      {RTLIB::OEQ_F32, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OGE] = {
321369Sdim      {RTLIB::OGE_F32, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OGT] = {
321369Sdim      {RTLIB::OGT_F32, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OLE] = {
321369Sdim      {RTLIB::OLE_F32, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OLT] = {
321369Sdim      {RTLIB::OLT_F32, CmpInst::BAD_ICMP_PREDICATE}};
  // From here on each predicate is expressed as "the opposite libcall
  // returned zero".
360784Sdim  FCmp32Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UNO] = {
321369Sdim      {RTLIB::UO_F32, CmpInst::BAD_ICMP_PREDICATE}};
  // FCMP_ONE and FCMP_UEQ need two libcalls each.
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ONE] = {
321369Sdim      {RTLIB::OGT_F32, CmpInst::BAD_ICMP_PREDICATE},
321369Sdim      {RTLIB::OLT_F32, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UEQ] = {
321369Sdim      {RTLIB::OEQ_F32, CmpInst::BAD_ICMP_PREDICATE},
321369Sdim      {RTLIB::UO_F32, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim
  // 64-bit operands: same layout as above with the F64 libcalls.
321369Sdim  FCmp64Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OEQ] = {
321369Sdim      {RTLIB::OEQ_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OGE] = {
321369Sdim      {RTLIB::OGE_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OGT] = {
321369Sdim      {RTLIB::OGT_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OLE] = {
321369Sdim      {RTLIB::OLE_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OLT] = {
321369Sdim      {RTLIB::OLT_F64, CmpInst::BAD_ICMP_PREDICATE}};
360784Sdim  FCmp64Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UNO] = {
321369Sdim      {RTLIB::UO_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ONE] = {
321369Sdim      {RTLIB::OGT_F64, CmpInst::BAD_ICMP_PREDICATE},
321369Sdim      {RTLIB::OLT_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UEQ] = {
321369Sdim      {RTLIB::OEQ_F64, CmpInst::BAD_ICMP_PREDICATE},
321369Sdim      {RTLIB::UO_F64, CmpInst::BAD_ICMP_PREDICATE}};
321369Sdim}
321369Sdim
/// Fills FCmp32Libcalls and FCmp64Libcalls for non-AEABI targets.
///
/// Both tables are indexed by floating-point predicate. Each slot holds one or
/// two {libcall, integer predicate} entries that legalizeCustom in this file
/// consumes; here every entry carries a real integer predicate, so each
/// libcall result is always compared against zero with that predicate. The
/// results of a two-entry slot are OR-ed together.
321369Sdimvoid ARMLegalizerInfo::setFCmpLibcallsGNU() {
321369Sdim  // FCMP_TRUE and FCMP_FALSE don't need libcalls, they should be
321369Sdim  // default-initialized.
  // 32-bit operands.
321369Sdim  FCmp32Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OEQ] = {{RTLIB::OEQ_F32, CmpInst::ICMP_EQ}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OGE] = {{RTLIB::OGE_F32, CmpInst::ICMP_SGE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OGT] = {{RTLIB::OGT_F32, CmpInst::ICMP_SGT}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OLE] = {{RTLIB::OLE_F32, CmpInst::ICMP_SLE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_OLT] = {{RTLIB::OLT_F32, CmpInst::ICMP_SLT}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F32, CmpInst::ICMP_EQ}};
  // The unordered-or-relational predicates call the opposite ordered libcall
  // and keep the signed predicate matching the original relation.
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F32, CmpInst::ICMP_SGE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F32, CmpInst::ICMP_SGT}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F32, CmpInst::ICMP_SLE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F32, CmpInst::ICMP_SLT}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F32, CmpInst::ICMP_NE}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UNO] = {{RTLIB::UO_F32, CmpInst::ICMP_NE}};
  // FCMP_ONE and FCMP_UEQ need two libcalls each.
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_ONE] = {{RTLIB::OGT_F32, CmpInst::ICMP_SGT},
321369Sdim                                       {RTLIB::OLT_F32, CmpInst::ICMP_SLT}};
321369Sdim  FCmp32Libcalls[CmpInst::FCMP_UEQ] = {{RTLIB::OEQ_F32, CmpInst::ICMP_EQ},
321369Sdim                                       {RTLIB::UO_F32, CmpInst::ICMP_NE}};
321369Sdim
  // 64-bit operands: same layout as above with the F64 libcalls.
321369Sdim  FCmp64Libcalls.resize(CmpInst::LAST_FCMP_PREDICATE + 1);
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OEQ] = {{RTLIB::OEQ_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OGE] = {{RTLIB::OGE_F64, CmpInst::ICMP_SGE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OGT] = {{RTLIB::OGT_F64, CmpInst::ICMP_SGT}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OLE] = {{RTLIB::OLE_F64, CmpInst::ICMP_SLE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_OLT] = {{RTLIB::OLT_F64, CmpInst::ICMP_SLT}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ORD] = {{RTLIB::UO_F64, CmpInst::ICMP_EQ}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UGE] = {{RTLIB::OLT_F64, CmpInst::ICMP_SGE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UGT] = {{RTLIB::OLE_F64, CmpInst::ICMP_SGT}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ULE] = {{RTLIB::OGT_F64, CmpInst::ICMP_SLE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ULT] = {{RTLIB::OGE_F64, CmpInst::ICMP_SLT}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UNE] = {{RTLIB::UNE_F64, CmpInst::ICMP_NE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UNO] = {{RTLIB::UO_F64, CmpInst::ICMP_NE}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_ONE] = {{RTLIB::OGT_F64, CmpInst::ICMP_SGT},
321369Sdim                                       {RTLIB::OLT_F64, CmpInst::ICMP_SLT}};
321369Sdim  FCmp64Libcalls[CmpInst::FCMP_UEQ] = {{RTLIB::OEQ_F64, CmpInst::ICMP_EQ},
321369Sdim                                       {RTLIB::UO_F64, CmpInst::ICMP_NE}};
321369Sdim}
321369Sdim
/// Looks up the libcall list recorded for a floating-point predicate.
///
/// \param Predicate floating-point comparison predicate (asserted to be one).
/// \param Size      operand size in bits; only 32 and 64 are handled, any
///                  other value reaches llvm_unreachable.
/// \returns a copy of the FCmp32Libcalls or FCmp64Libcalls slot for
///          \p Predicate, depending on \p Size.
321369SdimARMLegalizerInfo::FCmpLibcallsList
321369SdimARMLegalizerInfo::getFCmpLibcalls(CmpInst::Predicate Predicate,
321369Sdim                                  unsigned Size) const {
321369Sdim  assert(CmpInst::isFPPredicate(Predicate) && "Unsupported FCmp predicate");
321369Sdim  if (Size == 32)
321369Sdim    return FCmp32Libcalls[Predicate];
321369Sdim  if (Size == 64)
321369Sdim    return FCmp64Libcalls[Predicate];
321369Sdim  llvm_unreachable("Unsupported size for FCmp predicate");
321369Sdim}
321369Sdim
/// Custom legalization for G_SREM/G_UREM, G_FCMP and G_FCONSTANT.
///
/// \param MI         instruction to legalize; erased when the function
///                   returns true.
/// \param MRI        register info used to query types and to create new
///                   generic virtual registers.
/// \param MIRBuilder builder used to emit the replacement code; its insertion
///                   point is set to \p MI.
/// \param Observer   not used in this function.
/// \returns false for any other opcode, for a remainder whose result is not
///          32 bits wide, and when createLibcall does not report Legalized;
///          true otherwise.
321369Sdimbool ARMLegalizerInfo::legalizeCustom(MachineInstr &MI,
321369Sdim                                      MachineRegisterInfo &MRI,
344779Sdim                                      MachineIRBuilder &MIRBuilder,
344779Sdim                                      GISelChangeObserver &Observer) const {
321369Sdim  using namespace TargetOpcode;
321369Sdim
321369Sdim  MIRBuilder.setInstr(MI);
321369Sdim  LLVMContext &Ctx = MIRBuilder.getMF().getFunction().getContext();
321369Sdim
321369Sdim  switch (MI.getOpcode()) {
321369Sdim  default:
321369Sdim    return false;
321369Sdim  case G_SREM:
321369Sdim  case G_UREM: {
353358Sdim    Register OriginalResult = MI.getOperand(0).getReg();
    // Only 32-bit remainders are handled here.
321369Sdim    auto Size = MRI.getType(OriginalResult).getSizeInBits();
321369Sdim    if (Size != 32)
321369Sdim      return false;
321369Sdim
    // Signed and unsigned remainders use different divrem libcalls.
321369Sdim    auto Libcall =
321369Sdim        MI.getOpcode() == G_SREM ? RTLIB::SDIVREM_I32 : RTLIB::UDIVREM_I32;
321369Sdim
321369Sdim    // Our divmod libcalls return a struct containing the quotient and the
353358Sdim    // remainder. Create a new, unused register for the quotient and use the
353358Sdim    // destination of the original instruction for the remainder.
321369Sdim    Type *ArgTy = Type::getInt32Ty(Ctx);
321369Sdim    StructType *RetTy = StructType::get(Ctx, {ArgTy, ArgTy}, /* Packed */ true);
353358Sdim    Register RetRegs[] = {MRI.createGenericVirtualRegister(LLT::scalar(32)),
353358Sdim                          OriginalResult};
353358Sdim    auto Status = createLibcall(MIRBuilder, Libcall, {RetRegs, RetTy},
321369Sdim                                {{MI.getOperand(1).getReg(), ArgTy},
321369Sdim                                 {MI.getOperand(2).getReg(), ArgTy}});
321369Sdim    if (Status != LegalizerHelper::Legalized)
321369Sdim      return false;
321369Sdim    break;
321369Sdim  }
321369Sdim  case G_FCMP: {
321369Sdim    assert(MRI.getType(MI.getOperand(2).getReg()) ==
321369Sdim               MRI.getType(MI.getOperand(3).getReg()) &&
321369Sdim           "Mismatched operands for G_FCMP");
321369Sdim    auto OpSize = MRI.getType(MI.getOperand(2).getReg()).getSizeInBits();
321369Sdim
321369Sdim    auto OriginalResult = MI.getOperand(0).getReg();
321369Sdim    auto Predicate =
321369Sdim        static_cast<CmpInst::Predicate>(MI.getOperand(1).getPredicate());
321369Sdim    auto Libcalls = getFCmpLibcalls(Predicate, OpSize);
321369Sdim
    // An empty list is only expected for FCMP_TRUE and FCMP_FALSE, which are
    // replaced by the constant 1 or 0 without any libcall.
321369Sdim    if (Libcalls.empty()) {
321369Sdim      assert((Predicate == CmpInst::FCMP_TRUE ||
321369Sdim              Predicate == CmpInst::FCMP_FALSE) &&
321369Sdim             "Predicate needs libcalls, but none specified");
321369Sdim      MIRBuilder.buildConstant(OriginalResult,
321369Sdim                               Predicate == CmpInst::FCMP_TRUE ? 1 : 0);
321369Sdim      MI.eraseFromParent();
321369Sdim      return true;
321369Sdim    }
321369Sdim
321369Sdim    assert((OpSize == 32 || OpSize == 64) && "Unsupported operand size");
321369Sdim    auto *ArgTy = OpSize == 32 ? Type::getFloatTy(Ctx) : Type::getDoubleTy(Ctx);
321369Sdim    auto *RetTy = Type::getInt32Ty(Ctx);
321369Sdim
    // Emit one libcall per table entry and collect the processed results.
353358Sdim    SmallVector<Register, 2> Results;
321369Sdim    for (auto Libcall : Libcalls) {
321369Sdim      auto LibcallResult = MRI.createGenericVirtualRegister(LLT::scalar(32));
321369Sdim      auto Status =
321369Sdim          createLibcall(MIRBuilder, Libcall.LibcallID, {LibcallResult, RetTy},
321369Sdim                        {{MI.getOperand(2).getReg(), ArgTy},
321369Sdim                         {MI.getOperand(3).getReg(), ArgTy}});
321369Sdim
321369Sdim      if (Status != LegalizerHelper::Legalized)
321369Sdim        return false;
321369Sdim
      // With a single libcall the processed value goes straight into the
      // original destination; with several, each one gets a fresh register of
      // the destination's type and they are combined after the loop.
321369Sdim      auto ProcessedResult =
321369Sdim          Libcalls.size() == 1
321369Sdim              ? OriginalResult
321369Sdim              : MRI.createGenericVirtualRegister(MRI.getType(OriginalResult));
321369Sdim
321369Sdim      // We have a result, but we need to transform it into a proper 1-bit 0 or
321369Sdim      // 1, taking into account the different peculiarities of the values
321369Sdim      // returned by the comparison functions.
321369Sdim      CmpInst::Predicate ResultPred = Libcall.Predicate;
321369Sdim      if (ResultPred == CmpInst::BAD_ICMP_PREDICATE) {
321369Sdim        // We have a nice 0 or 1, and we just need to truncate it back to 1 bit
321369Sdim        // to keep the types consistent.
321369Sdim        MIRBuilder.buildTrunc(ProcessedResult, LibcallResult);
321369Sdim      } else {
321369Sdim        // We need to compare against 0.
321369Sdim        assert(CmpInst::isIntPredicate(ResultPred) && "Unsupported predicate");
321369Sdim        auto Zero = MRI.createGenericVirtualRegister(LLT::scalar(32));
321369Sdim        MIRBuilder.buildConstant(Zero, 0);
321369Sdim        MIRBuilder.buildICmp(ResultPred, ProcessedResult, LibcallResult, Zero);
321369Sdim      }
321369Sdim      Results.push_back(ProcessedResult);
321369Sdim    }
321369Sdim
    // Two partial results are OR-ed into the original destination.
321369Sdim    if (Results.size() != 1) {
321369Sdim      assert(Results.size() == 2 && "Unexpected number of results");
321369Sdim      MIRBuilder.buildOr(OriginalResult, Results[0], Results[1]);
321369Sdim    }
321369Sdim    break;
321369Sdim  }
341825Sdim  case G_FCONSTANT: {
341825Sdim    // Convert to integer constants, while preserving the binary representation.
341825Sdim    auto AsInteger =
341825Sdim        MI.getOperand(1).getFPImm()->getValueAPF().bitcastToAPInt();
341825Sdim    MIRBuilder.buildConstant(MI.getOperand(0).getReg(),
341825Sdim                             *ConstantInt::get(Ctx, AsInteger));
341825Sdim    break;
321369Sdim  }
341825Sdim  }
321369Sdim
  // Shared exit for the cases that break out of the switch: the replacement
  // code has been emitted, so the original instruction is removed.
321369Sdim  MI.eraseFromParent();
321369Sdim  return true;
321369Sdim}