Path: blob/main/contrib/llvm-project/llvm/lib/Target/ARM/ARMCallLowering.cpp
35294 views
//===- llvm/lib/Target/ARM/ARMCallLowering.cpp - Call lowering ------------===//1//2// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.3// See https://llvm.org/LICENSE.txt for license information.4// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception5//6//===----------------------------------------------------------------------===//7//8/// \file9/// This file implements the lowering of LLVM calls to machine code calls for10/// GlobalISel.11//12//===----------------------------------------------------------------------===//1314#include "ARMCallLowering.h"15#include "ARMBaseInstrInfo.h"16#include "ARMISelLowering.h"17#include "ARMSubtarget.h"18#include "Utils/ARMBaseInfo.h"19#include "llvm/ADT/SmallVector.h"20#include "llvm/CodeGen/Analysis.h"21#include "llvm/CodeGen/CallingConvLower.h"22#include "llvm/CodeGen/GlobalISel/MachineIRBuilder.h"23#include "llvm/CodeGen/GlobalISel/Utils.h"24#include "llvm/CodeGen/LowLevelTypeUtils.h"25#include "llvm/CodeGen/MachineBasicBlock.h"26#include "llvm/CodeGen/MachineFrameInfo.h"27#include "llvm/CodeGen/MachineFunction.h"28#include "llvm/CodeGen/MachineInstrBuilder.h"29#include "llvm/CodeGen/MachineMemOperand.h"30#include "llvm/CodeGen/MachineOperand.h"31#include "llvm/CodeGen/MachineRegisterInfo.h"32#include "llvm/CodeGen/TargetRegisterInfo.h"33#include "llvm/CodeGen/TargetSubtargetInfo.h"34#include "llvm/CodeGen/ValueTypes.h"35#include "llvm/CodeGenTypes/LowLevelType.h"36#include "llvm/CodeGenTypes/MachineValueType.h"37#include "llvm/IR/Attributes.h"38#include "llvm/IR/DataLayout.h"39#include "llvm/IR/DerivedTypes.h"40#include "llvm/IR/Function.h"41#include "llvm/IR/Type.h"42#include "llvm/IR/Value.h"43#include "llvm/Support/Casting.h"44#include <algorithm>45#include <cassert>46#include <cstdint>47#include <functional>48#include <utility>4950using namespace llvm;5152// Whether Big-endian GISel is enabled, defaults to off, can be enabled for53// testing.54static cl::opt<bool>55EnableGISelBigEndian("enable-arm-gisel-bigendian", cl::Hidden,56cl::init(false),57cl::desc("Enable Global-ISel Big Endian Lowering"));5859ARMCallLowering::ARMCallLowering(const ARMTargetLowering &TLI)60: CallLowering(&TLI) {}6162static bool isSupportedType(const DataLayout &DL, const ARMTargetLowering &TLI,63Type *T) {64if (T->isArrayTy())65return isSupportedType(DL, TLI, T->getArrayElementType());6667if (T->isStructTy()) {68// For now we only allow homogeneous structs that we can manipulate with69// G_MERGE_VALUES and G_UNMERGE_VALUES70auto StructT = cast<StructType>(T);71for (unsigned i = 1, e = StructT->getNumElements(); i != e; ++i)72if (StructT->getElementType(i) != StructT->getElementType(0))73return false;74return isSupportedType(DL, TLI, StructT->getElementType(0));75}7677EVT VT = TLI.getValueType(DL, T, true);78if (!VT.isSimple() || VT.isVector() ||79!(VT.isInteger() || VT.isFloatingPoint()))80return false;8182unsigned VTSize = VT.getSimpleVT().getSizeInBits();8384if (VTSize == 64)85// FIXME: Support i64 too86return VT.isFloatingPoint();8788return VTSize == 1 || VTSize == 8 || VTSize == 16 || VTSize == 32;89}9091namespace {9293/// Helper class for values going out through an ABI boundary (used for handling94/// function return values and call parameters).95struct ARMOutgoingValueHandler : public CallLowering::OutgoingValueHandler {96ARMOutgoingValueHandler(MachineIRBuilder &MIRBuilder,97MachineRegisterInfo &MRI, MachineInstrBuilder &MIB)98: OutgoingValueHandler(MIRBuilder, MRI), MIB(MIB) {}99100Register getStackAddress(uint64_t Size, int64_t Offset,101MachinePointerInfo &MPO,102ISD::ArgFlagsTy Flags) override {103assert((Size == 1 || Size == 2 || Size == 4 || Size == 8) &&104"Unsupported size");105106LLT p0 = LLT::pointer(0, 32);107LLT s32 = LLT::scalar(32);108auto SPReg = MIRBuilder.buildCopy(p0, Register(ARM::SP));109110auto OffsetReg = MIRBuilder.buildConstant(s32, Offset);111112auto AddrReg = MIRBuilder.buildPtrAdd(p0, SPReg, OffsetReg);113114MPO = MachinePointerInfo::getStack(MIRBuilder.getMF(), Offset);115return AddrReg.getReg(0);116}117118void assignValueToReg(Register ValVReg, Register PhysReg,119const CCValAssign &VA) override {120assert(VA.isRegLoc() && "Value shouldn't be assigned to reg");121assert(VA.getLocReg() == PhysReg && "Assigning to the wrong reg?");122123assert(VA.getValVT().getSizeInBits() <= 64 && "Unsupported value size");124assert(VA.getLocVT().getSizeInBits() <= 64 && "Unsupported location size");125126Register ExtReg = extendRegister(ValVReg, VA);127MIRBuilder.buildCopy(PhysReg, ExtReg);128MIB.addUse(PhysReg, RegState::Implicit);129}130131void assignValueToAddress(Register ValVReg, Register Addr, LLT MemTy,132const MachinePointerInfo &MPO,133const CCValAssign &VA) override {134Register ExtReg = extendRegister(ValVReg, VA);135auto MMO = MIRBuilder.getMF().getMachineMemOperand(136MPO, MachineMemOperand::MOStore, MemTy, Align(1));137MIRBuilder.buildStore(ExtReg, Addr, *MMO);138}139140unsigned assignCustomValue(CallLowering::ArgInfo &Arg,141ArrayRef<CCValAssign> VAs,142std::function<void()> *Thunk) override {143assert(Arg.Regs.size() == 1 && "Can't handle multple regs yet");144145const CCValAssign &VA = VAs[0];146assert(VA.needsCustom() && "Value doesn't need custom handling");147148// Custom lowering for other types, such as f16, is currently not supported149if (VA.getValVT() != MVT::f64)150return 0;151152const CCValAssign &NextVA = VAs[1];153assert(NextVA.needsCustom() && "Value doesn't need custom handling");154assert(NextVA.getValVT() == MVT::f64 && "Unsupported type");155156assert(VA.getValNo() == NextVA.getValNo() &&157"Values belong to different arguments");158159assert(VA.isRegLoc() && "Value should be in reg");160assert(NextVA.isRegLoc() && "Value should be in reg");161162Register NewRegs[] = {MRI.createGenericVirtualRegister(LLT::scalar(32)),163MRI.createGenericVirtualRegister(LLT::scalar(32))};164MIRBuilder.buildUnmerge(NewRegs, Arg.Regs[0]);165166bool IsLittle = MIRBuilder.getMF().getSubtarget<ARMSubtarget>().isLittle();167if (!IsLittle)168std::swap(NewRegs[0], NewRegs[1]);169170if (Thunk) {171*Thunk = [=]() {172assignValueToReg(NewRegs[0], VA.getLocReg(), VA);173assignValueToReg(NewRegs[1], NextVA.getLocReg(), NextVA);174};175return 2;176}177assignValueToReg(NewRegs[0], VA.getLocReg(), VA);178assignValueToReg(NewRegs[1], NextVA.getLocReg(), NextVA);179return 2;180}181182MachineInstrBuilder MIB;183};184185} // end anonymous namespace186187/// Lower the return value for the already existing \p Ret. This assumes that188/// \p MIRBuilder's insertion point is correct.189bool ARMCallLowering::lowerReturnVal(MachineIRBuilder &MIRBuilder,190const Value *Val, ArrayRef<Register> VRegs,191MachineInstrBuilder &Ret) const {192if (!Val)193// Nothing to do here.194return true;195196auto &MF = MIRBuilder.getMF();197const auto &F = MF.getFunction();198199const auto &DL = MF.getDataLayout();200auto &TLI = *getTLI<ARMTargetLowering>();201if (!isSupportedType(DL, TLI, Val->getType()))202return false;203204ArgInfo OrigRetInfo(VRegs, Val->getType(), 0);205setArgFlags(OrigRetInfo, AttributeList::ReturnIndex, DL, F);206207SmallVector<ArgInfo, 4> SplitRetInfos;208splitToValueTypes(OrigRetInfo, SplitRetInfos, DL, F.getCallingConv());209210CCAssignFn *AssignFn =211TLI.CCAssignFnForReturn(F.getCallingConv(), F.isVarArg());212213OutgoingValueAssigner RetAssigner(AssignFn);214ARMOutgoingValueHandler RetHandler(MIRBuilder, MF.getRegInfo(), Ret);215return determineAndHandleAssignments(RetHandler, RetAssigner, SplitRetInfos,216MIRBuilder, F.getCallingConv(),217F.isVarArg());218}219220bool ARMCallLowering::lowerReturn(MachineIRBuilder &MIRBuilder,221const Value *Val, ArrayRef<Register> VRegs,222FunctionLoweringInfo &FLI) const {223assert(!Val == VRegs.empty() && "Return value without a vreg");224225auto const &ST = MIRBuilder.getMF().getSubtarget<ARMSubtarget>();226unsigned Opcode = ST.getReturnOpcode();227auto Ret = MIRBuilder.buildInstrNoInsert(Opcode).add(predOps(ARMCC::AL));228229if (!lowerReturnVal(MIRBuilder, Val, VRegs, Ret))230return false;231232MIRBuilder.insertInstr(Ret);233return true;234}235236namespace {237238/// Helper class for values coming in through an ABI boundary (used for handling239/// formal arguments and call return values).240struct ARMIncomingValueHandler : public CallLowering::IncomingValueHandler {241ARMIncomingValueHandler(MachineIRBuilder &MIRBuilder,242MachineRegisterInfo &MRI)243: IncomingValueHandler(MIRBuilder, MRI) {}244245Register getStackAddress(uint64_t Size, int64_t Offset,246MachinePointerInfo &MPO,247ISD::ArgFlagsTy Flags) override {248assert((Size == 1 || Size == 2 || Size == 4 || Size == 8) &&249"Unsupported size");250251auto &MFI = MIRBuilder.getMF().getFrameInfo();252253// Byval is assumed to be writable memory, but other stack passed arguments254// are not.255const bool IsImmutable = !Flags.isByVal();256257int FI = MFI.CreateFixedObject(Size, Offset, IsImmutable);258MPO = MachinePointerInfo::getFixedStack(MIRBuilder.getMF(), FI);259260return MIRBuilder.buildFrameIndex(LLT::pointer(MPO.getAddrSpace(), 32), FI)261.getReg(0);262}263264void assignValueToAddress(Register ValVReg, Register Addr, LLT MemTy,265const MachinePointerInfo &MPO,266const CCValAssign &VA) override {267if (VA.getLocInfo() == CCValAssign::SExt ||268VA.getLocInfo() == CCValAssign::ZExt) {269// If the value is zero- or sign-extended, its size becomes 4 bytes, so270// that's what we should load.271MemTy = LLT::scalar(32);272assert(MRI.getType(ValVReg).isScalar() && "Only scalars supported atm");273274auto LoadVReg = buildLoad(LLT::scalar(32), Addr, MemTy, MPO);275MIRBuilder.buildTrunc(ValVReg, LoadVReg);276} else {277// If the value is not extended, a simple load will suffice.278buildLoad(ValVReg, Addr, MemTy, MPO);279}280}281282MachineInstrBuilder buildLoad(const DstOp &Res, Register Addr, LLT MemTy,283const MachinePointerInfo &MPO) {284MachineFunction &MF = MIRBuilder.getMF();285286auto MMO = MF.getMachineMemOperand(MPO, MachineMemOperand::MOLoad, MemTy,287inferAlignFromPtrInfo(MF, MPO));288return MIRBuilder.buildLoad(Res, Addr, *MMO);289}290291void assignValueToReg(Register ValVReg, Register PhysReg,292const CCValAssign &VA) override {293assert(VA.isRegLoc() && "Value shouldn't be assigned to reg");294assert(VA.getLocReg() == PhysReg && "Assigning to the wrong reg?");295296uint64_t ValSize = VA.getValVT().getFixedSizeInBits();297uint64_t LocSize = VA.getLocVT().getFixedSizeInBits();298299assert(ValSize <= 64 && "Unsupported value size");300assert(LocSize <= 64 && "Unsupported location size");301302markPhysRegUsed(PhysReg);303if (ValSize == LocSize) {304MIRBuilder.buildCopy(ValVReg, PhysReg);305} else {306assert(ValSize < LocSize && "Extensions not supported");307308// We cannot create a truncating copy, nor a trunc of a physical register.309// Therefore, we need to copy the content of the physical register into a310// virtual one and then truncate that.311auto PhysRegToVReg = MIRBuilder.buildCopy(LLT::scalar(LocSize), PhysReg);312MIRBuilder.buildTrunc(ValVReg, PhysRegToVReg);313}314}315316unsigned assignCustomValue(ARMCallLowering::ArgInfo &Arg,317ArrayRef<CCValAssign> VAs,318std::function<void()> *Thunk) override {319assert(Arg.Regs.size() == 1 && "Can't handle multple regs yet");320321const CCValAssign &VA = VAs[0];322assert(VA.needsCustom() && "Value doesn't need custom handling");323324// Custom lowering for other types, such as f16, is currently not supported325if (VA.getValVT() != MVT::f64)326return 0;327328const CCValAssign &NextVA = VAs[1];329assert(NextVA.needsCustom() && "Value doesn't need custom handling");330assert(NextVA.getValVT() == MVT::f64 && "Unsupported type");331332assert(VA.getValNo() == NextVA.getValNo() &&333"Values belong to different arguments");334335assert(VA.isRegLoc() && "Value should be in reg");336assert(NextVA.isRegLoc() && "Value should be in reg");337338Register NewRegs[] = {MRI.createGenericVirtualRegister(LLT::scalar(32)),339MRI.createGenericVirtualRegister(LLT::scalar(32))};340341assignValueToReg(NewRegs[0], VA.getLocReg(), VA);342assignValueToReg(NewRegs[1], NextVA.getLocReg(), NextVA);343344bool IsLittle = MIRBuilder.getMF().getSubtarget<ARMSubtarget>().isLittle();345if (!IsLittle)346std::swap(NewRegs[0], NewRegs[1]);347348MIRBuilder.buildMergeLikeInstr(Arg.Regs[0], NewRegs);349350return 2;351}352353/// Marking a physical register as used is different between formal354/// parameters, where it's a basic block live-in, and call returns, where it's355/// an implicit-def of the call instruction.356virtual void markPhysRegUsed(unsigned PhysReg) = 0;357};358359struct FormalArgHandler : public ARMIncomingValueHandler {360FormalArgHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI)361: ARMIncomingValueHandler(MIRBuilder, MRI) {}362363void markPhysRegUsed(unsigned PhysReg) override {364MIRBuilder.getMRI()->addLiveIn(PhysReg);365MIRBuilder.getMBB().addLiveIn(PhysReg);366}367};368369} // end anonymous namespace370371bool ARMCallLowering::lowerFormalArguments(MachineIRBuilder &MIRBuilder,372const Function &F,373ArrayRef<ArrayRef<Register>> VRegs,374FunctionLoweringInfo &FLI) const {375auto &TLI = *getTLI<ARMTargetLowering>();376auto Subtarget = TLI.getSubtarget();377378if (Subtarget->isThumb1Only())379return false;380381// Quick exit if there aren't any args382if (F.arg_empty())383return true;384385if (F.isVarArg())386return false;387388auto &MF = MIRBuilder.getMF();389auto &MBB = MIRBuilder.getMBB();390const auto &DL = MF.getDataLayout();391392for (auto &Arg : F.args()) {393if (!isSupportedType(DL, TLI, Arg.getType()))394return false;395if (Arg.hasPassPointeeByValueCopyAttr())396return false;397}398399CCAssignFn *AssignFn =400TLI.CCAssignFnForCall(F.getCallingConv(), F.isVarArg());401402OutgoingValueAssigner ArgAssigner(AssignFn);403FormalArgHandler ArgHandler(MIRBuilder, MIRBuilder.getMF().getRegInfo());404405SmallVector<ArgInfo, 8> SplitArgInfos;406unsigned Idx = 0;407for (auto &Arg : F.args()) {408ArgInfo OrigArgInfo(VRegs[Idx], Arg.getType(), Idx);409410setArgFlags(OrigArgInfo, Idx + AttributeList::FirstArgIndex, DL, F);411splitToValueTypes(OrigArgInfo, SplitArgInfos, DL, F.getCallingConv());412413Idx++;414}415416if (!MBB.empty())417MIRBuilder.setInstr(*MBB.begin());418419if (!determineAndHandleAssignments(ArgHandler, ArgAssigner, SplitArgInfos,420MIRBuilder, F.getCallingConv(),421F.isVarArg()))422return false;423424// Move back to the end of the basic block.425MIRBuilder.setMBB(MBB);426return true;427}428429namespace {430431struct CallReturnHandler : public ARMIncomingValueHandler {432CallReturnHandler(MachineIRBuilder &MIRBuilder, MachineRegisterInfo &MRI,433MachineInstrBuilder MIB)434: ARMIncomingValueHandler(MIRBuilder, MRI), MIB(MIB) {}435436void markPhysRegUsed(unsigned PhysReg) override {437MIB.addDef(PhysReg, RegState::Implicit);438}439440MachineInstrBuilder MIB;441};442443// FIXME: This should move to the ARMSubtarget when it supports all the opcodes.444unsigned getCallOpcode(const MachineFunction &MF, const ARMSubtarget &STI,445bool isDirect) {446if (isDirect)447return STI.isThumb() ? ARM::tBL : ARM::BL;448449if (STI.isThumb())450return gettBLXrOpcode(MF);451452if (STI.hasV5TOps())453return getBLXOpcode(MF);454455if (STI.hasV4TOps())456return ARM::BX_CALL;457458return ARM::BMOVPCRX_CALL;459}460} // end anonymous namespace461462bool ARMCallLowering::lowerCall(MachineIRBuilder &MIRBuilder, CallLoweringInfo &Info) const {463MachineFunction &MF = MIRBuilder.getMF();464const auto &TLI = *getTLI<ARMTargetLowering>();465const auto &DL = MF.getDataLayout();466const auto &STI = MF.getSubtarget<ARMSubtarget>();467const TargetRegisterInfo *TRI = STI.getRegisterInfo();468MachineRegisterInfo &MRI = MF.getRegInfo();469470if (STI.genLongCalls())471return false;472473if (STI.isThumb1Only())474return false;475476auto CallSeqStart = MIRBuilder.buildInstr(ARM::ADJCALLSTACKDOWN);477478// Create the call instruction so we can add the implicit uses of arg479// registers, but don't insert it yet.480bool IsDirect = !Info.Callee.isReg();481auto CallOpcode = getCallOpcode(MF, STI, IsDirect);482auto MIB = MIRBuilder.buildInstrNoInsert(CallOpcode);483484bool IsThumb = STI.isThumb();485if (IsThumb)486MIB.add(predOps(ARMCC::AL));487488MIB.add(Info.Callee);489if (!IsDirect) {490auto CalleeReg = Info.Callee.getReg();491if (CalleeReg && !CalleeReg.isPhysical()) {492unsigned CalleeIdx = IsThumb ? 2 : 0;493MIB->getOperand(CalleeIdx).setReg(constrainOperandRegClass(494MF, *TRI, MRI, *STI.getInstrInfo(), *STI.getRegBankInfo(),495*MIB.getInstr(), MIB->getDesc(), Info.Callee, CalleeIdx));496}497}498499MIB.addRegMask(TRI->getCallPreservedMask(MF, Info.CallConv));500501SmallVector<ArgInfo, 8> ArgInfos;502for (auto Arg : Info.OrigArgs) {503if (!isSupportedType(DL, TLI, Arg.Ty))504return false;505506if (Arg.Flags[0].isByVal())507return false;508509splitToValueTypes(Arg, ArgInfos, DL, Info.CallConv);510}511512auto ArgAssignFn = TLI.CCAssignFnForCall(Info.CallConv, Info.IsVarArg);513OutgoingValueAssigner ArgAssigner(ArgAssignFn);514ARMOutgoingValueHandler ArgHandler(MIRBuilder, MRI, MIB);515if (!determineAndHandleAssignments(ArgHandler, ArgAssigner, ArgInfos,516MIRBuilder, Info.CallConv, Info.IsVarArg))517return false;518519// Now we can add the actual call instruction to the correct basic block.520MIRBuilder.insertInstr(MIB);521522if (!Info.OrigRet.Ty->isVoidTy()) {523if (!isSupportedType(DL, TLI, Info.OrigRet.Ty))524return false;525526ArgInfos.clear();527splitToValueTypes(Info.OrigRet, ArgInfos, DL, Info.CallConv);528auto RetAssignFn = TLI.CCAssignFnForReturn(Info.CallConv, Info.IsVarArg);529OutgoingValueAssigner Assigner(RetAssignFn);530CallReturnHandler RetHandler(MIRBuilder, MRI, MIB);531if (!determineAndHandleAssignments(RetHandler, Assigner, ArgInfos,532MIRBuilder, Info.CallConv,533Info.IsVarArg))534return false;535}536537// We now know the size of the stack - update the ADJCALLSTACKDOWN538// accordingly.539CallSeqStart.addImm(ArgAssigner.StackSize).addImm(0).add(predOps(ARMCC::AL));540541MIRBuilder.buildInstr(ARM::ADJCALLSTACKUP)542.addImm(ArgAssigner.StackSize)543.addImm(-1ULL)544.add(predOps(ARMCC::AL));545546return true;547}548549bool ARMCallLowering::enableBigEndian() const { return EnableGISelBigEndian; }550551