Path: blob/main/contrib/llvm-project/llvm/lib/Target/AArch64/AArch64AsmPrinter.cpp
35267 views
//===- AArch64AsmPrinter.cpp - AArch64 LLVM assembly writer ---------------===//1//2// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.3// See https://llvm.org/LICENSE.txt for license information.4// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception5//6//===----------------------------------------------------------------------===//7//8// This file contains a printer that converts from our internal representation9// of machine-dependent LLVM code to the AArch64 assembly language.10//11//===----------------------------------------------------------------------===//1213#include "AArch64.h"14#include "AArch64MCInstLower.h"15#include "AArch64MachineFunctionInfo.h"16#include "AArch64RegisterInfo.h"17#include "AArch64Subtarget.h"18#include "AArch64TargetObjectFile.h"19#include "MCTargetDesc/AArch64AddressingModes.h"20#include "MCTargetDesc/AArch64InstPrinter.h"21#include "MCTargetDesc/AArch64MCExpr.h"22#include "MCTargetDesc/AArch64MCTargetDesc.h"23#include "MCTargetDesc/AArch64TargetStreamer.h"24#include "TargetInfo/AArch64TargetInfo.h"25#include "Utils/AArch64BaseInfo.h"26#include "llvm/ADT/SmallString.h"27#include "llvm/ADT/SmallVector.h"28#include "llvm/ADT/StringRef.h"29#include "llvm/ADT/Twine.h"30#include "llvm/BinaryFormat/COFF.h"31#include "llvm/BinaryFormat/ELF.h"32#include "llvm/BinaryFormat/MachO.h"33#include "llvm/CodeGen/AsmPrinter.h"34#include "llvm/CodeGen/FaultMaps.h"35#include "llvm/CodeGen/MachineBasicBlock.h"36#include "llvm/CodeGen/MachineFunction.h"37#include "llvm/CodeGen/MachineInstr.h"38#include "llvm/CodeGen/MachineJumpTableInfo.h"39#include "llvm/CodeGen/MachineModuleInfoImpls.h"40#include "llvm/CodeGen/MachineOperand.h"41#include "llvm/CodeGen/StackMaps.h"42#include "llvm/CodeGen/TargetRegisterInfo.h"43#include "llvm/IR/DataLayout.h"44#include "llvm/IR/DebugInfoMetadata.h"45#include "llvm/IR/Module.h"46#include "llvm/MC/MCAsmInfo.h"47#include "llvm/MC/MCContext.h"48#include "llvm/MC/MCInst.h"49#include "llvm/MC/MCInstBuilder.h"50#include "llvm/MC/MCSectionELF.h"51#include "llvm/MC/MCSectionMachO.h"52#include "llvm/MC/MCStreamer.h"53#include "llvm/MC/MCSymbol.h"54#include "llvm/MC/TargetRegistry.h"55#include "llvm/Support/Casting.h"56#include "llvm/Support/CommandLine.h"57#include "llvm/Support/ErrorHandling.h"58#include "llvm/Support/raw_ostream.h"59#include "llvm/Target/TargetMachine.h"60#include "llvm/TargetParser/Triple.h"61#include "llvm/Transforms/Instrumentation/HWAddressSanitizer.h"62#include <algorithm>63#include <cassert>64#include <cstdint>65#include <map>66#include <memory>6768using namespace llvm;6970enum PtrauthCheckMode { Default, Unchecked, Poison, Trap };71static cl::opt<PtrauthCheckMode> PtrauthAuthChecks(72"aarch64-ptrauth-auth-checks", cl::Hidden,73cl::values(clEnumValN(Unchecked, "none", "don't test for failure"),74clEnumValN(Poison, "poison", "poison on failure"),75clEnumValN(Trap, "trap", "trap on failure")),76cl::desc("Check pointer authentication auth/resign failures"),77cl::init(Default));7879#define DEBUG_TYPE "asm-printer"8081namespace {8283class AArch64AsmPrinter : public AsmPrinter {84AArch64MCInstLower MCInstLowering;85FaultMaps FM;86const AArch64Subtarget *STI;87bool ShouldEmitWeakSwiftAsyncExtendedFramePointerFlags = false;8889public:90AArch64AsmPrinter(TargetMachine &TM, std::unique_ptr<MCStreamer> Streamer)91: AsmPrinter(TM, std::move(Streamer)), MCInstLowering(OutContext, *this),92FM(*this) {}9394StringRef getPassName() const override { return "AArch64 Assembly Printer"; }9596/// Wrapper for MCInstLowering.lowerOperand() for the97/// tblgen'erated pseudo lowering.98bool lowerOperand(const MachineOperand &MO, MCOperand &MCOp) const {99return MCInstLowering.lowerOperand(MO, MCOp);100}101102const MCExpr *lowerConstantPtrAuth(const ConstantPtrAuth &CPA) override;103104const MCExpr *lowerBlockAddressConstant(const BlockAddress &BA) override;105106void emitStartOfAsmFile(Module &M) override;107void emitJumpTableInfo() override;108std::tuple<const MCSymbol *, uint64_t, const MCSymbol *,109codeview::JumpTableEntrySize>110getCodeViewJumpTableInfo(int JTI, const MachineInstr *BranchInstr,111const MCSymbol *BranchLabel) const override;112113void emitFunctionEntryLabel() override;114115void LowerJumpTableDest(MCStreamer &OutStreamer, const MachineInstr &MI);116117void LowerHardenedBRJumpTable(const MachineInstr &MI);118119void LowerMOPS(MCStreamer &OutStreamer, const MachineInstr &MI);120121void LowerSTACKMAP(MCStreamer &OutStreamer, StackMaps &SM,122const MachineInstr &MI);123void LowerPATCHPOINT(MCStreamer &OutStreamer, StackMaps &SM,124const MachineInstr &MI);125void LowerSTATEPOINT(MCStreamer &OutStreamer, StackMaps &SM,126const MachineInstr &MI);127void LowerFAULTING_OP(const MachineInstr &MI);128129void LowerPATCHABLE_FUNCTION_ENTER(const MachineInstr &MI);130void LowerPATCHABLE_FUNCTION_EXIT(const MachineInstr &MI);131void LowerPATCHABLE_TAIL_CALL(const MachineInstr &MI);132void LowerPATCHABLE_EVENT_CALL(const MachineInstr &MI, bool Typed);133134typedef std::tuple<unsigned, bool, uint32_t, bool, uint64_t>135HwasanMemaccessTuple;136std::map<HwasanMemaccessTuple, MCSymbol *> HwasanMemaccessSymbols;137void LowerKCFI_CHECK(const MachineInstr &MI);138void LowerHWASAN_CHECK_MEMACCESS(const MachineInstr &MI);139void emitHwasanMemaccessSymbols(Module &M);140141void emitSled(const MachineInstr &MI, SledKind Kind);142143// Emit the sequence for BRA/BLRA (authenticate + branch/call).144void emitPtrauthBranch(const MachineInstr *MI);145146// Emit the sequence for AUT or AUTPAC.147void emitPtrauthAuthResign(const MachineInstr *MI);148149// Emit the sequence to compute a discriminator into x17, or reuse AddrDisc.150unsigned emitPtrauthDiscriminator(uint16_t Disc, unsigned AddrDisc,151unsigned &InstsEmitted);152153// Emit the sequence for LOADauthptrstatic154void LowerLOADauthptrstatic(const MachineInstr &MI);155156// Emit the sequence for LOADgotPAC/MOVaddrPAC (either GOT adrp-ldr or157// adrp-add followed by PAC sign)158void LowerMOVaddrPAC(const MachineInstr &MI);159160/// tblgen'erated driver function for lowering simple MI->MC161/// pseudo instructions.162bool emitPseudoExpansionLowering(MCStreamer &OutStreamer,163const MachineInstr *MI);164165void emitInstruction(const MachineInstr *MI) override;166167void emitFunctionHeaderComment() override;168169void getAnalysisUsage(AnalysisUsage &AU) const override {170AsmPrinter::getAnalysisUsage(AU);171AU.setPreservesAll();172}173174bool runOnMachineFunction(MachineFunction &MF) override {175AArch64FI = MF.getInfo<AArch64FunctionInfo>();176STI = &MF.getSubtarget<AArch64Subtarget>();177178SetupMachineFunction(MF);179180if (STI->isTargetCOFF()) {181bool Local = MF.getFunction().hasLocalLinkage();182COFF::SymbolStorageClass Scl =183Local ? COFF::IMAGE_SYM_CLASS_STATIC : COFF::IMAGE_SYM_CLASS_EXTERNAL;184int Type =185COFF::IMAGE_SYM_DTYPE_FUNCTION << COFF::SCT_COMPLEX_TYPE_SHIFT;186187OutStreamer->beginCOFFSymbolDef(CurrentFnSym);188OutStreamer->emitCOFFSymbolStorageClass(Scl);189OutStreamer->emitCOFFSymbolType(Type);190OutStreamer->endCOFFSymbolDef();191}192193// Emit the rest of the function body.194emitFunctionBody();195196// Emit the XRay table for this function.197emitXRayTable();198199// We didn't modify anything.200return false;201}202203const MCExpr *lowerConstant(const Constant *CV) override;204205private:206void printOperand(const MachineInstr *MI, unsigned OpNum, raw_ostream &O);207bool printAsmMRegister(const MachineOperand &MO, char Mode, raw_ostream &O);208bool printAsmRegInClass(const MachineOperand &MO,209const TargetRegisterClass *RC, unsigned AltName,210raw_ostream &O);211212bool PrintAsmOperand(const MachineInstr *MI, unsigned OpNum,213const char *ExtraCode, raw_ostream &O) override;214bool PrintAsmMemoryOperand(const MachineInstr *MI, unsigned OpNum,215const char *ExtraCode, raw_ostream &O) override;216217void PrintDebugValueComment(const MachineInstr *MI, raw_ostream &OS);218219void emitFunctionBodyEnd() override;220void emitGlobalAlias(const Module &M, const GlobalAlias &GA) override;221222MCSymbol *GetCPISymbol(unsigned CPID) const override;223void emitEndOfAsmFile(Module &M) override;224225AArch64FunctionInfo *AArch64FI = nullptr;226227/// Emit the LOHs contained in AArch64FI.228void emitLOHs();229230/// Emit instruction to set float register to zero.231void emitFMov0(const MachineInstr &MI);232233using MInstToMCSymbol = std::map<const MachineInstr *, MCSymbol *>;234235MInstToMCSymbol LOHInstToLabel;236237bool shouldEmitWeakSwiftAsyncExtendedFramePointerFlags() const override {238return ShouldEmitWeakSwiftAsyncExtendedFramePointerFlags;239}240241const MCSubtargetInfo *getIFuncMCSubtargetInfo() const override {242assert(STI);243return STI;244}245void emitMachOIFuncStubBody(Module &M, const GlobalIFunc &GI,246MCSymbol *LazyPointer) override;247void emitMachOIFuncStubHelperBody(Module &M, const GlobalIFunc &GI,248MCSymbol *LazyPointer) override;249};250251} // end anonymous namespace252253void AArch64AsmPrinter::emitStartOfAsmFile(Module &M) {254const Triple &TT = TM.getTargetTriple();255256if (TT.isOSBinFormatCOFF()) {257// Emit an absolute @feat.00 symbol258MCSymbol *S = MMI->getContext().getOrCreateSymbol(StringRef("@feat.00"));259OutStreamer->beginCOFFSymbolDef(S);260OutStreamer->emitCOFFSymbolStorageClass(COFF::IMAGE_SYM_CLASS_STATIC);261OutStreamer->emitCOFFSymbolType(COFF::IMAGE_SYM_DTYPE_NULL);262OutStreamer->endCOFFSymbolDef();263int64_t Feat00Value = 0;264265if (M.getModuleFlag("cfguard")) {266// Object is CFG-aware.267Feat00Value |= COFF::Feat00Flags::GuardCF;268}269270if (M.getModuleFlag("ehcontguard")) {271// Object also has EHCont.272Feat00Value |= COFF::Feat00Flags::GuardEHCont;273}274275if (M.getModuleFlag("ms-kernel")) {276// Object is compiled with /kernel.277Feat00Value |= COFF::Feat00Flags::Kernel;278}279280OutStreamer->emitSymbolAttribute(S, MCSA_Global);281OutStreamer->emitAssignment(282S, MCConstantExpr::create(Feat00Value, MMI->getContext()));283}284285if (!TT.isOSBinFormatELF())286return;287288// Assemble feature flags that may require creation of a note section.289unsigned Flags = 0;290if (const auto *BTE = mdconst::extract_or_null<ConstantInt>(291M.getModuleFlag("branch-target-enforcement")))292if (!BTE->isZero())293Flags |= ELF::GNU_PROPERTY_AARCH64_FEATURE_1_BTI;294295if (const auto *GCS = mdconst::extract_or_null<ConstantInt>(296M.getModuleFlag("guarded-control-stack")))297if (!GCS->isZero())298Flags |= ELF::GNU_PROPERTY_AARCH64_FEATURE_1_GCS;299300if (const auto *Sign = mdconst::extract_or_null<ConstantInt>(301M.getModuleFlag("sign-return-address")))302if (!Sign->isZero())303Flags |= ELF::GNU_PROPERTY_AARCH64_FEATURE_1_PAC;304305uint64_t PAuthABIPlatform = -1;306if (const auto *PAP = mdconst::extract_or_null<ConstantInt>(307M.getModuleFlag("aarch64-elf-pauthabi-platform")))308PAuthABIPlatform = PAP->getZExtValue();309uint64_t PAuthABIVersion = -1;310if (const auto *PAV = mdconst::extract_or_null<ConstantInt>(311M.getModuleFlag("aarch64-elf-pauthabi-version")))312PAuthABIVersion = PAV->getZExtValue();313314// Emit a .note.gnu.property section with the flags.315auto *TS =316static_cast<AArch64TargetStreamer *>(OutStreamer->getTargetStreamer());317TS->emitNoteSection(Flags, PAuthABIPlatform, PAuthABIVersion);318}319320void AArch64AsmPrinter::emitFunctionHeaderComment() {321const AArch64FunctionInfo *FI = MF->getInfo<AArch64FunctionInfo>();322std::optional<std::string> OutlinerString = FI->getOutliningStyle();323if (OutlinerString != std::nullopt)324OutStreamer->getCommentOS() << ' ' << OutlinerString;325}326327void AArch64AsmPrinter::LowerPATCHABLE_FUNCTION_ENTER(const MachineInstr &MI)328{329const Function &F = MF->getFunction();330if (F.hasFnAttribute("patchable-function-entry")) {331unsigned Num;332if (F.getFnAttribute("patchable-function-entry")333.getValueAsString()334.getAsInteger(10, Num))335return;336emitNops(Num);337return;338}339340emitSled(MI, SledKind::FUNCTION_ENTER);341}342343void AArch64AsmPrinter::LowerPATCHABLE_FUNCTION_EXIT(const MachineInstr &MI) {344emitSled(MI, SledKind::FUNCTION_EXIT);345}346347void AArch64AsmPrinter::LowerPATCHABLE_TAIL_CALL(const MachineInstr &MI) {348emitSled(MI, SledKind::TAIL_CALL);349}350351void AArch64AsmPrinter::emitSled(const MachineInstr &MI, SledKind Kind) {352static const int8_t NoopsInSledCount = 7;353// We want to emit the following pattern:354//355// .Lxray_sled_N:356// ALIGN357// B #32358// ; 7 NOP instructions (28 bytes)359// .tmpN360//361// We need the 28 bytes (7 instructions) because at runtime, we'd be patching362// over the full 32 bytes (8 instructions) with the following pattern:363//364// STP X0, X30, [SP, #-16]! ; push X0 and the link register to the stack365// LDR W17, #12 ; W17 := function ID366// LDR X16,#12 ; X16 := addr of __xray_FunctionEntry or __xray_FunctionExit367// BLR X16 ; call the tracing trampoline368// ;DATA: 32 bits of function ID369// ;DATA: lower 32 bits of the address of the trampoline370// ;DATA: higher 32 bits of the address of the trampoline371// LDP X0, X30, [SP], #16 ; pop X0 and the link register from the stack372//373OutStreamer->emitCodeAlignment(Align(4), &getSubtargetInfo());374auto CurSled = OutContext.createTempSymbol("xray_sled_", true);375OutStreamer->emitLabel(CurSled);376auto Target = OutContext.createTempSymbol();377378// Emit "B #32" instruction, which jumps over the next 28 bytes.379// The operand has to be the number of 4-byte instructions to jump over,380// including the current instruction.381EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::B).addImm(8));382383for (int8_t I = 0; I < NoopsInSledCount; I++)384EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::HINT).addImm(0));385386OutStreamer->emitLabel(Target);387recordSled(CurSled, MI, Kind, 2);388}389390// Emit the following code for Intrinsic::{xray_customevent,xray_typedevent}391// (built-in functions __xray_customevent/__xray_typedevent).392//393// .Lxray_event_sled_N:394// b 1f395// save x0 and x1 (and also x2 for TYPED_EVENT_CALL)396// set up x0 and x1 (and also x2 for TYPED_EVENT_CALL)397// bl __xray_CustomEvent or __xray_TypedEvent398// restore x0 and x1 (and also x2 for TYPED_EVENT_CALL)399// 1:400//401// There are 6 instructions for EVENT_CALL and 9 for TYPED_EVENT_CALL.402//403// Then record a sled of kind CUSTOM_EVENT or TYPED_EVENT.404// After patching, b .+N will become a nop.405void AArch64AsmPrinter::LowerPATCHABLE_EVENT_CALL(const MachineInstr &MI,406bool Typed) {407auto &O = *OutStreamer;408MCSymbol *CurSled = OutContext.createTempSymbol("xray_sled_", true);409O.emitLabel(CurSled);410MCInst MovX0Op0 = MCInstBuilder(AArch64::ORRXrs)411.addReg(AArch64::X0)412.addReg(AArch64::XZR)413.addReg(MI.getOperand(0).getReg())414.addImm(0);415MCInst MovX1Op1 = MCInstBuilder(AArch64::ORRXrs)416.addReg(AArch64::X1)417.addReg(AArch64::XZR)418.addReg(MI.getOperand(1).getReg())419.addImm(0);420bool MachO = TM.getTargetTriple().isOSBinFormatMachO();421auto *Sym = MCSymbolRefExpr::create(422OutContext.getOrCreateSymbol(423Twine(MachO ? "_" : "") +424(Typed ? "__xray_TypedEvent" : "__xray_CustomEvent")),425OutContext);426if (Typed) {427O.AddComment("Begin XRay typed event");428EmitToStreamer(O, MCInstBuilder(AArch64::B).addImm(9));429EmitToStreamer(O, MCInstBuilder(AArch64::STPXpre)430.addReg(AArch64::SP)431.addReg(AArch64::X0)432.addReg(AArch64::X1)433.addReg(AArch64::SP)434.addImm(-4));435EmitToStreamer(O, MCInstBuilder(AArch64::STRXui)436.addReg(AArch64::X2)437.addReg(AArch64::SP)438.addImm(2));439EmitToStreamer(O, MovX0Op0);440EmitToStreamer(O, MovX1Op1);441EmitToStreamer(O, MCInstBuilder(AArch64::ORRXrs)442.addReg(AArch64::X2)443.addReg(AArch64::XZR)444.addReg(MI.getOperand(2).getReg())445.addImm(0));446EmitToStreamer(O, MCInstBuilder(AArch64::BL).addExpr(Sym));447EmitToStreamer(O, MCInstBuilder(AArch64::LDRXui)448.addReg(AArch64::X2)449.addReg(AArch64::SP)450.addImm(2));451O.AddComment("End XRay typed event");452EmitToStreamer(O, MCInstBuilder(AArch64::LDPXpost)453.addReg(AArch64::SP)454.addReg(AArch64::X0)455.addReg(AArch64::X1)456.addReg(AArch64::SP)457.addImm(4));458459recordSled(CurSled, MI, SledKind::TYPED_EVENT, 2);460} else {461O.AddComment("Begin XRay custom event");462EmitToStreamer(O, MCInstBuilder(AArch64::B).addImm(6));463EmitToStreamer(O, MCInstBuilder(AArch64::STPXpre)464.addReg(AArch64::SP)465.addReg(AArch64::X0)466.addReg(AArch64::X1)467.addReg(AArch64::SP)468.addImm(-2));469EmitToStreamer(O, MovX0Op0);470EmitToStreamer(O, MovX1Op1);471EmitToStreamer(O, MCInstBuilder(AArch64::BL).addExpr(Sym));472O.AddComment("End XRay custom event");473EmitToStreamer(O, MCInstBuilder(AArch64::LDPXpost)474.addReg(AArch64::SP)475.addReg(AArch64::X0)476.addReg(AArch64::X1)477.addReg(AArch64::SP)478.addImm(2));479480recordSled(CurSled, MI, SledKind::CUSTOM_EVENT, 2);481}482}483484void AArch64AsmPrinter::LowerKCFI_CHECK(const MachineInstr &MI) {485Register AddrReg = MI.getOperand(0).getReg();486assert(std::next(MI.getIterator())->isCall() &&487"KCFI_CHECK not followed by a call instruction");488assert(std::next(MI.getIterator())->getOperand(0).getReg() == AddrReg &&489"KCFI_CHECK call target doesn't match call operand");490491// Default to using the intra-procedure-call temporary registers for492// comparing the hashes.493unsigned ScratchRegs[] = {AArch64::W16, AArch64::W17};494if (AddrReg == AArch64::XZR) {495// Checking XZR makes no sense. Instead of emitting a load, zero496// ScratchRegs[0] and use it for the ESR AddrIndex below.497AddrReg = getXRegFromWReg(ScratchRegs[0]);498EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ORRXrs)499.addReg(AddrReg)500.addReg(AArch64::XZR)501.addReg(AArch64::XZR)502.addImm(0));503} else {504// If one of the scratch registers is used for the call target (e.g.505// with AArch64::TCRETURNriBTI), we can clobber another caller-saved506// temporary register instead (in this case, AArch64::W9) as the check507// is immediately followed by the call instruction.508for (auto &Reg : ScratchRegs) {509if (Reg == getWRegFromXReg(AddrReg)) {510Reg = AArch64::W9;511break;512}513}514assert(ScratchRegs[0] != AddrReg && ScratchRegs[1] != AddrReg &&515"Invalid scratch registers for KCFI_CHECK");516517// Adjust the offset for patchable-function-prefix. This assumes that518// patchable-function-prefix is the same for all functions.519int64_t PrefixNops = 0;520(void)MI.getMF()521->getFunction()522.getFnAttribute("patchable-function-prefix")523.getValueAsString()524.getAsInteger(10, PrefixNops);525526// Load the target function type hash.527EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::LDURWi)528.addReg(ScratchRegs[0])529.addReg(AddrReg)530.addImm(-(PrefixNops * 4 + 4)));531}532533// Load the expected type hash.534const int64_t Type = MI.getOperand(1).getImm();535EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::MOVKWi)536.addReg(ScratchRegs[1])537.addReg(ScratchRegs[1])538.addImm(Type & 0xFFFF)539.addImm(0));540EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::MOVKWi)541.addReg(ScratchRegs[1])542.addReg(ScratchRegs[1])543.addImm((Type >> 16) & 0xFFFF)544.addImm(16));545546// Compare the hashes and trap if there's a mismatch.547EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::SUBSWrs)548.addReg(AArch64::WZR)549.addReg(ScratchRegs[0])550.addReg(ScratchRegs[1])551.addImm(0));552553MCSymbol *Pass = OutContext.createTempSymbol();554EmitToStreamer(*OutStreamer,555MCInstBuilder(AArch64::Bcc)556.addImm(AArch64CC::EQ)557.addExpr(MCSymbolRefExpr::create(Pass, OutContext)));558559// The base ESR is 0x8000 and the register information is encoded in bits560// 0-9 as follows:561// - 0-4: n, where the register Xn contains the target address562// - 5-9: m, where the register Wm contains the expected type hash563// Where n, m are in [0, 30].564unsigned TypeIndex = ScratchRegs[1] - AArch64::W0;565unsigned AddrIndex;566switch (AddrReg) {567default:568AddrIndex = AddrReg - AArch64::X0;569break;570case AArch64::FP:571AddrIndex = 29;572break;573case AArch64::LR:574AddrIndex = 30;575break;576}577578assert(AddrIndex < 31 && TypeIndex < 31);579580unsigned ESR = 0x8000 | ((TypeIndex & 31) << 5) | (AddrIndex & 31);581EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::BRK).addImm(ESR));582OutStreamer->emitLabel(Pass);583}584585void AArch64AsmPrinter::LowerHWASAN_CHECK_MEMACCESS(const MachineInstr &MI) {586Register Reg = MI.getOperand(0).getReg();587bool IsShort =588((MI.getOpcode() == AArch64::HWASAN_CHECK_MEMACCESS_SHORTGRANULES) ||589(MI.getOpcode() ==590AArch64::HWASAN_CHECK_MEMACCESS_SHORTGRANULES_FIXEDSHADOW));591uint32_t AccessInfo = MI.getOperand(1).getImm();592bool IsFixedShadow =593((MI.getOpcode() == AArch64::HWASAN_CHECK_MEMACCESS_FIXEDSHADOW) ||594(MI.getOpcode() ==595AArch64::HWASAN_CHECK_MEMACCESS_SHORTGRANULES_FIXEDSHADOW));596uint64_t FixedShadowOffset = IsFixedShadow ? MI.getOperand(2).getImm() : 0;597598MCSymbol *&Sym = HwasanMemaccessSymbols[HwasanMemaccessTuple(599Reg, IsShort, AccessInfo, IsFixedShadow, FixedShadowOffset)];600if (!Sym) {601// FIXME: Make this work on non-ELF.602if (!TM.getTargetTriple().isOSBinFormatELF())603report_fatal_error("llvm.hwasan.check.memaccess only supported on ELF");604605std::string SymName = "__hwasan_check_x" + utostr(Reg - AArch64::X0) + "_" +606utostr(AccessInfo);607if (IsFixedShadow)608SymName += "_fixed_" + utostr(FixedShadowOffset);609if (IsShort)610SymName += "_short_v2";611Sym = OutContext.getOrCreateSymbol(SymName);612}613614EmitToStreamer(*OutStreamer,615MCInstBuilder(AArch64::BL)616.addExpr(MCSymbolRefExpr::create(Sym, OutContext)));617}618619void AArch64AsmPrinter::emitHwasanMemaccessSymbols(Module &M) {620if (HwasanMemaccessSymbols.empty())621return;622623const Triple &TT = TM.getTargetTriple();624assert(TT.isOSBinFormatELF());625std::unique_ptr<MCSubtargetInfo> STI(626TM.getTarget().createMCSubtargetInfo(TT.str(), "", ""));627assert(STI && "Unable to create subtarget info");628629MCSymbol *HwasanTagMismatchV1Sym =630OutContext.getOrCreateSymbol("__hwasan_tag_mismatch");631MCSymbol *HwasanTagMismatchV2Sym =632OutContext.getOrCreateSymbol("__hwasan_tag_mismatch_v2");633634const MCSymbolRefExpr *HwasanTagMismatchV1Ref =635MCSymbolRefExpr::create(HwasanTagMismatchV1Sym, OutContext);636const MCSymbolRefExpr *HwasanTagMismatchV2Ref =637MCSymbolRefExpr::create(HwasanTagMismatchV2Sym, OutContext);638639for (auto &P : HwasanMemaccessSymbols) {640unsigned Reg = std::get<0>(P.first);641bool IsShort = std::get<1>(P.first);642uint32_t AccessInfo = std::get<2>(P.first);643bool IsFixedShadow = std::get<3>(P.first);644uint64_t FixedShadowOffset = std::get<4>(P.first);645const MCSymbolRefExpr *HwasanTagMismatchRef =646IsShort ? HwasanTagMismatchV2Ref : HwasanTagMismatchV1Ref;647MCSymbol *Sym = P.second;648649bool HasMatchAllTag =650(AccessInfo >> HWASanAccessInfo::HasMatchAllShift) & 1;651uint8_t MatchAllTag =652(AccessInfo >> HWASanAccessInfo::MatchAllShift) & 0xff;653unsigned Size =6541 << ((AccessInfo >> HWASanAccessInfo::AccessSizeShift) & 0xf);655bool CompileKernel =656(AccessInfo >> HWASanAccessInfo::CompileKernelShift) & 1;657658OutStreamer->switchSection(OutContext.getELFSection(659".text.hot", ELF::SHT_PROGBITS,660ELF::SHF_EXECINSTR | ELF::SHF_ALLOC | ELF::SHF_GROUP, 0, Sym->getName(),661/*IsComdat=*/true));662663OutStreamer->emitSymbolAttribute(Sym, MCSA_ELF_TypeFunction);664OutStreamer->emitSymbolAttribute(Sym, MCSA_Weak);665OutStreamer->emitSymbolAttribute(Sym, MCSA_Hidden);666OutStreamer->emitLabel(Sym);667668OutStreamer->emitInstruction(MCInstBuilder(AArch64::SBFMXri)669.addReg(AArch64::X16)670.addReg(Reg)671.addImm(4)672.addImm(55),673*STI);674675if (IsFixedShadow) {676// Aarch64 makes it difficult to embed large constants in the code.677// Fortuitously, kShadowBaseAlignment == 32, so we use the 32-bit678// left-shift option in the MOV instruction. Combined with the 16-bit679// immediate, this is enough to represent any offset up to 2**48.680OutStreamer->emitInstruction(MCInstBuilder(AArch64::MOVZXi)681.addReg(AArch64::X17)682.addImm(FixedShadowOffset >> 32)683.addImm(32),684*STI);685OutStreamer->emitInstruction(MCInstBuilder(AArch64::LDRBBroX)686.addReg(AArch64::W16)687.addReg(AArch64::X17)688.addReg(AArch64::X16)689.addImm(0)690.addImm(0),691*STI);692} else {693OutStreamer->emitInstruction(694MCInstBuilder(AArch64::LDRBBroX)695.addReg(AArch64::W16)696.addReg(IsShort ? AArch64::X20 : AArch64::X9)697.addReg(AArch64::X16)698.addImm(0)699.addImm(0),700*STI);701}702703OutStreamer->emitInstruction(704MCInstBuilder(AArch64::SUBSXrs)705.addReg(AArch64::XZR)706.addReg(AArch64::X16)707.addReg(Reg)708.addImm(AArch64_AM::getShifterImm(AArch64_AM::LSR, 56)),709*STI);710MCSymbol *HandleMismatchOrPartialSym = OutContext.createTempSymbol();711OutStreamer->emitInstruction(712MCInstBuilder(AArch64::Bcc)713.addImm(AArch64CC::NE)714.addExpr(MCSymbolRefExpr::create(HandleMismatchOrPartialSym,715OutContext)),716*STI);717MCSymbol *ReturnSym = OutContext.createTempSymbol();718OutStreamer->emitLabel(ReturnSym);719OutStreamer->emitInstruction(720MCInstBuilder(AArch64::RET).addReg(AArch64::LR), *STI);721OutStreamer->emitLabel(HandleMismatchOrPartialSym);722723if (HasMatchAllTag) {724OutStreamer->emitInstruction(MCInstBuilder(AArch64::UBFMXri)725.addReg(AArch64::X17)726.addReg(Reg)727.addImm(56)728.addImm(63),729*STI);730OutStreamer->emitInstruction(MCInstBuilder(AArch64::SUBSXri)731.addReg(AArch64::XZR)732.addReg(AArch64::X17)733.addImm(MatchAllTag)734.addImm(0),735*STI);736OutStreamer->emitInstruction(737MCInstBuilder(AArch64::Bcc)738.addImm(AArch64CC::EQ)739.addExpr(MCSymbolRefExpr::create(ReturnSym, OutContext)),740*STI);741}742743if (IsShort) {744OutStreamer->emitInstruction(MCInstBuilder(AArch64::SUBSWri)745.addReg(AArch64::WZR)746.addReg(AArch64::W16)747.addImm(15)748.addImm(0),749*STI);750MCSymbol *HandleMismatchSym = OutContext.createTempSymbol();751OutStreamer->emitInstruction(752MCInstBuilder(AArch64::Bcc)753.addImm(AArch64CC::HI)754.addExpr(MCSymbolRefExpr::create(HandleMismatchSym, OutContext)),755*STI);756757OutStreamer->emitInstruction(758MCInstBuilder(AArch64::ANDXri)759.addReg(AArch64::X17)760.addReg(Reg)761.addImm(AArch64_AM::encodeLogicalImmediate(0xf, 64)),762*STI);763if (Size != 1)764OutStreamer->emitInstruction(MCInstBuilder(AArch64::ADDXri)765.addReg(AArch64::X17)766.addReg(AArch64::X17)767.addImm(Size - 1)768.addImm(0),769*STI);770OutStreamer->emitInstruction(MCInstBuilder(AArch64::SUBSWrs)771.addReg(AArch64::WZR)772.addReg(AArch64::W16)773.addReg(AArch64::W17)774.addImm(0),775*STI);776OutStreamer->emitInstruction(777MCInstBuilder(AArch64::Bcc)778.addImm(AArch64CC::LS)779.addExpr(MCSymbolRefExpr::create(HandleMismatchSym, OutContext)),780*STI);781782OutStreamer->emitInstruction(783MCInstBuilder(AArch64::ORRXri)784.addReg(AArch64::X16)785.addReg(Reg)786.addImm(AArch64_AM::encodeLogicalImmediate(0xf, 64)),787*STI);788OutStreamer->emitInstruction(MCInstBuilder(AArch64::LDRBBui)789.addReg(AArch64::W16)790.addReg(AArch64::X16)791.addImm(0),792*STI);793OutStreamer->emitInstruction(794MCInstBuilder(AArch64::SUBSXrs)795.addReg(AArch64::XZR)796.addReg(AArch64::X16)797.addReg(Reg)798.addImm(AArch64_AM::getShifterImm(AArch64_AM::LSR, 56)),799*STI);800OutStreamer->emitInstruction(801MCInstBuilder(AArch64::Bcc)802.addImm(AArch64CC::EQ)803.addExpr(MCSymbolRefExpr::create(ReturnSym, OutContext)),804*STI);805806OutStreamer->emitLabel(HandleMismatchSym);807}808809OutStreamer->emitInstruction(MCInstBuilder(AArch64::STPXpre)810.addReg(AArch64::SP)811.addReg(AArch64::X0)812.addReg(AArch64::X1)813.addReg(AArch64::SP)814.addImm(-32),815*STI);816OutStreamer->emitInstruction(MCInstBuilder(AArch64::STPXi)817.addReg(AArch64::FP)818.addReg(AArch64::LR)819.addReg(AArch64::SP)820.addImm(29),821*STI);822823if (Reg != AArch64::X0)824OutStreamer->emitInstruction(MCInstBuilder(AArch64::ORRXrs)825.addReg(AArch64::X0)826.addReg(AArch64::XZR)827.addReg(Reg)828.addImm(0),829*STI);830OutStreamer->emitInstruction(831MCInstBuilder(AArch64::MOVZXi)832.addReg(AArch64::X1)833.addImm(AccessInfo & HWASanAccessInfo::RuntimeMask)834.addImm(0),835*STI);836837if (CompileKernel) {838// The Linux kernel's dynamic loader doesn't support GOT relative839// relocations, but it doesn't support late binding either, so just call840// the function directly.841OutStreamer->emitInstruction(842MCInstBuilder(AArch64::B).addExpr(HwasanTagMismatchRef), *STI);843} else {844// Intentionally load the GOT entry and branch to it, rather than possibly845// late binding the function, which may clobber the registers before we846// have a chance to save them.847OutStreamer->emitInstruction(848MCInstBuilder(AArch64::ADRP)849.addReg(AArch64::X16)850.addExpr(AArch64MCExpr::create(851HwasanTagMismatchRef, AArch64MCExpr::VariantKind::VK_GOT_PAGE,852OutContext)),853*STI);854OutStreamer->emitInstruction(855MCInstBuilder(AArch64::LDRXui)856.addReg(AArch64::X16)857.addReg(AArch64::X16)858.addExpr(AArch64MCExpr::create(859HwasanTagMismatchRef, AArch64MCExpr::VariantKind::VK_GOT_LO12,860OutContext)),861*STI);862OutStreamer->emitInstruction(863MCInstBuilder(AArch64::BR).addReg(AArch64::X16), *STI);864}865}866}867868static void emitAuthenticatedPointer(MCStreamer &OutStreamer,869MCSymbol *StubLabel,870const MCExpr *StubAuthPtrRef) {871// sym$auth_ptr$key$disc:872OutStreamer.emitLabel(StubLabel);873OutStreamer.emitValue(StubAuthPtrRef, /*size=*/8);874}875876void AArch64AsmPrinter::emitEndOfAsmFile(Module &M) {877emitHwasanMemaccessSymbols(M);878879const Triple &TT = TM.getTargetTriple();880if (TT.isOSBinFormatMachO()) {881// Output authenticated pointers as indirect symbols, if we have any.882MachineModuleInfoMachO &MMIMacho =883MMI->getObjFileInfo<MachineModuleInfoMachO>();884885auto Stubs = MMIMacho.getAuthGVStubList();886887if (!Stubs.empty()) {888// Switch to the "__auth_ptr" section.889OutStreamer->switchSection(890OutContext.getMachOSection("__DATA", "__auth_ptr", MachO::S_REGULAR,891SectionKind::getMetadata()));892emitAlignment(Align(8));893894for (const auto &Stub : Stubs)895emitAuthenticatedPointer(*OutStreamer, Stub.first, Stub.second);896897OutStreamer->addBlankLine();898}899900// Funny Darwin hack: This flag tells the linker that no global symbols901// contain code that falls through to other global symbols (e.g. the obvious902// implementation of multiple entry points). If this doesn't occur, the903// linker can safely perform dead code stripping. Since LLVM never904// generates code that does this, it is always safe to set.905OutStreamer->emitAssemblerFlag(MCAF_SubsectionsViaSymbols);906}907908if (TT.isOSBinFormatELF()) {909// Output authenticated pointers as indirect symbols, if we have any.910MachineModuleInfoELF &MMIELF = MMI->getObjFileInfo<MachineModuleInfoELF>();911912auto Stubs = MMIELF.getAuthGVStubList();913914if (!Stubs.empty()) {915const TargetLoweringObjectFile &TLOF = getObjFileLowering();916OutStreamer->switchSection(TLOF.getDataSection());917emitAlignment(Align(8));918919for (const auto &Stub : Stubs)920emitAuthenticatedPointer(*OutStreamer, Stub.first, Stub.second);921922OutStreamer->addBlankLine();923}924}925926// Emit stack and fault map information.927FM.serializeToFaultMapSection();928929}930931void AArch64AsmPrinter::emitLOHs() {932SmallVector<MCSymbol *, 3> MCArgs;933934for (const auto &D : AArch64FI->getLOHContainer()) {935for (const MachineInstr *MI : D.getArgs()) {936MInstToMCSymbol::iterator LabelIt = LOHInstToLabel.find(MI);937assert(LabelIt != LOHInstToLabel.end() &&938"Label hasn't been inserted for LOH related instruction");939MCArgs.push_back(LabelIt->second);940}941OutStreamer->emitLOHDirective(D.getKind(), MCArgs);942MCArgs.clear();943}944}945946void AArch64AsmPrinter::emitFunctionBodyEnd() {947if (!AArch64FI->getLOHRelated().empty())948emitLOHs();949}950951/// GetCPISymbol - Return the symbol for the specified constant pool entry.952MCSymbol *AArch64AsmPrinter::GetCPISymbol(unsigned CPID) const {953// Darwin uses a linker-private symbol name for constant-pools (to954// avoid addends on the relocation?), ELF has no such concept and955// uses a normal private symbol.956if (!getDataLayout().getLinkerPrivateGlobalPrefix().empty())957return OutContext.getOrCreateSymbol(958Twine(getDataLayout().getLinkerPrivateGlobalPrefix()) + "CPI" +959Twine(getFunctionNumber()) + "_" + Twine(CPID));960961return AsmPrinter::GetCPISymbol(CPID);962}963964void AArch64AsmPrinter::printOperand(const MachineInstr *MI, unsigned OpNum,965raw_ostream &O) {966const MachineOperand &MO = MI->getOperand(OpNum);967switch (MO.getType()) {968default:969llvm_unreachable("<unknown operand type>");970case MachineOperand::MO_Register: {971Register Reg = MO.getReg();972assert(Reg.isPhysical());973assert(!MO.getSubReg() && "Subregs should be eliminated!");974O << AArch64InstPrinter::getRegisterName(Reg);975break;976}977case MachineOperand::MO_Immediate: {978O << MO.getImm();979break;980}981case MachineOperand::MO_GlobalAddress: {982PrintSymbolOperand(MO, O);983break;984}985case MachineOperand::MO_BlockAddress: {986MCSymbol *Sym = GetBlockAddressSymbol(MO.getBlockAddress());987Sym->print(O, MAI);988break;989}990}991}992993bool AArch64AsmPrinter::printAsmMRegister(const MachineOperand &MO, char Mode,994raw_ostream &O) {995Register Reg = MO.getReg();996switch (Mode) {997default:998return true; // Unknown mode.999case 'w':1000Reg = getWRegFromXReg(Reg);1001break;1002case 'x':1003Reg = getXRegFromWReg(Reg);1004break;1005case 't':1006Reg = getXRegFromXRegTuple(Reg);1007break;1008}10091010O << AArch64InstPrinter::getRegisterName(Reg);1011return false;1012}10131014// Prints the register in MO using class RC using the offset in the1015// new register class. This should not be used for cross class1016// printing.1017bool AArch64AsmPrinter::printAsmRegInClass(const MachineOperand &MO,1018const TargetRegisterClass *RC,1019unsigned AltName, raw_ostream &O) {1020assert(MO.isReg() && "Should only get here with a register!");1021const TargetRegisterInfo *RI = STI->getRegisterInfo();1022Register Reg = MO.getReg();1023unsigned RegToPrint = RC->getRegister(RI->getEncodingValue(Reg));1024if (!RI->regsOverlap(RegToPrint, Reg))1025return true;1026O << AArch64InstPrinter::getRegisterName(RegToPrint, AltName);1027return false;1028}10291030bool AArch64AsmPrinter::PrintAsmOperand(const MachineInstr *MI, unsigned OpNum,1031const char *ExtraCode, raw_ostream &O) {1032const MachineOperand &MO = MI->getOperand(OpNum);10331034// First try the generic code, which knows about modifiers like 'c' and 'n'.1035if (!AsmPrinter::PrintAsmOperand(MI, OpNum, ExtraCode, O))1036return false;10371038// Does this asm operand have a single letter operand modifier?1039if (ExtraCode && ExtraCode[0]) {1040if (ExtraCode[1] != 0)1041return true; // Unknown modifier.10421043switch (ExtraCode[0]) {1044default:1045return true; // Unknown modifier.1046case 'w': // Print W register1047case 'x': // Print X register1048if (MO.isReg())1049return printAsmMRegister(MO, ExtraCode[0], O);1050if (MO.isImm() && MO.getImm() == 0) {1051unsigned Reg = ExtraCode[0] == 'w' ? AArch64::WZR : AArch64::XZR;1052O << AArch64InstPrinter::getRegisterName(Reg);1053return false;1054}1055printOperand(MI, OpNum, O);1056return false;1057case 'b': // Print B register.1058case 'h': // Print H register.1059case 's': // Print S register.1060case 'd': // Print D register.1061case 'q': // Print Q register.1062case 'z': // Print Z register.1063if (MO.isReg()) {1064const TargetRegisterClass *RC;1065switch (ExtraCode[0]) {1066case 'b':1067RC = &AArch64::FPR8RegClass;1068break;1069case 'h':1070RC = &AArch64::FPR16RegClass;1071break;1072case 's':1073RC = &AArch64::FPR32RegClass;1074break;1075case 'd':1076RC = &AArch64::FPR64RegClass;1077break;1078case 'q':1079RC = &AArch64::FPR128RegClass;1080break;1081case 'z':1082RC = &AArch64::ZPRRegClass;1083break;1084default:1085return true;1086}1087return printAsmRegInClass(MO, RC, AArch64::NoRegAltName, O);1088}1089printOperand(MI, OpNum, O);1090return false;1091}1092}10931094// According to ARM, we should emit x and v registers unless we have a1095// modifier.1096if (MO.isReg()) {1097Register Reg = MO.getReg();10981099// If this is a w or x register, print an x register.1100if (AArch64::GPR32allRegClass.contains(Reg) ||1101AArch64::GPR64allRegClass.contains(Reg))1102return printAsmMRegister(MO, 'x', O);11031104// If this is an x register tuple, print an x register.1105if (AArch64::GPR64x8ClassRegClass.contains(Reg))1106return printAsmMRegister(MO, 't', O);11071108unsigned AltName = AArch64::NoRegAltName;1109const TargetRegisterClass *RegClass;1110if (AArch64::ZPRRegClass.contains(Reg)) {1111RegClass = &AArch64::ZPRRegClass;1112} else if (AArch64::PPRRegClass.contains(Reg)) {1113RegClass = &AArch64::PPRRegClass;1114} else if (AArch64::PNRRegClass.contains(Reg)) {1115RegClass = &AArch64::PNRRegClass;1116} else {1117RegClass = &AArch64::FPR128RegClass;1118AltName = AArch64::vreg;1119}11201121// If this is a b, h, s, d, or q register, print it as a v register.1122return printAsmRegInClass(MO, RegClass, AltName, O);1123}11241125printOperand(MI, OpNum, O);1126return false;1127}11281129bool AArch64AsmPrinter::PrintAsmMemoryOperand(const MachineInstr *MI,1130unsigned OpNum,1131const char *ExtraCode,1132raw_ostream &O) {1133if (ExtraCode && ExtraCode[0] && ExtraCode[0] != 'a')1134return true; // Unknown modifier.11351136const MachineOperand &MO = MI->getOperand(OpNum);1137assert(MO.isReg() && "unexpected inline asm memory operand");1138O << "[" << AArch64InstPrinter::getRegisterName(MO.getReg()) << "]";1139return false;1140}11411142void AArch64AsmPrinter::PrintDebugValueComment(const MachineInstr *MI,1143raw_ostream &OS) {1144unsigned NOps = MI->getNumOperands();1145assert(NOps == 4);1146OS << '\t' << MAI->getCommentString() << "DEBUG_VALUE: ";1147// cast away const; DIetc do not take const operands for some reason.1148OS << MI->getDebugVariable()->getName();1149OS << " <- ";1150// Frame address. Currently handles register +- offset only.1151assert(MI->isIndirectDebugValue());1152OS << '[';1153for (unsigned I = 0, E = std::distance(MI->debug_operands().begin(),1154MI->debug_operands().end());1155I < E; ++I) {1156if (I != 0)1157OS << ", ";1158printOperand(MI, I, OS);1159}1160OS << ']';1161OS << "+";1162printOperand(MI, NOps - 2, OS);1163}11641165void AArch64AsmPrinter::emitJumpTableInfo() {1166const MachineJumpTableInfo *MJTI = MF->getJumpTableInfo();1167if (!MJTI) return;11681169const std::vector<MachineJumpTableEntry> &JT = MJTI->getJumpTables();1170if (JT.empty()) return;11711172const TargetLoweringObjectFile &TLOF = getObjFileLowering();1173MCSection *ReadOnlySec = TLOF.getSectionForJumpTable(MF->getFunction(), TM);1174OutStreamer->switchSection(ReadOnlySec);11751176auto AFI = MF->getInfo<AArch64FunctionInfo>();1177for (unsigned JTI = 0, e = JT.size(); JTI != e; ++JTI) {1178const std::vector<MachineBasicBlock*> &JTBBs = JT[JTI].MBBs;11791180// If this jump table was deleted, ignore it.1181if (JTBBs.empty()) continue;11821183unsigned Size = AFI->getJumpTableEntrySize(JTI);1184emitAlignment(Align(Size));1185OutStreamer->emitLabel(GetJTISymbol(JTI));11861187const MCSymbol *BaseSym = AArch64FI->getJumpTableEntryPCRelSymbol(JTI);1188const MCExpr *Base = MCSymbolRefExpr::create(BaseSym, OutContext);11891190for (auto *JTBB : JTBBs) {1191const MCExpr *Value =1192MCSymbolRefExpr::create(JTBB->getSymbol(), OutContext);11931194// Each entry is:1195// .byte/.hword (LBB - Lbase)>>21196// or plain:1197// .word LBB - Lbase1198Value = MCBinaryExpr::createSub(Value, Base, OutContext);1199if (Size != 4)1200Value = MCBinaryExpr::createLShr(1201Value, MCConstantExpr::create(2, OutContext), OutContext);12021203OutStreamer->emitValue(Value, Size);1204}1205}1206}12071208std::tuple<const MCSymbol *, uint64_t, const MCSymbol *,1209codeview::JumpTableEntrySize>1210AArch64AsmPrinter::getCodeViewJumpTableInfo(int JTI,1211const MachineInstr *BranchInstr,1212const MCSymbol *BranchLabel) const {1213const auto AFI = MF->getInfo<AArch64FunctionInfo>();1214const auto Base = AArch64FI->getJumpTableEntryPCRelSymbol(JTI);1215codeview::JumpTableEntrySize EntrySize;1216switch (AFI->getJumpTableEntrySize(JTI)) {1217case 1:1218EntrySize = codeview::JumpTableEntrySize::UInt8ShiftLeft;1219break;1220case 2:1221EntrySize = codeview::JumpTableEntrySize::UInt16ShiftLeft;1222break;1223case 4:1224EntrySize = codeview::JumpTableEntrySize::Int32;1225break;1226default:1227llvm_unreachable("Unexpected jump table entry size");1228}1229return std::make_tuple(Base, 0, BranchLabel, EntrySize);1230}12311232void AArch64AsmPrinter::emitFunctionEntryLabel() {1233if (MF->getFunction().getCallingConv() == CallingConv::AArch64_VectorCall ||1234MF->getFunction().getCallingConv() ==1235CallingConv::AArch64_SVE_VectorCall ||1236MF->getInfo<AArch64FunctionInfo>()->isSVECC()) {1237auto *TS =1238static_cast<AArch64TargetStreamer *>(OutStreamer->getTargetStreamer());1239TS->emitDirectiveVariantPCS(CurrentFnSym);1240}12411242AsmPrinter::emitFunctionEntryLabel();12431244if (TM.getTargetTriple().isWindowsArm64EC() &&1245!MF->getFunction().hasLocalLinkage()) {1246// For ARM64EC targets, a function definition's name is mangled differently1247// from the normal symbol, emit required aliases here.1248auto emitFunctionAlias = [&](MCSymbol *Src, MCSymbol *Dst) {1249OutStreamer->emitSymbolAttribute(Src, MCSA_WeakAntiDep);1250OutStreamer->emitAssignment(1251Src, MCSymbolRefExpr::create(Dst, MCSymbolRefExpr::VK_None,1252MMI->getContext()));1253};12541255auto getSymbolFromMetadata = [&](StringRef Name) {1256MCSymbol *Sym = nullptr;1257if (MDNode *Node = MF->getFunction().getMetadata(Name)) {1258StringRef NameStr = cast<MDString>(Node->getOperand(0))->getString();1259Sym = MMI->getContext().getOrCreateSymbol(NameStr);1260}1261return Sym;1262};12631264if (MCSymbol *UnmangledSym =1265getSymbolFromMetadata("arm64ec_unmangled_name")) {1266MCSymbol *ECMangledSym = getSymbolFromMetadata("arm64ec_ecmangled_name");12671268if (ECMangledSym) {1269// An external function, emit the alias from the unmangled symbol to1270// mangled symbol name and the alias from the mangled symbol to guest1271// exit thunk.1272emitFunctionAlias(UnmangledSym, ECMangledSym);1273emitFunctionAlias(ECMangledSym, CurrentFnSym);1274} else {1275// A function implementation, emit the alias from the unmangled symbol1276// to mangled symbol name.1277emitFunctionAlias(UnmangledSym, CurrentFnSym);1278}1279}1280}1281}12821283void AArch64AsmPrinter::emitGlobalAlias(const Module &M,1284const GlobalAlias &GA) {1285if (auto F = dyn_cast_or_null<Function>(GA.getAliasee())) {1286// Global aliases must point to a definition, but unmangled patchable1287// symbols are special and need to point to an undefined symbol with "EXP+"1288// prefix. Such undefined symbol is resolved by the linker by creating1289// x86 thunk that jumps back to the actual EC target.1290if (MDNode *Node = F->getMetadata("arm64ec_exp_name")) {1291StringRef ExpStr = cast<MDString>(Node->getOperand(0))->getString();1292MCSymbol *ExpSym = MMI->getContext().getOrCreateSymbol(ExpStr);1293MCSymbol *Sym = MMI->getContext().getOrCreateSymbol(GA.getName());12941295OutStreamer->beginCOFFSymbolDef(ExpSym);1296OutStreamer->emitCOFFSymbolStorageClass(COFF::IMAGE_SYM_CLASS_EXTERNAL);1297OutStreamer->emitCOFFSymbolType(COFF::IMAGE_SYM_DTYPE_FUNCTION1298<< COFF::SCT_COMPLEX_TYPE_SHIFT);1299OutStreamer->endCOFFSymbolDef();13001301OutStreamer->beginCOFFSymbolDef(Sym);1302OutStreamer->emitCOFFSymbolStorageClass(COFF::IMAGE_SYM_CLASS_EXTERNAL);1303OutStreamer->emitCOFFSymbolType(COFF::IMAGE_SYM_DTYPE_FUNCTION1304<< COFF::SCT_COMPLEX_TYPE_SHIFT);1305OutStreamer->endCOFFSymbolDef();1306OutStreamer->emitSymbolAttribute(Sym, MCSA_Weak);1307OutStreamer->emitAssignment(1308Sym, MCSymbolRefExpr::create(ExpSym, MCSymbolRefExpr::VK_None,1309MMI->getContext()));1310return;1311}1312}1313AsmPrinter::emitGlobalAlias(M, GA);1314}13151316/// Small jump tables contain an unsigned byte or half, representing the offset1317/// from the lowest-addressed possible destination to the desired basic1318/// block. Since all instructions are 4-byte aligned, this is further compressed1319/// by counting in instructions rather than bytes (i.e. divided by 4). So, to1320/// materialize the correct destination we need:1321///1322/// adr xDest, .LBB0_01323/// ldrb wScratch, [xTable, xEntry] (with "lsl #1" for ldrh).1324/// add xDest, xDest, xScratch (with "lsl #2" for smaller entries)1325void AArch64AsmPrinter::LowerJumpTableDest(llvm::MCStreamer &OutStreamer,1326const llvm::MachineInstr &MI) {1327Register DestReg = MI.getOperand(0).getReg();1328Register ScratchReg = MI.getOperand(1).getReg();1329Register ScratchRegW =1330STI->getRegisterInfo()->getSubReg(ScratchReg, AArch64::sub_32);1331Register TableReg = MI.getOperand(2).getReg();1332Register EntryReg = MI.getOperand(3).getReg();1333int JTIdx = MI.getOperand(4).getIndex();1334int Size = AArch64FI->getJumpTableEntrySize(JTIdx);13351336// This has to be first because the compression pass based its reachability1337// calculations on the start of the JumpTableDest instruction.1338auto Label =1339MF->getInfo<AArch64FunctionInfo>()->getJumpTableEntryPCRelSymbol(JTIdx);13401341// If we don't already have a symbol to use as the base, use the ADR1342// instruction itself.1343if (!Label) {1344Label = MF->getContext().createTempSymbol();1345AArch64FI->setJumpTableEntryInfo(JTIdx, Size, Label);1346OutStreamer.emitLabel(Label);1347}13481349auto LabelExpr = MCSymbolRefExpr::create(Label, MF->getContext());1350EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::ADR)1351.addReg(DestReg)1352.addExpr(LabelExpr));13531354// Load the number of instruction-steps to offset from the label.1355unsigned LdrOpcode;1356switch (Size) {1357case 1: LdrOpcode = AArch64::LDRBBroX; break;1358case 2: LdrOpcode = AArch64::LDRHHroX; break;1359case 4: LdrOpcode = AArch64::LDRSWroX; break;1360default:1361llvm_unreachable("Unknown jump table size");1362}13631364EmitToStreamer(OutStreamer, MCInstBuilder(LdrOpcode)1365.addReg(Size == 4 ? ScratchReg : ScratchRegW)1366.addReg(TableReg)1367.addReg(EntryReg)1368.addImm(0)1369.addImm(Size == 1 ? 0 : 1));13701371// Add to the already materialized base label address, multiplying by 4 if1372// compressed.1373EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::ADDXrs)1374.addReg(DestReg)1375.addReg(DestReg)1376.addReg(ScratchReg)1377.addImm(Size == 4 ? 0 : 2));1378}13791380void AArch64AsmPrinter::LowerHardenedBRJumpTable(const MachineInstr &MI) {1381unsigned InstsEmitted = 0;13821383const MachineJumpTableInfo *MJTI = MF->getJumpTableInfo();1384assert(MJTI && "Can't lower jump-table dispatch without JTI");13851386const std::vector<MachineJumpTableEntry> &JTs = MJTI->getJumpTables();1387assert(!JTs.empty() && "Invalid JT index for jump-table dispatch");13881389// Emit:1390// mov x17, #<size of table> ; depending on table size, with MOVKs1391// cmp x16, x17 ; or #imm if table size fits in 12-bit1392// csel x16, x16, xzr, ls ; check for index overflow1393//1394// adrp x17, Ltable@PAGE ; materialize table address1395// add x17, Ltable@PAGEOFF1396// ldrsw x16, [x17, x16, lsl #2] ; load table entry1397//1398// Lanchor:1399// adr x17, Lanchor ; compute target address1400// add x16, x17, x161401// br x16 ; branch to target14021403MachineOperand JTOp = MI.getOperand(0);14041405unsigned JTI = JTOp.getIndex();1406assert(!AArch64FI->getJumpTableEntryPCRelSymbol(JTI) &&1407"unsupported compressed jump table");14081409const uint64_t NumTableEntries = JTs[JTI].MBBs.size();14101411// cmp only supports a 12-bit immediate. If we need more, materialize the1412// immediate, using x17 as a scratch register.1413uint64_t MaxTableEntry = NumTableEntries - 1;1414if (isUInt<12>(MaxTableEntry)) {1415EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::SUBSXri)1416.addReg(AArch64::XZR)1417.addReg(AArch64::X16)1418.addImm(MaxTableEntry)1419.addImm(0));1420++InstsEmitted;1421} else {1422EmitToStreamer(*OutStreamer,1423MCInstBuilder(AArch64::MOVZXi)1424.addReg(AArch64::X17)1425.addImm(static_cast<uint16_t>(MaxTableEntry))1426.addImm(0));1427++InstsEmitted;1428// It's sad that we have to manually materialize instructions, but we can't1429// trivially reuse the main pseudo expansion logic.1430// A MOVK sequence is easy enough to generate and handles the general case.1431for (int Offset = 16; Offset < 64; Offset += 16) {1432if ((MaxTableEntry >> Offset) == 0)1433break;1434EmitToStreamer(*OutStreamer,1435MCInstBuilder(AArch64::MOVKXi)1436.addReg(AArch64::X17)1437.addReg(AArch64::X17)1438.addImm(static_cast<uint16_t>(MaxTableEntry >> Offset))1439.addImm(Offset));1440++InstsEmitted;1441}1442EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::SUBSXrs)1443.addReg(AArch64::XZR)1444.addReg(AArch64::X16)1445.addReg(AArch64::X17)1446.addImm(0));1447++InstsEmitted;1448}14491450// This picks entry #0 on failure.1451// We might want to trap instead.1452EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::CSELXr)1453.addReg(AArch64::X16)1454.addReg(AArch64::X16)1455.addReg(AArch64::XZR)1456.addImm(AArch64CC::LS));1457++InstsEmitted;14581459// Prepare the @PAGE/@PAGEOFF low/high operands.1460MachineOperand JTMOHi(JTOp), JTMOLo(JTOp);1461MCOperand JTMCHi, JTMCLo;14621463JTMOHi.setTargetFlags(AArch64II::MO_PAGE);1464JTMOLo.setTargetFlags(AArch64II::MO_PAGEOFF | AArch64II::MO_NC);14651466MCInstLowering.lowerOperand(JTMOHi, JTMCHi);1467MCInstLowering.lowerOperand(JTMOLo, JTMCLo);14681469EmitToStreamer(1470*OutStreamer,1471MCInstBuilder(AArch64::ADRP).addReg(AArch64::X17).addOperand(JTMCHi));1472++InstsEmitted;14731474EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ADDXri)1475.addReg(AArch64::X17)1476.addReg(AArch64::X17)1477.addOperand(JTMCLo)1478.addImm(0));1479++InstsEmitted;14801481EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::LDRSWroX)1482.addReg(AArch64::X16)1483.addReg(AArch64::X17)1484.addReg(AArch64::X16)1485.addImm(0)1486.addImm(1));1487++InstsEmitted;14881489MCSymbol *AdrLabel = MF->getContext().createTempSymbol();1490const auto *AdrLabelE = MCSymbolRefExpr::create(AdrLabel, MF->getContext());1491AArch64FI->setJumpTableEntryInfo(JTI, 4, AdrLabel);14921493OutStreamer->emitLabel(AdrLabel);1494EmitToStreamer(1495*OutStreamer,1496MCInstBuilder(AArch64::ADR).addReg(AArch64::X17).addExpr(AdrLabelE));1497++InstsEmitted;14981499EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ADDXrs)1500.addReg(AArch64::X16)1501.addReg(AArch64::X17)1502.addReg(AArch64::X16)1503.addImm(0));1504++InstsEmitted;15051506EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::BR).addReg(AArch64::X16));1507++InstsEmitted;15081509(void)InstsEmitted;1510assert(STI->getInstrInfo()->getInstSizeInBytes(MI) >= InstsEmitted * 4);1511}15121513void AArch64AsmPrinter::LowerMOPS(llvm::MCStreamer &OutStreamer,1514const llvm::MachineInstr &MI) {1515unsigned Opcode = MI.getOpcode();1516assert(STI->hasMOPS());1517assert(STI->hasMTE() || Opcode != AArch64::MOPSMemorySetTaggingPseudo);15181519const auto Ops = [Opcode]() -> std::array<unsigned, 3> {1520if (Opcode == AArch64::MOPSMemoryCopyPseudo)1521return {AArch64::CPYFP, AArch64::CPYFM, AArch64::CPYFE};1522if (Opcode == AArch64::MOPSMemoryMovePseudo)1523return {AArch64::CPYP, AArch64::CPYM, AArch64::CPYE};1524if (Opcode == AArch64::MOPSMemorySetPseudo)1525return {AArch64::SETP, AArch64::SETM, AArch64::SETE};1526if (Opcode == AArch64::MOPSMemorySetTaggingPseudo)1527return {AArch64::SETGP, AArch64::SETGM, AArch64::MOPSSETGE};1528llvm_unreachable("Unhandled memory operation pseudo");1529}();1530const bool IsSet = Opcode == AArch64::MOPSMemorySetPseudo ||1531Opcode == AArch64::MOPSMemorySetTaggingPseudo;15321533for (auto Op : Ops) {1534int i = 0;1535auto MCIB = MCInstBuilder(Op);1536// Destination registers1537MCIB.addReg(MI.getOperand(i++).getReg());1538MCIB.addReg(MI.getOperand(i++).getReg());1539if (!IsSet)1540MCIB.addReg(MI.getOperand(i++).getReg());1541// Input registers1542MCIB.addReg(MI.getOperand(i++).getReg());1543MCIB.addReg(MI.getOperand(i++).getReg());1544MCIB.addReg(MI.getOperand(i++).getReg());15451546EmitToStreamer(OutStreamer, MCIB);1547}1548}15491550void AArch64AsmPrinter::LowerSTACKMAP(MCStreamer &OutStreamer, StackMaps &SM,1551const MachineInstr &MI) {1552unsigned NumNOPBytes = StackMapOpers(&MI).getNumPatchBytes();15531554auto &Ctx = OutStreamer.getContext();1555MCSymbol *MILabel = Ctx.createTempSymbol();1556OutStreamer.emitLabel(MILabel);15571558SM.recordStackMap(*MILabel, MI);1559assert(NumNOPBytes % 4 == 0 && "Invalid number of NOP bytes requested!");15601561// Scan ahead to trim the shadow.1562const MachineBasicBlock &MBB = *MI.getParent();1563MachineBasicBlock::const_iterator MII(MI);1564++MII;1565while (NumNOPBytes > 0) {1566if (MII == MBB.end() || MII->isCall() ||1567MII->getOpcode() == AArch64::DBG_VALUE ||1568MII->getOpcode() == TargetOpcode::PATCHPOINT ||1569MII->getOpcode() == TargetOpcode::STACKMAP)1570break;1571++MII;1572NumNOPBytes -= 4;1573}15741575// Emit nops.1576for (unsigned i = 0; i < NumNOPBytes; i += 4)1577EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::HINT).addImm(0));1578}15791580// Lower a patchpoint of the form:1581// [<def>], <id>, <numBytes>, <target>, <numArgs>1582void AArch64AsmPrinter::LowerPATCHPOINT(MCStreamer &OutStreamer, StackMaps &SM,1583const MachineInstr &MI) {1584auto &Ctx = OutStreamer.getContext();1585MCSymbol *MILabel = Ctx.createTempSymbol();1586OutStreamer.emitLabel(MILabel);1587SM.recordPatchPoint(*MILabel, MI);15881589PatchPointOpers Opers(&MI);15901591int64_t CallTarget = Opers.getCallTarget().getImm();1592unsigned EncodedBytes = 0;1593if (CallTarget) {1594assert((CallTarget & 0xFFFFFFFFFFFF) == CallTarget &&1595"High 16 bits of call target should be zero.");1596Register ScratchReg = MI.getOperand(Opers.getNextScratchIdx()).getReg();1597EncodedBytes = 16;1598// Materialize the jump address:1599EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::MOVZXi)1600.addReg(ScratchReg)1601.addImm((CallTarget >> 32) & 0xFFFF)1602.addImm(32));1603EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::MOVKXi)1604.addReg(ScratchReg)1605.addReg(ScratchReg)1606.addImm((CallTarget >> 16) & 0xFFFF)1607.addImm(16));1608EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::MOVKXi)1609.addReg(ScratchReg)1610.addReg(ScratchReg)1611.addImm(CallTarget & 0xFFFF)1612.addImm(0));1613EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::BLR).addReg(ScratchReg));1614}1615// Emit padding.1616unsigned NumBytes = Opers.getNumPatchBytes();1617assert(NumBytes >= EncodedBytes &&1618"Patchpoint can't request size less than the length of a call.");1619assert((NumBytes - EncodedBytes) % 4 == 0 &&1620"Invalid number of NOP bytes requested!");1621for (unsigned i = EncodedBytes; i < NumBytes; i += 4)1622EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::HINT).addImm(0));1623}16241625void AArch64AsmPrinter::LowerSTATEPOINT(MCStreamer &OutStreamer, StackMaps &SM,1626const MachineInstr &MI) {1627StatepointOpers SOpers(&MI);1628if (unsigned PatchBytes = SOpers.getNumPatchBytes()) {1629assert(PatchBytes % 4 == 0 && "Invalid number of NOP bytes requested!");1630for (unsigned i = 0; i < PatchBytes; i += 4)1631EmitToStreamer(OutStreamer, MCInstBuilder(AArch64::HINT).addImm(0));1632} else {1633// Lower call target and choose correct opcode1634const MachineOperand &CallTarget = SOpers.getCallTarget();1635MCOperand CallTargetMCOp;1636unsigned CallOpcode;1637switch (CallTarget.getType()) {1638case MachineOperand::MO_GlobalAddress:1639case MachineOperand::MO_ExternalSymbol:1640MCInstLowering.lowerOperand(CallTarget, CallTargetMCOp);1641CallOpcode = AArch64::BL;1642break;1643case MachineOperand::MO_Immediate:1644CallTargetMCOp = MCOperand::createImm(CallTarget.getImm());1645CallOpcode = AArch64::BL;1646break;1647case MachineOperand::MO_Register:1648CallTargetMCOp = MCOperand::createReg(CallTarget.getReg());1649CallOpcode = AArch64::BLR;1650break;1651default:1652llvm_unreachable("Unsupported operand type in statepoint call target");1653break;1654}16551656EmitToStreamer(OutStreamer,1657MCInstBuilder(CallOpcode).addOperand(CallTargetMCOp));1658}16591660auto &Ctx = OutStreamer.getContext();1661MCSymbol *MILabel = Ctx.createTempSymbol();1662OutStreamer.emitLabel(MILabel);1663SM.recordStatepoint(*MILabel, MI);1664}16651666void AArch64AsmPrinter::LowerFAULTING_OP(const MachineInstr &FaultingMI) {1667// FAULTING_LOAD_OP <def>, <faltinf type>, <MBB handler>,1668// <opcode>, <operands>16691670Register DefRegister = FaultingMI.getOperand(0).getReg();1671FaultMaps::FaultKind FK =1672static_cast<FaultMaps::FaultKind>(FaultingMI.getOperand(1).getImm());1673MCSymbol *HandlerLabel = FaultingMI.getOperand(2).getMBB()->getSymbol();1674unsigned Opcode = FaultingMI.getOperand(3).getImm();1675unsigned OperandsBeginIdx = 4;16761677auto &Ctx = OutStreamer->getContext();1678MCSymbol *FaultingLabel = Ctx.createTempSymbol();1679OutStreamer->emitLabel(FaultingLabel);16801681assert(FK < FaultMaps::FaultKindMax && "Invalid Faulting Kind!");1682FM.recordFaultingOp(FK, FaultingLabel, HandlerLabel);16831684MCInst MI;1685MI.setOpcode(Opcode);16861687if (DefRegister != (Register)0)1688MI.addOperand(MCOperand::createReg(DefRegister));16891690for (const MachineOperand &MO :1691llvm::drop_begin(FaultingMI.operands(), OperandsBeginIdx)) {1692MCOperand Dest;1693lowerOperand(MO, Dest);1694MI.addOperand(Dest);1695}16961697OutStreamer->AddComment("on-fault: " + HandlerLabel->getName());1698OutStreamer->emitInstruction(MI, getSubtargetInfo());1699}17001701void AArch64AsmPrinter::emitFMov0(const MachineInstr &MI) {1702Register DestReg = MI.getOperand(0).getReg();1703if (STI->hasZeroCycleZeroingFP() && !STI->hasZeroCycleZeroingFPWorkaround() &&1704STI->isNeonAvailable()) {1705// Convert H/S register to corresponding D register1706if (AArch64::H0 <= DestReg && DestReg <= AArch64::H31)1707DestReg = AArch64::D0 + (DestReg - AArch64::H0);1708else if (AArch64::S0 <= DestReg && DestReg <= AArch64::S31)1709DestReg = AArch64::D0 + (DestReg - AArch64::S0);1710else1711assert(AArch64::D0 <= DestReg && DestReg <= AArch64::D31);17121713MCInst MOVI;1714MOVI.setOpcode(AArch64::MOVID);1715MOVI.addOperand(MCOperand::createReg(DestReg));1716MOVI.addOperand(MCOperand::createImm(0));1717EmitToStreamer(*OutStreamer, MOVI);1718} else {1719MCInst FMov;1720switch (MI.getOpcode()) {1721default: llvm_unreachable("Unexpected opcode");1722case AArch64::FMOVH0:1723FMov.setOpcode(STI->hasFullFP16() ? AArch64::FMOVWHr : AArch64::FMOVWSr);1724if (!STI->hasFullFP16())1725DestReg = (AArch64::S0 + (DestReg - AArch64::H0));1726FMov.addOperand(MCOperand::createReg(DestReg));1727FMov.addOperand(MCOperand::createReg(AArch64::WZR));1728break;1729case AArch64::FMOVS0:1730FMov.setOpcode(AArch64::FMOVWSr);1731FMov.addOperand(MCOperand::createReg(DestReg));1732FMov.addOperand(MCOperand::createReg(AArch64::WZR));1733break;1734case AArch64::FMOVD0:1735FMov.setOpcode(AArch64::FMOVXDr);1736FMov.addOperand(MCOperand::createReg(DestReg));1737FMov.addOperand(MCOperand::createReg(AArch64::XZR));1738break;1739}1740EmitToStreamer(*OutStreamer, FMov);1741}1742}17431744unsigned AArch64AsmPrinter::emitPtrauthDiscriminator(uint16_t Disc,1745unsigned AddrDisc,1746unsigned &InstsEmitted) {1747// So far we've used NoRegister in pseudos. Now we need real encodings.1748if (AddrDisc == AArch64::NoRegister)1749AddrDisc = AArch64::XZR;17501751// If there is no constant discriminator, there's no blend involved:1752// just use the address discriminator register as-is (XZR or not).1753if (!Disc)1754return AddrDisc;17551756// If there's only a constant discriminator, MOV it into x17.1757if (AddrDisc == AArch64::XZR) {1758EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::MOVZXi)1759.addReg(AArch64::X17)1760.addImm(Disc)1761.addImm(/*shift=*/0));1762++InstsEmitted;1763return AArch64::X17;1764}17651766// If there are both, emit a blend into x17.1767EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ORRXrs)1768.addReg(AArch64::X17)1769.addReg(AArch64::XZR)1770.addReg(AddrDisc)1771.addImm(0));1772++InstsEmitted;1773EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::MOVKXi)1774.addReg(AArch64::X17)1775.addReg(AArch64::X17)1776.addImm(Disc)1777.addImm(/*shift=*/48));1778++InstsEmitted;1779return AArch64::X17;1780}17811782void AArch64AsmPrinter::emitPtrauthAuthResign(const MachineInstr *MI) {1783unsigned InstsEmitted = 0;1784const bool IsAUTPAC = MI->getOpcode() == AArch64::AUTPAC;17851786// We can expand AUT/AUTPAC into 3 possible sequences:1787// - unchecked:1788// autia x16, x01789// pacib x16, x1 ; if AUTPAC1790//1791// - checked and clearing:1792// mov x17, x01793// movk x17, #disc, lsl #481794// autia x16, x171795// mov x17, x161796// xpaci x171797// cmp x16, x171798// b.eq Lsuccess1799// mov x16, x171800// b Lend1801// Lsuccess:1802// mov x17, x11803// movk x17, #disc, lsl #481804// pacib x16, x171805// Lend:1806// Where we only emit the AUT if we started with an AUT.1807//1808// - checked and trapping:1809// mov x17, x01810// movk x17, #disc, lsl #481811// autia x16, x01812// mov x17, x161813// xpaci x171814// cmp x16, x171815// b.eq Lsuccess1816// brk #<0xc470 + aut key>1817// Lsuccess:1818// mov x17, x11819// movk x17, #disc, lsl #481820// pacib x16, x17 ; if AUTPAC1821// Where the b.eq skips over the trap if the PAC is valid.1822//1823// This sequence is expensive, but we need more information to be able to1824// do better.1825//1826// We can't TBZ the poison bit because EnhancedPAC2 XORs the PAC bits1827// on failure.1828// We can't TST the PAC bits because we don't always know how the address1829// space is setup for the target environment (and the bottom PAC bit is1830// based on that).1831// Either way, we also don't always know whether TBI is enabled or not for1832// the specific target environment.18331834// By default, auth/resign sequences check for auth failures.1835bool ShouldCheck = true;1836// In the checked sequence, we only trap if explicitly requested.1837bool ShouldTrap = MF->getFunction().hasFnAttribute("ptrauth-auth-traps");18381839// On an FPAC CPU, you get traps whether you want them or not: there's1840// no point in emitting checks or traps.1841if (STI->hasFPAC())1842ShouldCheck = ShouldTrap = false;18431844// However, command-line flags can override this, for experimentation.1845switch (PtrauthAuthChecks) {1846case PtrauthCheckMode::Default:1847break;1848case PtrauthCheckMode::Unchecked:1849ShouldCheck = ShouldTrap = false;1850break;1851case PtrauthCheckMode::Poison:1852ShouldCheck = true;1853ShouldTrap = false;1854break;1855case PtrauthCheckMode::Trap:1856ShouldCheck = ShouldTrap = true;1857break;1858}18591860auto AUTKey = (AArch64PACKey::ID)MI->getOperand(0).getImm();1861uint64_t AUTDisc = MI->getOperand(1).getImm();1862unsigned AUTAddrDisc = MI->getOperand(2).getReg();18631864unsigned XPACOpc = getXPACOpcodeForKey(AUTKey);18651866// Compute aut discriminator into x171867assert(isUInt<16>(AUTDisc));1868unsigned AUTDiscReg =1869emitPtrauthDiscriminator(AUTDisc, AUTAddrDisc, InstsEmitted);1870bool AUTZero = AUTDiscReg == AArch64::XZR;1871unsigned AUTOpc = getAUTOpcodeForKey(AUTKey, AUTZero);18721873// autiza x16 ; if AUTZero1874// autia x16, x17 ; if !AUTZero1875MCInst AUTInst;1876AUTInst.setOpcode(AUTOpc);1877AUTInst.addOperand(MCOperand::createReg(AArch64::X16));1878AUTInst.addOperand(MCOperand::createReg(AArch64::X16));1879if (!AUTZero)1880AUTInst.addOperand(MCOperand::createReg(AUTDiscReg));1881EmitToStreamer(*OutStreamer, AUTInst);1882++InstsEmitted;18831884// Unchecked or checked-but-non-trapping AUT is just an "AUT": we're done.1885if (!IsAUTPAC && (!ShouldCheck || !ShouldTrap)) {1886assert(STI->getInstrInfo()->getInstSizeInBytes(*MI) >= InstsEmitted * 4);1887return;1888}18891890MCSymbol *EndSym = nullptr;18911892// Checked sequences do an additional strip-and-compare.1893if (ShouldCheck) {1894MCSymbol *SuccessSym = createTempSymbol("auth_success_");18951896// XPAC has tied src/dst: use x17 as a temporary copy.1897// mov x17, x161898EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ORRXrs)1899.addReg(AArch64::X17)1900.addReg(AArch64::XZR)1901.addReg(AArch64::X16)1902.addImm(0));1903++InstsEmitted;19041905// xpaci x171906EmitToStreamer(1907*OutStreamer,1908MCInstBuilder(XPACOpc).addReg(AArch64::X17).addReg(AArch64::X17));1909++InstsEmitted;19101911// cmp x16, x171912EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::SUBSXrs)1913.addReg(AArch64::XZR)1914.addReg(AArch64::X16)1915.addReg(AArch64::X17)1916.addImm(0));1917++InstsEmitted;19181919// b.eq Lsuccess1920EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::Bcc)1921.addImm(AArch64CC::EQ)1922.addExpr(MCSymbolRefExpr::create(1923SuccessSym, OutContext)));1924++InstsEmitted;19251926if (ShouldTrap) {1927// Trapping sequences do a 'brk'.1928// brk #<0xc470 + aut key>1929EmitToStreamer(*OutStreamer,1930MCInstBuilder(AArch64::BRK).addImm(0xc470 | AUTKey));1931++InstsEmitted;1932} else {1933// Non-trapping checked sequences return the stripped result in x16,1934// skipping over the PAC if there is one.19351936// FIXME: can we simply return the AUT result, already in x16? without..1937// ..traps this is usable as an oracle anyway, based on high bits1938// mov x17, x161939EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ORRXrs)1940.addReg(AArch64::X16)1941.addReg(AArch64::XZR)1942.addReg(AArch64::X17)1943.addImm(0));1944++InstsEmitted;19451946if (IsAUTPAC) {1947EndSym = createTempSymbol("resign_end_");19481949// b Lend1950EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::B)1951.addExpr(MCSymbolRefExpr::create(1952EndSym, OutContext)));1953++InstsEmitted;1954}1955}19561957// If the auth check succeeds, we can continue.1958// Lsuccess:1959OutStreamer->emitLabel(SuccessSym);1960}19611962// We already emitted unchecked and checked-but-non-trapping AUTs.1963// That left us with trapping AUTs, and AUTPACs.1964// Trapping AUTs don't need PAC: we're done.1965if (!IsAUTPAC) {1966assert(STI->getInstrInfo()->getInstSizeInBytes(*MI) >= InstsEmitted * 4);1967return;1968}19691970auto PACKey = (AArch64PACKey::ID)MI->getOperand(3).getImm();1971uint64_t PACDisc = MI->getOperand(4).getImm();1972unsigned PACAddrDisc = MI->getOperand(5).getReg();19731974// Compute pac discriminator into x171975assert(isUInt<16>(PACDisc));1976unsigned PACDiscReg =1977emitPtrauthDiscriminator(PACDisc, PACAddrDisc, InstsEmitted);1978bool PACZero = PACDiscReg == AArch64::XZR;1979unsigned PACOpc = getPACOpcodeForKey(PACKey, PACZero);19801981// pacizb x16 ; if PACZero1982// pacib x16, x17 ; if !PACZero1983MCInst PACInst;1984PACInst.setOpcode(PACOpc);1985PACInst.addOperand(MCOperand::createReg(AArch64::X16));1986PACInst.addOperand(MCOperand::createReg(AArch64::X16));1987if (!PACZero)1988PACInst.addOperand(MCOperand::createReg(PACDiscReg));1989EmitToStreamer(*OutStreamer, PACInst);1990++InstsEmitted;19911992assert(STI->getInstrInfo()->getInstSizeInBytes(*MI) >= InstsEmitted * 4);1993// Lend:1994if (EndSym)1995OutStreamer->emitLabel(EndSym);1996}19971998void AArch64AsmPrinter::emitPtrauthBranch(const MachineInstr *MI) {1999unsigned InstsEmitted = 0;2000bool IsCall = MI->getOpcode() == AArch64::BLRA;2001unsigned BrTarget = MI->getOperand(0).getReg();20022003auto Key = (AArch64PACKey::ID)MI->getOperand(1).getImm();2004assert((Key == AArch64PACKey::IA || Key == AArch64PACKey::IB) &&2005"Invalid auth call key");20062007uint64_t Disc = MI->getOperand(2).getImm();2008assert(isUInt<16>(Disc));20092010unsigned AddrDisc = MI->getOperand(3).getReg();20112012// Compute discriminator into x172013unsigned DiscReg = emitPtrauthDiscriminator(Disc, AddrDisc, InstsEmitted);2014bool IsZeroDisc = DiscReg == AArch64::XZR;20152016unsigned Opc;2017if (IsCall) {2018if (Key == AArch64PACKey::IA)2019Opc = IsZeroDisc ? AArch64::BLRAAZ : AArch64::BLRAA;2020else2021Opc = IsZeroDisc ? AArch64::BLRABZ : AArch64::BLRAB;2022} else {2023if (Key == AArch64PACKey::IA)2024Opc = IsZeroDisc ? AArch64::BRAAZ : AArch64::BRAA;2025else2026Opc = IsZeroDisc ? AArch64::BRABZ : AArch64::BRAB;2027}20282029MCInst BRInst;2030BRInst.setOpcode(Opc);2031BRInst.addOperand(MCOperand::createReg(BrTarget));2032if (!IsZeroDisc)2033BRInst.addOperand(MCOperand::createReg(DiscReg));2034EmitToStreamer(*OutStreamer, BRInst);2035++InstsEmitted;20362037assert(STI->getInstrInfo()->getInstSizeInBytes(*MI) >= InstsEmitted * 4);2038}20392040const MCExpr *2041AArch64AsmPrinter::lowerConstantPtrAuth(const ConstantPtrAuth &CPA) {2042MCContext &Ctx = OutContext;20432044// Figure out the base symbol and the addend, if any.2045APInt Offset(64, 0);2046const Value *BaseGV = CPA.getPointer()->stripAndAccumulateConstantOffsets(2047getDataLayout(), Offset, /*AllowNonInbounds=*/true);20482049auto *BaseGVB = dyn_cast<GlobalValue>(BaseGV);20502051// If we can't understand the referenced ConstantExpr, there's nothing2052// else we can do: emit an error.2053if (!BaseGVB) {2054BaseGV->getContext().emitError(2055"cannot resolve target base/addend of ptrauth constant");2056return nullptr;2057}20582059// If there is an addend, turn that into the appropriate MCExpr.2060const MCExpr *Sym = MCSymbolRefExpr::create(getSymbol(BaseGVB), Ctx);2061if (Offset.sgt(0))2062Sym = MCBinaryExpr::createAdd(2063Sym, MCConstantExpr::create(Offset.getSExtValue(), Ctx), Ctx);2064else if (Offset.slt(0))2065Sym = MCBinaryExpr::createSub(2066Sym, MCConstantExpr::create((-Offset).getSExtValue(), Ctx), Ctx);20672068uint64_t KeyID = CPA.getKey()->getZExtValue();2069// We later rely on valid KeyID value in AArch64PACKeyIDToString call from2070// AArch64AuthMCExpr::printImpl, so fail fast.2071if (KeyID > AArch64PACKey::LAST)2072report_fatal_error("AArch64 PAC Key ID '" + Twine(KeyID) +2073"' out of range [0, " +2074Twine((unsigned)AArch64PACKey::LAST) + "]");20752076uint64_t Disc = CPA.getDiscriminator()->getZExtValue();2077if (!isUInt<16>(Disc))2078report_fatal_error("AArch64 PAC Discriminator '" + Twine(Disc) +2079"' out of range [0, 0xFFFF]");20802081// Finally build the complete @AUTH expr.2082return AArch64AuthMCExpr::create(Sym, Disc, AArch64PACKey::ID(KeyID),2083CPA.hasAddressDiscriminator(), Ctx);2084}20852086void AArch64AsmPrinter::LowerLOADauthptrstatic(const MachineInstr &MI) {2087unsigned DstReg = MI.getOperand(0).getReg();2088const MachineOperand &GAOp = MI.getOperand(1);2089const uint64_t KeyC = MI.getOperand(2).getImm();2090assert(KeyC <= AArch64PACKey::LAST &&2091"key is out of range [0, AArch64PACKey::LAST]");2092const auto Key = (AArch64PACKey::ID)KeyC;2093const uint64_t Disc = MI.getOperand(3).getImm();2094assert(isUInt<16>(Disc) &&2095"constant discriminator is out of range [0, 0xffff]");20962097// Emit instruction sequence like the following:2098// ADRP x16, symbol$auth_ptr$key$disc2099// LDR x16, [x16, :lo12:symbol$auth_ptr$key$disc]2100//2101// Where the $auth_ptr$ symbol is the stub slot containing the signed pointer2102// to symbol.2103MCSymbol *AuthPtrStubSym;2104if (TM.getTargetTriple().isOSBinFormatELF()) {2105const auto &TLOF =2106static_cast<const AArch64_ELFTargetObjectFile &>(getObjFileLowering());21072108assert(GAOp.getOffset() == 0 &&2109"non-zero offset for $auth_ptr$ stub slots is not supported");2110const MCSymbol *GASym = TM.getSymbol(GAOp.getGlobal());2111AuthPtrStubSym = TLOF.getAuthPtrSlotSymbol(TM, MMI, GASym, Key, Disc);2112} else {2113assert(TM.getTargetTriple().isOSBinFormatMachO() &&2114"LOADauthptrstatic is implemented only for MachO/ELF");21152116const auto &TLOF = static_cast<const AArch64_MachoTargetObjectFile &>(2117getObjFileLowering());21182119assert(GAOp.getOffset() == 0 &&2120"non-zero offset for $auth_ptr$ stub slots is not supported");2121const MCSymbol *GASym = TM.getSymbol(GAOp.getGlobal());2122AuthPtrStubSym = TLOF.getAuthPtrSlotSymbol(TM, MMI, GASym, Key, Disc);2123}21242125MachineOperand StubMOHi =2126MachineOperand::CreateMCSymbol(AuthPtrStubSym, AArch64II::MO_PAGE);2127MachineOperand StubMOLo = MachineOperand::CreateMCSymbol(2128AuthPtrStubSym, AArch64II::MO_PAGEOFF | AArch64II::MO_NC);2129MCOperand StubMCHi, StubMCLo;21302131MCInstLowering.lowerOperand(StubMOHi, StubMCHi);2132MCInstLowering.lowerOperand(StubMOLo, StubMCLo);21332134EmitToStreamer(2135*OutStreamer,2136MCInstBuilder(AArch64::ADRP).addReg(DstReg).addOperand(StubMCHi));21372138EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::LDRXui)2139.addReg(DstReg)2140.addReg(DstReg)2141.addOperand(StubMCLo));2142}21432144void AArch64AsmPrinter::LowerMOVaddrPAC(const MachineInstr &MI) {2145unsigned InstsEmitted = 0;2146auto EmitAndIncrement = [this, &InstsEmitted](const MCInst &Inst) {2147EmitToStreamer(*OutStreamer, Inst);2148++InstsEmitted;2149};21502151const bool IsGOTLoad = MI.getOpcode() == AArch64::LOADgotPAC;2152MachineOperand GAOp = MI.getOperand(0);2153const uint64_t KeyC = MI.getOperand(1).getImm();2154assert(KeyC <= AArch64PACKey::LAST &&2155"key is out of range [0, AArch64PACKey::LAST]");2156const auto Key = (AArch64PACKey::ID)KeyC;2157const unsigned AddrDisc = MI.getOperand(2).getReg();2158const uint64_t Disc = MI.getOperand(3).getImm();2159assert(isUInt<16>(Disc) &&2160"constant discriminator is out of range [0, 0xffff]");21612162const int64_t Offset = GAOp.getOffset();2163GAOp.setOffset(0);21642165// Emit:2166// target materialization:2167// - via GOT:2168// adrp x16, :got:target2169// ldr x16, [x16, :got_lo12:target]2170// add offset to x16 if offset != 02171//2172// - direct:2173// adrp x16, target2174// add x16, x16, :lo12:target2175// add offset to x16 if offset != 02176//2177// add offset to x16:2178// - abs(offset) fits 24 bits:2179// add/sub x16, x16, #<offset>[, #lsl 12] (up to 2 instructions)2180// - abs(offset) does not fit 24 bits:2181// - offset < 0:2182// movn+movk sequence filling x17 register with the offset (up to 42183// instructions)2184// add x16, x16, x172185// - offset > 0:2186// movz+movk sequence filling x17 register with the offset (up to 42187// instructions)2188// add x16, x16, x172189//2190// signing:2191// - 0 discriminator:2192// paciza x162193// - Non-0 discriminator, no address discriminator:2194// mov x17, #Disc2195// pacia x16, x172196// - address discriminator (with potentially folded immediate discriminator):2197// pacia x16, xAddrDisc21982199MachineOperand GAMOHi(GAOp), GAMOLo(GAOp);2200MCOperand GAMCHi, GAMCLo;22012202GAMOHi.setTargetFlags(AArch64II::MO_PAGE);2203GAMOLo.setTargetFlags(AArch64II::MO_PAGEOFF | AArch64II::MO_NC);2204if (IsGOTLoad) {2205GAMOHi.addTargetFlag(AArch64II::MO_GOT);2206GAMOLo.addTargetFlag(AArch64II::MO_GOT);2207}22082209MCInstLowering.lowerOperand(GAMOHi, GAMCHi);2210MCInstLowering.lowerOperand(GAMOLo, GAMCLo);22112212EmitAndIncrement(2213MCInstBuilder(AArch64::ADRP).addReg(AArch64::X16).addOperand(GAMCHi));22142215if (IsGOTLoad) {2216EmitAndIncrement(MCInstBuilder(AArch64::LDRXui)2217.addReg(AArch64::X16)2218.addReg(AArch64::X16)2219.addOperand(GAMCLo));2220} else {2221EmitAndIncrement(MCInstBuilder(AArch64::ADDXri)2222.addReg(AArch64::X16)2223.addReg(AArch64::X16)2224.addOperand(GAMCLo)2225.addImm(0));2226}22272228if (Offset != 0) {2229const uint64_t AbsOffset = (Offset > 0 ? Offset : -((uint64_t)Offset));2230const bool IsNeg = Offset < 0;2231if (isUInt<24>(AbsOffset)) {2232for (int BitPos = 0; BitPos != 24 && (AbsOffset >> BitPos);2233BitPos += 12) {2234EmitAndIncrement(2235MCInstBuilder(IsNeg ? AArch64::SUBXri : AArch64::ADDXri)2236.addReg(AArch64::X16)2237.addReg(AArch64::X16)2238.addImm((AbsOffset >> BitPos) & 0xfff)2239.addImm(AArch64_AM::getShifterImm(AArch64_AM::LSL, BitPos)));2240}2241} else {2242const uint64_t UOffset = Offset;2243EmitAndIncrement(MCInstBuilder(IsNeg ? AArch64::MOVNXi : AArch64::MOVZXi)2244.addReg(AArch64::X17)2245.addImm((IsNeg ? ~UOffset : UOffset) & 0xffff)2246.addImm(/*shift=*/0));2247auto NeedMovk = [IsNeg, UOffset](int BitPos) -> bool {2248assert(BitPos == 16 || BitPos == 32 || BitPos == 48);2249uint64_t Shifted = UOffset >> BitPos;2250if (!IsNeg)2251return Shifted != 0;2252for (int I = 0; I != 64 - BitPos; I += 16)2253if (((Shifted >> I) & 0xffff) != 0xffff)2254return true;2255return false;2256};2257for (int BitPos = 16; BitPos != 64 && NeedMovk(BitPos); BitPos += 16) {2258EmitAndIncrement(MCInstBuilder(AArch64::MOVKXi)2259.addReg(AArch64::X17)2260.addReg(AArch64::X17)2261.addImm((UOffset >> BitPos) & 0xffff)2262.addImm(/*shift=*/BitPos));2263}2264EmitAndIncrement(MCInstBuilder(AArch64::ADDXrs)2265.addReg(AArch64::X16)2266.addReg(AArch64::X16)2267.addReg(AArch64::X17)2268.addImm(/*shift=*/0));2269}2270}22712272unsigned DiscReg = AddrDisc;2273if (Disc != 0) {2274if (AddrDisc != AArch64::XZR) {2275EmitAndIncrement(MCInstBuilder(AArch64::ORRXrs)2276.addReg(AArch64::X17)2277.addReg(AArch64::XZR)2278.addReg(AddrDisc)2279.addImm(0));2280EmitAndIncrement(MCInstBuilder(AArch64::MOVKXi)2281.addReg(AArch64::X17)2282.addReg(AArch64::X17)2283.addImm(Disc)2284.addImm(/*shift=*/48));2285} else {2286EmitAndIncrement(MCInstBuilder(AArch64::MOVZXi)2287.addReg(AArch64::X17)2288.addImm(Disc)2289.addImm(/*shift=*/0));2290}2291DiscReg = AArch64::X17;2292}22932294auto MIB = MCInstBuilder(getPACOpcodeForKey(Key, DiscReg == AArch64::XZR))2295.addReg(AArch64::X16)2296.addReg(AArch64::X16);2297if (DiscReg != AArch64::XZR)2298MIB.addReg(DiscReg);2299EmitAndIncrement(MIB);23002301assert(STI->getInstrInfo()->getInstSizeInBytes(MI) >= InstsEmitted * 4);2302}23032304const MCExpr *2305AArch64AsmPrinter::lowerBlockAddressConstant(const BlockAddress &BA) {2306const MCExpr *BAE = AsmPrinter::lowerBlockAddressConstant(BA);2307const Function &Fn = *BA.getFunction();23082309if (std::optional<uint16_t> BADisc =2310STI->getPtrAuthBlockAddressDiscriminatorIfEnabled(Fn))2311return AArch64AuthMCExpr::create(BAE, *BADisc, AArch64PACKey::IA,2312/*HasAddressDiversity=*/false, OutContext);23132314return BAE;2315}23162317// Simple pseudo-instructions have their lowering (with expansion to real2318// instructions) auto-generated.2319#include "AArch64GenMCPseudoLowering.inc"23202321void AArch64AsmPrinter::emitInstruction(const MachineInstr *MI) {2322AArch64_MC::verifyInstructionPredicates(MI->getOpcode(), STI->getFeatureBits());23232324// Do any auto-generated pseudo lowerings.2325if (emitPseudoExpansionLowering(*OutStreamer, MI))2326return;23272328if (MI->getOpcode() == AArch64::ADRP) {2329for (auto &Opd : MI->operands()) {2330if (Opd.isSymbol() && StringRef(Opd.getSymbolName()) ==2331"swift_async_extendedFramePointerFlags") {2332ShouldEmitWeakSwiftAsyncExtendedFramePointerFlags = true;2333}2334}2335}23362337if (AArch64FI->getLOHRelated().count(MI)) {2338// Generate a label for LOH related instruction2339MCSymbol *LOHLabel = createTempSymbol("loh");2340// Associate the instruction with the label2341LOHInstToLabel[MI] = LOHLabel;2342OutStreamer->emitLabel(LOHLabel);2343}23442345AArch64TargetStreamer *TS =2346static_cast<AArch64TargetStreamer *>(OutStreamer->getTargetStreamer());2347// Do any manual lowerings.2348switch (MI->getOpcode()) {2349default:2350break;2351case AArch64::HINT: {2352// CurrentPatchableFunctionEntrySym can be CurrentFnBegin only for2353// -fpatchable-function-entry=N,0. The entry MBB is guaranteed to be2354// non-empty. If MI is the initial BTI, place the2355// __patchable_function_entries label after BTI.2356if (CurrentPatchableFunctionEntrySym &&2357CurrentPatchableFunctionEntrySym == CurrentFnBegin &&2358MI == &MF->front().front()) {2359int64_t Imm = MI->getOperand(0).getImm();2360if ((Imm & 32) && (Imm & 6)) {2361MCInst Inst;2362MCInstLowering.Lower(MI, Inst);2363EmitToStreamer(*OutStreamer, Inst);2364CurrentPatchableFunctionEntrySym = createTempSymbol("patch");2365OutStreamer->emitLabel(CurrentPatchableFunctionEntrySym);2366return;2367}2368}2369break;2370}2371case AArch64::MOVMCSym: {2372Register DestReg = MI->getOperand(0).getReg();2373const MachineOperand &MO_Sym = MI->getOperand(1);2374MachineOperand Hi_MOSym(MO_Sym), Lo_MOSym(MO_Sym);2375MCOperand Hi_MCSym, Lo_MCSym;23762377Hi_MOSym.setTargetFlags(AArch64II::MO_G1 | AArch64II::MO_S);2378Lo_MOSym.setTargetFlags(AArch64II::MO_G0 | AArch64II::MO_NC);23792380MCInstLowering.lowerOperand(Hi_MOSym, Hi_MCSym);2381MCInstLowering.lowerOperand(Lo_MOSym, Lo_MCSym);23822383MCInst MovZ;2384MovZ.setOpcode(AArch64::MOVZXi);2385MovZ.addOperand(MCOperand::createReg(DestReg));2386MovZ.addOperand(Hi_MCSym);2387MovZ.addOperand(MCOperand::createImm(16));2388EmitToStreamer(*OutStreamer, MovZ);23892390MCInst MovK;2391MovK.setOpcode(AArch64::MOVKXi);2392MovK.addOperand(MCOperand::createReg(DestReg));2393MovK.addOperand(MCOperand::createReg(DestReg));2394MovK.addOperand(Lo_MCSym);2395MovK.addOperand(MCOperand::createImm(0));2396EmitToStreamer(*OutStreamer, MovK);2397return;2398}2399case AArch64::MOVIv2d_ns:2400// It is generally beneficial to rewrite "fmov s0, wzr" to "movi d0, #0".2401// as movi is more efficient across all cores. Newer cores can eliminate2402// fmovs early and there is no difference with movi, but this not true for2403// all implementations.2404//2405// The floating-point version doesn't quite work in rare cases on older2406// CPUs, so on those targets we lower this instruction to movi.16b instead.2407if (STI->hasZeroCycleZeroingFPWorkaround() &&2408MI->getOperand(1).getImm() == 0) {2409MCInst TmpInst;2410TmpInst.setOpcode(AArch64::MOVIv16b_ns);2411TmpInst.addOperand(MCOperand::createReg(MI->getOperand(0).getReg()));2412TmpInst.addOperand(MCOperand::createImm(MI->getOperand(1).getImm()));2413EmitToStreamer(*OutStreamer, TmpInst);2414return;2415}2416break;24172418case AArch64::DBG_VALUE:2419case AArch64::DBG_VALUE_LIST:2420if (isVerbose() && OutStreamer->hasRawTextSupport()) {2421SmallString<128> TmpStr;2422raw_svector_ostream OS(TmpStr);2423PrintDebugValueComment(MI, OS);2424OutStreamer->emitRawText(StringRef(OS.str()));2425}2426return;24272428case AArch64::EMITBKEY: {2429ExceptionHandling ExceptionHandlingType = MAI->getExceptionHandlingType();2430if (ExceptionHandlingType != ExceptionHandling::DwarfCFI &&2431ExceptionHandlingType != ExceptionHandling::ARM)2432return;24332434if (getFunctionCFISectionType(*MF) == CFISection::None)2435return;24362437OutStreamer->emitCFIBKeyFrame();2438return;2439}24402441case AArch64::EMITMTETAGGED: {2442ExceptionHandling ExceptionHandlingType = MAI->getExceptionHandlingType();2443if (ExceptionHandlingType != ExceptionHandling::DwarfCFI &&2444ExceptionHandlingType != ExceptionHandling::ARM)2445return;24462447if (getFunctionCFISectionType(*MF) != CFISection::None)2448OutStreamer->emitCFIMTETaggedFrame();2449return;2450}24512452case AArch64::AUT:2453case AArch64::AUTPAC:2454emitPtrauthAuthResign(MI);2455return;24562457case AArch64::LOADauthptrstatic:2458LowerLOADauthptrstatic(*MI);2459return;24602461case AArch64::LOADgotPAC:2462case AArch64::MOVaddrPAC:2463LowerMOVaddrPAC(*MI);2464return;24652466case AArch64::BRA:2467case AArch64::BLRA:2468emitPtrauthBranch(MI);2469return;24702471// Tail calls use pseudo instructions so they have the proper code-gen2472// attributes (isCall, isReturn, etc.). We lower them to the real2473// instruction here.2474case AArch64::AUTH_TCRETURN:2475case AArch64::AUTH_TCRETURN_BTI: {2476const uint64_t Key = MI->getOperand(2).getImm();2477assert((Key == AArch64PACKey::IA || Key == AArch64PACKey::IB) &&2478"Invalid auth key for tail-call return");24792480const uint64_t Disc = MI->getOperand(3).getImm();2481assert(isUInt<16>(Disc) && "Integer discriminator is too wide");24822483Register AddrDisc = MI->getOperand(4).getReg();24842485Register ScratchReg = MI->getOperand(0).getReg() == AArch64::X162486? AArch64::X172487: AArch64::X16;24882489unsigned DiscReg = AddrDisc;2490if (Disc) {2491if (AddrDisc != AArch64::NoRegister) {2492EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::ORRXrs)2493.addReg(ScratchReg)2494.addReg(AArch64::XZR)2495.addReg(AddrDisc)2496.addImm(0));2497EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::MOVKXi)2498.addReg(ScratchReg)2499.addReg(ScratchReg)2500.addImm(Disc)2501.addImm(/*shift=*/48));2502} else {2503EmitToStreamer(*OutStreamer, MCInstBuilder(AArch64::MOVZXi)2504.addReg(ScratchReg)2505.addImm(Disc)2506.addImm(/*shift=*/0));2507}2508DiscReg = ScratchReg;2509}25102511const bool IsZero = DiscReg == AArch64::NoRegister;2512const unsigned Opcodes[2][2] = {{AArch64::BRAA, AArch64::BRAAZ},2513{AArch64::BRAB, AArch64::BRABZ}};25142515MCInst TmpInst;2516TmpInst.setOpcode(Opcodes[Key][IsZero]);2517TmpInst.addOperand(MCOperand::createReg(MI->getOperand(0).getReg()));2518if (!IsZero)2519TmpInst.addOperand(MCOperand::createReg(DiscReg));2520EmitToStreamer(*OutStreamer, TmpInst);2521return;2522}25232524case AArch64::TCRETURNri:2525case AArch64::TCRETURNrix16x17:2526case AArch64::TCRETURNrix17:2527case AArch64::TCRETURNrinotx16:2528case AArch64::TCRETURNriALL: {2529MCInst TmpInst;2530TmpInst.setOpcode(AArch64::BR);2531TmpInst.addOperand(MCOperand::createReg(MI->getOperand(0).getReg()));2532EmitToStreamer(*OutStreamer, TmpInst);2533return;2534}2535case AArch64::TCRETURNdi: {2536MCOperand Dest;2537MCInstLowering.lowerOperand(MI->getOperand(0), Dest);2538MCInst TmpInst;2539TmpInst.setOpcode(AArch64::B);2540TmpInst.addOperand(Dest);2541EmitToStreamer(*OutStreamer, TmpInst);2542return;2543}2544case AArch64::SpeculationBarrierISBDSBEndBB: {2545// Print DSB SYS + ISB2546MCInst TmpInstDSB;2547TmpInstDSB.setOpcode(AArch64::DSB);2548TmpInstDSB.addOperand(MCOperand::createImm(0xf));2549EmitToStreamer(*OutStreamer, TmpInstDSB);2550MCInst TmpInstISB;2551TmpInstISB.setOpcode(AArch64::ISB);2552TmpInstISB.addOperand(MCOperand::createImm(0xf));2553EmitToStreamer(*OutStreamer, TmpInstISB);2554return;2555}2556case AArch64::SpeculationBarrierSBEndBB: {2557// Print SB2558MCInst TmpInstSB;2559TmpInstSB.setOpcode(AArch64::SB);2560EmitToStreamer(*OutStreamer, TmpInstSB);2561return;2562}2563case AArch64::TLSDESC_CALLSEQ: {2564/// lower this to:2565/// adrp x0, :tlsdesc:var2566/// ldr x1, [x0, #:tlsdesc_lo12:var]2567/// add x0, x0, #:tlsdesc_lo12:var2568/// .tlsdesccall var2569/// blr x12570/// (TPIDR_EL0 offset now in x0)2571const MachineOperand &MO_Sym = MI->getOperand(0);2572MachineOperand MO_TLSDESC_LO12(MO_Sym), MO_TLSDESC(MO_Sym);2573MCOperand Sym, SymTLSDescLo12, SymTLSDesc;2574MO_TLSDESC_LO12.setTargetFlags(AArch64II::MO_TLS | AArch64II::MO_PAGEOFF);2575MO_TLSDESC.setTargetFlags(AArch64II::MO_TLS | AArch64II::MO_PAGE);2576MCInstLowering.lowerOperand(MO_Sym, Sym);2577MCInstLowering.lowerOperand(MO_TLSDESC_LO12, SymTLSDescLo12);2578MCInstLowering.lowerOperand(MO_TLSDESC, SymTLSDesc);25792580MCInst Adrp;2581Adrp.setOpcode(AArch64::ADRP);2582Adrp.addOperand(MCOperand::createReg(AArch64::X0));2583Adrp.addOperand(SymTLSDesc);2584EmitToStreamer(*OutStreamer, Adrp);25852586MCInst Ldr;2587if (STI->isTargetILP32()) {2588Ldr.setOpcode(AArch64::LDRWui);2589Ldr.addOperand(MCOperand::createReg(AArch64::W1));2590} else {2591Ldr.setOpcode(AArch64::LDRXui);2592Ldr.addOperand(MCOperand::createReg(AArch64::X1));2593}2594Ldr.addOperand(MCOperand::createReg(AArch64::X0));2595Ldr.addOperand(SymTLSDescLo12);2596Ldr.addOperand(MCOperand::createImm(0));2597EmitToStreamer(*OutStreamer, Ldr);25982599MCInst Add;2600if (STI->isTargetILP32()) {2601Add.setOpcode(AArch64::ADDWri);2602Add.addOperand(MCOperand::createReg(AArch64::W0));2603Add.addOperand(MCOperand::createReg(AArch64::W0));2604} else {2605Add.setOpcode(AArch64::ADDXri);2606Add.addOperand(MCOperand::createReg(AArch64::X0));2607Add.addOperand(MCOperand::createReg(AArch64::X0));2608}2609Add.addOperand(SymTLSDescLo12);2610Add.addOperand(MCOperand::createImm(AArch64_AM::getShiftValue(0)));2611EmitToStreamer(*OutStreamer, Add);26122613// Emit a relocation-annotation. This expands to no code, but requests2614// the following instruction gets an R_AARCH64_TLSDESC_CALL.2615MCInst TLSDescCall;2616TLSDescCall.setOpcode(AArch64::TLSDESCCALL);2617TLSDescCall.addOperand(Sym);2618EmitToStreamer(*OutStreamer, TLSDescCall);26192620MCInst Blr;2621Blr.setOpcode(AArch64::BLR);2622Blr.addOperand(MCOperand::createReg(AArch64::X1));2623EmitToStreamer(*OutStreamer, Blr);26242625return;2626}26272628case AArch64::JumpTableDest32:2629case AArch64::JumpTableDest16:2630case AArch64::JumpTableDest8:2631LowerJumpTableDest(*OutStreamer, *MI);2632return;26332634case AArch64::BR_JumpTable:2635LowerHardenedBRJumpTable(*MI);2636return;26372638case AArch64::FMOVH0:2639case AArch64::FMOVS0:2640case AArch64::FMOVD0:2641emitFMov0(*MI);2642return;26432644case AArch64::MOPSMemoryCopyPseudo:2645case AArch64::MOPSMemoryMovePseudo:2646case AArch64::MOPSMemorySetPseudo:2647case AArch64::MOPSMemorySetTaggingPseudo:2648LowerMOPS(*OutStreamer, *MI);2649return;26502651case TargetOpcode::STACKMAP:2652return LowerSTACKMAP(*OutStreamer, SM, *MI);26532654case TargetOpcode::PATCHPOINT:2655return LowerPATCHPOINT(*OutStreamer, SM, *MI);26562657case TargetOpcode::STATEPOINT:2658return LowerSTATEPOINT(*OutStreamer, SM, *MI);26592660case TargetOpcode::FAULTING_OP:2661return LowerFAULTING_OP(*MI);26622663case TargetOpcode::PATCHABLE_FUNCTION_ENTER:2664LowerPATCHABLE_FUNCTION_ENTER(*MI);2665return;26662667case TargetOpcode::PATCHABLE_FUNCTION_EXIT:2668LowerPATCHABLE_FUNCTION_EXIT(*MI);2669return;26702671case TargetOpcode::PATCHABLE_TAIL_CALL:2672LowerPATCHABLE_TAIL_CALL(*MI);2673return;2674case TargetOpcode::PATCHABLE_EVENT_CALL:2675return LowerPATCHABLE_EVENT_CALL(*MI, false);2676case TargetOpcode::PATCHABLE_TYPED_EVENT_CALL:2677return LowerPATCHABLE_EVENT_CALL(*MI, true);26782679case AArch64::KCFI_CHECK:2680LowerKCFI_CHECK(*MI);2681return;26822683case AArch64::HWASAN_CHECK_MEMACCESS:2684case AArch64::HWASAN_CHECK_MEMACCESS_SHORTGRANULES:2685case AArch64::HWASAN_CHECK_MEMACCESS_FIXEDSHADOW:2686case AArch64::HWASAN_CHECK_MEMACCESS_SHORTGRANULES_FIXEDSHADOW:2687LowerHWASAN_CHECK_MEMACCESS(*MI);2688return;26892690case AArch64::SEH_StackAlloc:2691TS->emitARM64WinCFIAllocStack(MI->getOperand(0).getImm());2692return;26932694case AArch64::SEH_SaveFPLR:2695TS->emitARM64WinCFISaveFPLR(MI->getOperand(0).getImm());2696return;26972698case AArch64::SEH_SaveFPLR_X:2699assert(MI->getOperand(0).getImm() < 0 &&2700"Pre increment SEH opcode must have a negative offset");2701TS->emitARM64WinCFISaveFPLRX(-MI->getOperand(0).getImm());2702return;27032704case AArch64::SEH_SaveReg:2705TS->emitARM64WinCFISaveReg(MI->getOperand(0).getImm(),2706MI->getOperand(1).getImm());2707return;27082709case AArch64::SEH_SaveReg_X:2710assert(MI->getOperand(1).getImm() < 0 &&2711"Pre increment SEH opcode must have a negative offset");2712TS->emitARM64WinCFISaveRegX(MI->getOperand(0).getImm(),2713-MI->getOperand(1).getImm());2714return;27152716case AArch64::SEH_SaveRegP:2717if (MI->getOperand(1).getImm() == 30 && MI->getOperand(0).getImm() >= 19 &&2718MI->getOperand(0).getImm() <= 28) {2719assert((MI->getOperand(0).getImm() - 19) % 2 == 0 &&2720"Register paired with LR must be odd");2721TS->emitARM64WinCFISaveLRPair(MI->getOperand(0).getImm(),2722MI->getOperand(2).getImm());2723return;2724}2725assert((MI->getOperand(1).getImm() - MI->getOperand(0).getImm() == 1) &&2726"Non-consecutive registers not allowed for save_regp");2727TS->emitARM64WinCFISaveRegP(MI->getOperand(0).getImm(),2728MI->getOperand(2).getImm());2729return;27302731case AArch64::SEH_SaveRegP_X:2732assert((MI->getOperand(1).getImm() - MI->getOperand(0).getImm() == 1) &&2733"Non-consecutive registers not allowed for save_regp_x");2734assert(MI->getOperand(2).getImm() < 0 &&2735"Pre increment SEH opcode must have a negative offset");2736TS->emitARM64WinCFISaveRegPX(MI->getOperand(0).getImm(),2737-MI->getOperand(2).getImm());2738return;27392740case AArch64::SEH_SaveFReg:2741TS->emitARM64WinCFISaveFReg(MI->getOperand(0).getImm(),2742MI->getOperand(1).getImm());2743return;27442745case AArch64::SEH_SaveFReg_X:2746assert(MI->getOperand(1).getImm() < 0 &&2747"Pre increment SEH opcode must have a negative offset");2748TS->emitARM64WinCFISaveFRegX(MI->getOperand(0).getImm(),2749-MI->getOperand(1).getImm());2750return;27512752case AArch64::SEH_SaveFRegP:2753assert((MI->getOperand(1).getImm() - MI->getOperand(0).getImm() == 1) &&2754"Non-consecutive registers not allowed for save_regp");2755TS->emitARM64WinCFISaveFRegP(MI->getOperand(0).getImm(),2756MI->getOperand(2).getImm());2757return;27582759case AArch64::SEH_SaveFRegP_X:2760assert((MI->getOperand(1).getImm() - MI->getOperand(0).getImm() == 1) &&2761"Non-consecutive registers not allowed for save_regp_x");2762assert(MI->getOperand(2).getImm() < 0 &&2763"Pre increment SEH opcode must have a negative offset");2764TS->emitARM64WinCFISaveFRegPX(MI->getOperand(0).getImm(),2765-MI->getOperand(2).getImm());2766return;27672768case AArch64::SEH_SetFP:2769TS->emitARM64WinCFISetFP();2770return;27712772case AArch64::SEH_AddFP:2773TS->emitARM64WinCFIAddFP(MI->getOperand(0).getImm());2774return;27752776case AArch64::SEH_Nop:2777TS->emitARM64WinCFINop();2778return;27792780case AArch64::SEH_PrologEnd:2781TS->emitARM64WinCFIPrologEnd();2782return;27832784case AArch64::SEH_EpilogStart:2785TS->emitARM64WinCFIEpilogStart();2786return;27872788case AArch64::SEH_EpilogEnd:2789TS->emitARM64WinCFIEpilogEnd();2790return;27912792case AArch64::SEH_PACSignLR:2793TS->emitARM64WinCFIPACSignLR();2794return;27952796case AArch64::SEH_SaveAnyRegQP:2797assert(MI->getOperand(1).getImm() - MI->getOperand(0).getImm() == 1 &&2798"Non-consecutive registers not allowed for save_any_reg");2799assert(MI->getOperand(2).getImm() >= 0 &&2800"SaveAnyRegQP SEH opcode offset must be non-negative");2801assert(MI->getOperand(2).getImm() <= 1008 &&2802"SaveAnyRegQP SEH opcode offset must fit into 6 bits");2803TS->emitARM64WinCFISaveAnyRegQP(MI->getOperand(0).getImm(),2804MI->getOperand(2).getImm());2805return;28062807case AArch64::SEH_SaveAnyRegQPX:2808assert(MI->getOperand(1).getImm() - MI->getOperand(0).getImm() == 1 &&2809"Non-consecutive registers not allowed for save_any_reg");2810assert(MI->getOperand(2).getImm() < 0 &&2811"SaveAnyRegQPX SEH opcode offset must be negative");2812assert(MI->getOperand(2).getImm() >= -1008 &&2813"SaveAnyRegQPX SEH opcode offset must fit into 6 bits");2814TS->emitARM64WinCFISaveAnyRegQPX(MI->getOperand(0).getImm(),2815-MI->getOperand(2).getImm());2816return;2817}28182819// Finally, do the automated lowerings for everything else.2820MCInst TmpInst;2821MCInstLowering.Lower(MI, TmpInst);2822EmitToStreamer(*OutStreamer, TmpInst);2823}28242825void AArch64AsmPrinter::emitMachOIFuncStubBody(Module &M, const GlobalIFunc &GI,2826MCSymbol *LazyPointer) {2827// _ifunc:2828// adrp x16, lazy_pointer@GOTPAGE2829// ldr x16, [x16, lazy_pointer@GOTPAGEOFF]2830// ldr x16, [x16]2831// br x1628322833{2834MCInst Adrp;2835Adrp.setOpcode(AArch64::ADRP);2836Adrp.addOperand(MCOperand::createReg(AArch64::X16));2837MCOperand SymPage;2838MCInstLowering.lowerOperand(2839MachineOperand::CreateMCSymbol(LazyPointer,2840AArch64II::MO_GOT | AArch64II::MO_PAGE),2841SymPage);2842Adrp.addOperand(SymPage);2843OutStreamer->emitInstruction(Adrp, *STI);2844}28452846{2847MCInst Ldr;2848Ldr.setOpcode(AArch64::LDRXui);2849Ldr.addOperand(MCOperand::createReg(AArch64::X16));2850Ldr.addOperand(MCOperand::createReg(AArch64::X16));2851MCOperand SymPageOff;2852MCInstLowering.lowerOperand(2853MachineOperand::CreateMCSymbol(LazyPointer, AArch64II::MO_GOT |2854AArch64II::MO_PAGEOFF),2855SymPageOff);2856Ldr.addOperand(SymPageOff);2857Ldr.addOperand(MCOperand::createImm(0));2858OutStreamer->emitInstruction(Ldr, *STI);2859}28602861OutStreamer->emitInstruction(MCInstBuilder(AArch64::LDRXui)2862.addReg(AArch64::X16)2863.addReg(AArch64::X16)2864.addImm(0),2865*STI);28662867OutStreamer->emitInstruction(MCInstBuilder(TM.getTargetTriple().isArm64e()2868? AArch64::BRAAZ2869: AArch64::BR)2870.addReg(AArch64::X16),2871*STI);2872}28732874void AArch64AsmPrinter::emitMachOIFuncStubHelperBody(Module &M,2875const GlobalIFunc &GI,2876MCSymbol *LazyPointer) {2877// These stub helpers are only ever called once, so here we're optimizing for2878// minimum size by using the pre-indexed store variants, which saves a few2879// bytes of instructions to bump & restore sp.28802881// _ifunc.stub_helper:2882// stp fp, lr, [sp, #-16]!2883// mov fp, sp2884// stp x1, x0, [sp, #-16]!2885// stp x3, x2, [sp, #-16]!2886// stp x5, x4, [sp, #-16]!2887// stp x7, x6, [sp, #-16]!2888// stp d1, d0, [sp, #-16]!2889// stp d3, d2, [sp, #-16]!2890// stp d5, d4, [sp, #-16]!2891// stp d7, d6, [sp, #-16]!2892// bl _resolver2893// adrp x16, lazy_pointer@GOTPAGE2894// ldr x16, [x16, lazy_pointer@GOTPAGEOFF]2895// str x0, [x16]2896// mov x16, x02897// ldp d7, d6, [sp], #162898// ldp d5, d4, [sp], #162899// ldp d3, d2, [sp], #162900// ldp d1, d0, [sp], #162901// ldp x7, x6, [sp], #162902// ldp x5, x4, [sp], #162903// ldp x3, x2, [sp], #162904// ldp x1, x0, [sp], #162905// ldp fp, lr, [sp], #162906// br x1629072908OutStreamer->emitInstruction(MCInstBuilder(AArch64::STPXpre)2909.addReg(AArch64::SP)2910.addReg(AArch64::FP)2911.addReg(AArch64::LR)2912.addReg(AArch64::SP)2913.addImm(-2),2914*STI);29152916OutStreamer->emitInstruction(MCInstBuilder(AArch64::ADDXri)2917.addReg(AArch64::FP)2918.addReg(AArch64::SP)2919.addImm(0)2920.addImm(0),2921*STI);29222923for (int I = 0; I != 4; ++I)2924OutStreamer->emitInstruction(MCInstBuilder(AArch64::STPXpre)2925.addReg(AArch64::SP)2926.addReg(AArch64::X1 + 2 * I)2927.addReg(AArch64::X0 + 2 * I)2928.addReg(AArch64::SP)2929.addImm(-2),2930*STI);29312932for (int I = 0; I != 4; ++I)2933OutStreamer->emitInstruction(MCInstBuilder(AArch64::STPDpre)2934.addReg(AArch64::SP)2935.addReg(AArch64::D1 + 2 * I)2936.addReg(AArch64::D0 + 2 * I)2937.addReg(AArch64::SP)2938.addImm(-2),2939*STI);29402941OutStreamer->emitInstruction(2942MCInstBuilder(AArch64::BL)2943.addOperand(MCOperand::createExpr(lowerConstant(GI.getResolver()))),2944*STI);29452946{2947MCInst Adrp;2948Adrp.setOpcode(AArch64::ADRP);2949Adrp.addOperand(MCOperand::createReg(AArch64::X16));2950MCOperand SymPage;2951MCInstLowering.lowerOperand(2952MachineOperand::CreateES(LazyPointer->getName().data() + 1,2953AArch64II::MO_GOT | AArch64II::MO_PAGE),2954SymPage);2955Adrp.addOperand(SymPage);2956OutStreamer->emitInstruction(Adrp, *STI);2957}29582959{2960MCInst Ldr;2961Ldr.setOpcode(AArch64::LDRXui);2962Ldr.addOperand(MCOperand::createReg(AArch64::X16));2963Ldr.addOperand(MCOperand::createReg(AArch64::X16));2964MCOperand SymPageOff;2965MCInstLowering.lowerOperand(2966MachineOperand::CreateES(LazyPointer->getName().data() + 1,2967AArch64II::MO_GOT | AArch64II::MO_PAGEOFF),2968SymPageOff);2969Ldr.addOperand(SymPageOff);2970Ldr.addOperand(MCOperand::createImm(0));2971OutStreamer->emitInstruction(Ldr, *STI);2972}29732974OutStreamer->emitInstruction(MCInstBuilder(AArch64::STRXui)2975.addReg(AArch64::X0)2976.addReg(AArch64::X16)2977.addImm(0),2978*STI);29792980OutStreamer->emitInstruction(MCInstBuilder(AArch64::ADDXri)2981.addReg(AArch64::X16)2982.addReg(AArch64::X0)2983.addImm(0)2984.addImm(0),2985*STI);29862987for (int I = 3; I != -1; --I)2988OutStreamer->emitInstruction(MCInstBuilder(AArch64::LDPDpost)2989.addReg(AArch64::SP)2990.addReg(AArch64::D1 + 2 * I)2991.addReg(AArch64::D0 + 2 * I)2992.addReg(AArch64::SP)2993.addImm(2),2994*STI);29952996for (int I = 3; I != -1; --I)2997OutStreamer->emitInstruction(MCInstBuilder(AArch64::LDPXpost)2998.addReg(AArch64::SP)2999.addReg(AArch64::X1 + 2 * I)3000.addReg(AArch64::X0 + 2 * I)3001.addReg(AArch64::SP)3002.addImm(2),3003*STI);30043005OutStreamer->emitInstruction(MCInstBuilder(AArch64::LDPXpost)3006.addReg(AArch64::SP)3007.addReg(AArch64::FP)3008.addReg(AArch64::LR)3009.addReg(AArch64::SP)3010.addImm(2),3011*STI);30123013OutStreamer->emitInstruction(MCInstBuilder(TM.getTargetTriple().isArm64e()3014? AArch64::BRAAZ3015: AArch64::BR)3016.addReg(AArch64::X16),3017*STI);3018}30193020const MCExpr *AArch64AsmPrinter::lowerConstant(const Constant *CV) {3021if (const GlobalValue *GV = dyn_cast<GlobalValue>(CV)) {3022return MCSymbolRefExpr::create(MCInstLowering.GetGlobalValueSymbol(GV, 0),3023OutContext);3024}30253026return AsmPrinter::lowerConstant(CV);3027}30283029// Force static initialization.3030extern "C" LLVM_EXTERNAL_VISIBILITY void LLVMInitializeAArch64AsmPrinter() {3031RegisterAsmPrinter<AArch64AsmPrinter> X(getTheAArch64leTarget());3032RegisterAsmPrinter<AArch64AsmPrinter> Y(getTheAArch64beTarget());3033RegisterAsmPrinter<AArch64AsmPrinter> Z(getTheARM64Target());3034RegisterAsmPrinter<AArch64AsmPrinter> W(getTheARM64_32Target());3035RegisterAsmPrinter<AArch64AsmPrinter> V(getTheAArch64_32Target());3036}303730383039