1 //===- MCMachOStreamer.cpp - MachO Streamer -------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "llvm/ADT/DenseMap.h"
10 #include "llvm/ADT/SmallString.h"
11 #include "llvm/ADT/SmallVector.h"
12 #include "llvm/ADT/StringRef.h"
13 #include "llvm/ADT/Triple.h"
14 #include "llvm/MC/MCAsmBackend.h"
15 #include "llvm/MC/MCAssembler.h"
16 #include "llvm/MC/MCCodeEmitter.h"
17 #include "llvm/MC/MCContext.h"
18 #include "llvm/MC/MCDirectives.h"
19 #include "llvm/MC/MCExpr.h"
20 #include "llvm/MC/MCFixup.h"
21 #include "llvm/MC/MCFragment.h"
22 #include "llvm/MC/MCInst.h"
23 #include "llvm/MC/MCLinkerOptimizationHint.h"
24 #include "llvm/MC/MCObjectFileInfo.h"
25 #include "llvm/MC/MCObjectStreamer.h"
26 #include "llvm/MC/MCObjectWriter.h"
27 #include "llvm/MC/MCSection.h"
28 #include "llvm/MC/MCSectionMachO.h"
29 #include "llvm/MC/MCStreamer.h"
30 #include "llvm/MC/MCSymbol.h"
31 #include "llvm/MC/MCSymbolMachO.h"
32 #include "llvm/MC/MCValue.h"
33 #include "llvm/Support/Casting.h"
34 #include "llvm/Support/ErrorHandling.h"
35 #include "llvm/Support/TargetRegistry.h"
36 #include "llvm/Support/raw_ostream.h"
44 class MCMachOStreamer
: public MCObjectStreamer
{
46 /// LabelSections - true if each section change should emit a linker local
47 /// label for use in relocations for assembler local references. Obviates the
48 /// need for local relocations. False by default.
51 bool DWARFMustBeAtTheEnd
;
52 bool CreatedADWARFSection
;
54 /// HasSectionLabel - map of which sections have already had a non-local
55 /// label emitted to them. Used so we don't emit extraneous linker local
56 /// labels in the middle of the section.
57 DenseMap
<const MCSection
*, bool> HasSectionLabel
;
59 void emitInstToData(const MCInst
&Inst
, const MCSubtargetInfo
&STI
) override
;
61 void emitDataRegion(DataRegionData::KindTy Kind
);
62 void emitDataRegionEnd();
65 MCMachOStreamer(MCContext
&Context
, std::unique_ptr
<MCAsmBackend
> MAB
,
66 std::unique_ptr
<MCObjectWriter
> OW
,
67 std::unique_ptr
<MCCodeEmitter
> Emitter
,
68 bool DWARFMustBeAtTheEnd
, bool label
)
69 : MCObjectStreamer(Context
, std::move(MAB
), std::move(OW
),
71 LabelSections(label
), DWARFMustBeAtTheEnd(DWARFMustBeAtTheEnd
),
72 CreatedADWARFSection(false) {}
75 void reset() override
{
76 CreatedADWARFSection
= false;
77 HasSectionLabel
.clear();
78 MCObjectStreamer::reset();
81 /// @name MCStreamer Interface
84 void changeSection(MCSection
*Sect
, const MCExpr
*Subsect
) override
;
85 void emitLabel(MCSymbol
*Symbol
, SMLoc Loc
= SMLoc()) override
;
86 void emitAssignment(MCSymbol
*Symbol
, const MCExpr
*Value
) override
;
87 void emitEHSymAttributes(const MCSymbol
*Symbol
, MCSymbol
*EHSymbol
) override
;
88 void emitAssemblerFlag(MCAssemblerFlag Flag
) override
;
89 void emitLinkerOptions(ArrayRef
<std::string
> Options
) override
;
90 void emitDataRegion(MCDataRegionType Kind
) override
;
91 void emitVersionMin(MCVersionMinType Kind
, unsigned Major
, unsigned Minor
,
92 unsigned Update
, VersionTuple SDKVersion
) override
;
93 void emitBuildVersion(unsigned Platform
, unsigned Major
, unsigned Minor
,
94 unsigned Update
, VersionTuple SDKVersion
) override
;
95 void emitThumbFunc(MCSymbol
*Func
) override
;
96 bool emitSymbolAttribute(MCSymbol
*Symbol
, MCSymbolAttr Attribute
) override
;
97 void emitSymbolDesc(MCSymbol
*Symbol
, unsigned DescValue
) override
;
98 void emitCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
99 unsigned ByteAlignment
) override
;
101 void emitLocalCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
102 unsigned ByteAlignment
) override
;
103 void emitZerofill(MCSection
*Section
, MCSymbol
*Symbol
= nullptr,
104 uint64_t Size
= 0, unsigned ByteAlignment
= 0,
105 SMLoc Loc
= SMLoc()) override
;
106 void emitTBSSSymbol(MCSection
*Section
, MCSymbol
*Symbol
, uint64_t Size
,
107 unsigned ByteAlignment
= 0) override
;
109 void emitIdent(StringRef IdentString
) override
{
110 llvm_unreachable("macho doesn't support this directive");
113 void emitLOHDirective(MCLOHType Kind
, const MCLOHArgs
&Args
) override
{
114 getAssembler().getLOHContainer().addDirective(Kind
, Args
);
117 void finishImpl() override
;
120 } // end anonymous namespace.
122 static bool canGoAfterDWARF(const MCSectionMachO
&MSec
) {
123 // These sections are created by the assembler itself after the end of
125 StringRef SegName
= MSec
.getSegmentName();
126 StringRef SecName
= MSec
.getName();
128 if (SegName
== "__LD" && SecName
== "__compact_unwind")
131 if (SegName
== "__IMPORT") {
132 if (SecName
== "__jump_table")
135 if (SecName
== "__pointers")
139 if (SegName
== "__TEXT" && SecName
== "__eh_frame")
142 if (SegName
== "__DATA" && (SecName
== "__nl_symbol_ptr" ||
143 SecName
== "__thread_ptr"))
149 void MCMachOStreamer::changeSection(MCSection
*Section
,
150 const MCExpr
*Subsection
) {
151 // Change the section normally.
152 bool Created
= changeSectionImpl(Section
, Subsection
);
153 const MCSectionMachO
&MSec
= *cast
<MCSectionMachO
>(Section
);
154 StringRef SegName
= MSec
.getSegmentName();
155 if (SegName
== "__DWARF")
156 CreatedADWARFSection
= true;
157 else if (Created
&& DWARFMustBeAtTheEnd
&& !canGoAfterDWARF(MSec
))
158 assert((!CreatedADWARFSection
||
159 Section
== getContext().getObjectFileInfo()->getStackMapSection())
160 && "Creating regular section after DWARF");
162 // Output a linker-local symbol so we don't need section-relative local
163 // relocations. The linker hates us when we do that.
164 if (LabelSections
&& !HasSectionLabel
[Section
] &&
165 !Section
->getBeginSymbol()) {
166 MCSymbol
*Label
= getContext().createLinkerPrivateTempSymbol();
167 Section
->setBeginSymbol(Label
);
168 HasSectionLabel
[Section
] = true;
172 void MCMachOStreamer::emitEHSymAttributes(const MCSymbol
*Symbol
,
173 MCSymbol
*EHSymbol
) {
174 getAssembler().registerSymbol(*Symbol
);
175 if (Symbol
->isExternal())
176 emitSymbolAttribute(EHSymbol
, MCSA_Global
);
177 if (cast
<MCSymbolMachO
>(Symbol
)->isWeakDefinition())
178 emitSymbolAttribute(EHSymbol
, MCSA_WeakDefinition
);
179 if (Symbol
->isPrivateExtern())
180 emitSymbolAttribute(EHSymbol
, MCSA_PrivateExtern
);
183 void MCMachOStreamer::emitLabel(MCSymbol
*Symbol
, SMLoc Loc
) {
184 // We have to create a new fragment if this is an atom defining symbol,
185 // fragments cannot span atoms.
186 if (getAssembler().isSymbolLinkerVisible(*Symbol
))
187 insert(new MCDataFragment());
189 MCObjectStreamer::emitLabel(Symbol
, Loc
);
191 // This causes the reference type flag to be cleared. Darwin 'as' was "trying"
192 // to clear the weak reference and weak definition bits too, but the
193 // implementation was buggy. For now we just try to match 'as', for
196 // FIXME: Cleanup this code, these bits should be emitted based on semantic
197 // properties, not on the order of definition, etc.
198 cast
<MCSymbolMachO
>(Symbol
)->clearReferenceType();
201 void MCMachOStreamer::emitAssignment(MCSymbol
*Symbol
, const MCExpr
*Value
) {
204 if (Value
->evaluateAsRelocatable(Res
, nullptr, nullptr)) {
205 if (const MCSymbolRefExpr
*SymAExpr
= Res
.getSymA()) {
206 const MCSymbol
&SymA
= SymAExpr
->getSymbol();
207 if (!Res
.getSymB() && (SymA
.getName() == "" || Res
.getConstant() != 0))
208 cast
<MCSymbolMachO
>(Symbol
)->setAltEntry();
211 MCObjectStreamer::emitAssignment(Symbol
, Value
);
214 void MCMachOStreamer::emitDataRegion(DataRegionData::KindTy Kind
) {
215 // Create a temporary label to mark the start of the data region.
216 MCSymbol
*Start
= getContext().createTempSymbol();
218 // Record the region for the object writer to use.
219 DataRegionData Data
= { Kind
, Start
, nullptr };
220 std::vector
<DataRegionData
> &Regions
= getAssembler().getDataRegions();
221 Regions
.push_back(Data
);
224 void MCMachOStreamer::emitDataRegionEnd() {
225 std::vector
<DataRegionData
> &Regions
= getAssembler().getDataRegions();
226 assert(!Regions
.empty() && "Mismatched .end_data_region!");
227 DataRegionData
&Data
= Regions
.back();
228 assert(!Data
.End
&& "Mismatched .end_data_region!");
229 // Create a temporary label to mark the end of the data region.
230 Data
.End
= getContext().createTempSymbol();
234 void MCMachOStreamer::emitAssemblerFlag(MCAssemblerFlag Flag
) {
235 // Let the target do whatever target specific stuff it needs to do.
236 getAssembler().getBackend().handleAssemblerFlag(Flag
);
237 // Do any generic stuff we need to do.
239 case MCAF_SyntaxUnified
: return; // no-op here.
240 case MCAF_Code16
: return; // Change parsing mode; no-op here.
241 case MCAF_Code32
: return; // Change parsing mode; no-op here.
242 case MCAF_Code64
: return; // Change parsing mode; no-op here.
243 case MCAF_SubsectionsViaSymbols
:
244 getAssembler().setSubsectionsViaSymbols(true);
249 void MCMachOStreamer::emitLinkerOptions(ArrayRef
<std::string
> Options
) {
250 getAssembler().getLinkerOptions().push_back(Options
);
253 void MCMachOStreamer::emitDataRegion(MCDataRegionType Kind
) {
255 case MCDR_DataRegion
:
256 emitDataRegion(DataRegionData::Data
);
258 case MCDR_DataRegionJT8
:
259 emitDataRegion(DataRegionData::JumpTable8
);
261 case MCDR_DataRegionJT16
:
262 emitDataRegion(DataRegionData::JumpTable16
);
264 case MCDR_DataRegionJT32
:
265 emitDataRegion(DataRegionData::JumpTable32
);
267 case MCDR_DataRegionEnd
:
273 void MCMachOStreamer::emitVersionMin(MCVersionMinType Kind
, unsigned Major
,
274 unsigned Minor
, unsigned Update
,
275 VersionTuple SDKVersion
) {
276 getAssembler().setVersionMin(Kind
, Major
, Minor
, Update
, SDKVersion
);
279 void MCMachOStreamer::emitBuildVersion(unsigned Platform
, unsigned Major
,
280 unsigned Minor
, unsigned Update
,
281 VersionTuple SDKVersion
) {
282 getAssembler().setBuildVersion((MachO::PlatformType
)Platform
, Major
, Minor
,
286 void MCMachOStreamer::emitThumbFunc(MCSymbol
*Symbol
) {
287 // Remember that the function is a thumb function. Fixup and relocation
288 // values will need adjusted.
289 getAssembler().setIsThumbFunc(Symbol
);
290 cast
<MCSymbolMachO
>(Symbol
)->setThumbFunc();
293 bool MCMachOStreamer::emitSymbolAttribute(MCSymbol
*Sym
,
294 MCSymbolAttr Attribute
) {
295 MCSymbolMachO
*Symbol
= cast
<MCSymbolMachO
>(Sym
);
297 // Indirect symbols are handled differently, to match how 'as' handles
298 // them. This makes writing matching .o files easier.
299 if (Attribute
== MCSA_IndirectSymbol
) {
300 // Note that we intentionally cannot use the symbol data here; this is
301 // important for matching the string table that 'as' generates.
302 IndirectSymbolData ISD
;
304 ISD
.Section
= getCurrentSectionOnly();
305 getAssembler().getIndirectSymbols().push_back(ISD
);
309 // Adding a symbol attribute always introduces the symbol, note that an
310 // important side effect of calling registerSymbol here is to register
311 // the symbol with the assembler.
312 getAssembler().registerSymbol(*Symbol
);
314 // The implementation of symbol attributes is designed to match 'as', but it
315 // leaves much to desired. It doesn't really make sense to arbitrarily add and
316 // remove flags, but 'as' allows this (in particular, see .desc).
318 // In the future it might be worth trying to make these operations more well
322 case MCSA_ELF_TypeFunction
:
323 case MCSA_ELF_TypeIndFunction
:
324 case MCSA_ELF_TypeObject
:
325 case MCSA_ELF_TypeTLS
:
326 case MCSA_ELF_TypeCommon
:
327 case MCSA_ELF_TypeNoType
:
328 case MCSA_ELF_TypeGnuUniqueObject
:
331 case MCSA_IndirectSymbol
:
340 Symbol
->setExternal(true);
341 // This effectively clears the undefined lazy bit, in Darwin 'as', although
342 // it isn't very consistent because it implements this as part of symbol
345 // FIXME: Cleanup this code, these bits should be emitted based on semantic
346 // properties, not on the order of definition, etc.
347 Symbol
->setReferenceTypeUndefinedLazy(false);
350 case MCSA_LazyReference
:
351 // FIXME: This requires -dynamic.
352 Symbol
->setNoDeadStrip();
353 if (Symbol
->isUndefined())
354 Symbol
->setReferenceTypeUndefinedLazy(true);
357 // Since .reference sets the no dead strip bit, it is equivalent to
358 // .no_dead_strip in practice.
360 case MCSA_NoDeadStrip
:
361 Symbol
->setNoDeadStrip();
364 case MCSA_SymbolResolver
:
365 Symbol
->setSymbolResolver();
369 Symbol
->setAltEntry();
372 case MCSA_PrivateExtern
:
373 Symbol
->setExternal(true);
374 Symbol
->setPrivateExtern(true);
377 case MCSA_WeakReference
:
378 // FIXME: This requires -dynamic.
379 if (Symbol
->isUndefined())
380 Symbol
->setWeakReference();
383 case MCSA_WeakDefinition
:
384 // FIXME: 'as' enforces that this is defined and global. The manual claims
385 // it has to be in a coalesced section, but this isn't enforced.
386 Symbol
->setWeakDefinition();
389 case MCSA_WeakDefAutoPrivate
:
390 Symbol
->setWeakDefinition();
391 Symbol
->setWeakReference();
402 void MCMachOStreamer::emitSymbolDesc(MCSymbol
*Symbol
, unsigned DescValue
) {
403 // Encode the 'desc' value into the lowest implementation defined bits.
404 getAssembler().registerSymbol(*Symbol
);
405 cast
<MCSymbolMachO
>(Symbol
)->setDesc(DescValue
);
408 void MCMachOStreamer::emitCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
409 unsigned ByteAlignment
) {
410 // FIXME: Darwin 'as' does appear to allow redef of a .comm by itself.
411 assert(Symbol
->isUndefined() && "Cannot define a symbol twice!");
413 getAssembler().registerSymbol(*Symbol
);
414 Symbol
->setExternal(true);
415 Symbol
->setCommon(Size
, ByteAlignment
);
418 void MCMachOStreamer::emitLocalCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
419 unsigned ByteAlignment
) {
420 // '.lcomm' is equivalent to '.zerofill'.
421 return emitZerofill(getContext().getObjectFileInfo()->getDataBSSSection(),
422 Symbol
, Size
, ByteAlignment
);
425 void MCMachOStreamer::emitZerofill(MCSection
*Section
, MCSymbol
*Symbol
,
426 uint64_t Size
, unsigned ByteAlignment
,
428 // On darwin all virtual sections have zerofill type. Disallow the usage of
429 // .zerofill in non-virtual functions. If something similar is needed, use
431 if (!Section
->isVirtualSection()) {
432 getContext().reportError(
433 Loc
, "The usage of .zerofill is restricted to sections of "
434 "ZEROFILL type. Use .zero or .space instead.");
435 return; // Early returning here shouldn't harm. EmitZeros should work on any
440 SwitchSection(Section
);
442 // The symbol may not be present, which only creates the section.
444 emitValueToAlignment(ByteAlignment
, 0, 1, 0);
451 // This should always be called with the thread local bss section. Like the
452 // .zerofill directive this doesn't actually switch sections on us.
453 void MCMachOStreamer::emitTBSSSymbol(MCSection
*Section
, MCSymbol
*Symbol
,
454 uint64_t Size
, unsigned ByteAlignment
) {
455 emitZerofill(Section
, Symbol
, Size
, ByteAlignment
);
458 void MCMachOStreamer::emitInstToData(const MCInst
&Inst
,
459 const MCSubtargetInfo
&STI
) {
460 MCDataFragment
*DF
= getOrCreateDataFragment();
462 SmallVector
<MCFixup
, 4> Fixups
;
463 SmallString
<256> Code
;
464 raw_svector_ostream
VecOS(Code
);
465 getAssembler().getEmitter().encodeInstruction(Inst
, VecOS
, Fixups
, STI
);
467 // Add the fixups and data.
468 for (MCFixup
&Fixup
: Fixups
) {
469 Fixup
.setOffset(Fixup
.getOffset() + DF
->getContents().size());
470 DF
->getFixups().push_back(Fixup
);
472 DF
->setHasInstructions(STI
);
473 DF
->getContents().append(Code
.begin(), Code
.end());
476 void MCMachOStreamer::finishImpl() {
477 emitFrames(&getAssembler().getBackend());
479 // We have to set the fragment atom associations so we can relax properly for
482 // First, scan the symbol table to build a lookup table from fragments to
484 DenseMap
<const MCFragment
*, const MCSymbol
*> DefiningSymbolMap
;
485 for (const MCSymbol
&Symbol
: getAssembler().symbols()) {
486 if (getAssembler().isSymbolLinkerVisible(Symbol
) && Symbol
.isInSection() &&
487 !Symbol
.isVariable()) {
488 // An atom defining symbol should never be internal to a fragment.
489 assert(Symbol
.getOffset() == 0 &&
490 "Invalid offset in atom defining symbol!");
491 DefiningSymbolMap
[Symbol
.getFragment()] = &Symbol
;
495 // Set the fragment atom associations by tracking the last seen atom defining
497 for (MCSection
&Sec
: getAssembler()) {
498 const MCSymbol
*CurrentAtom
= nullptr;
499 for (MCFragment
&Frag
: Sec
) {
500 if (const MCSymbol
*Symbol
= DefiningSymbolMap
.lookup(&Frag
))
501 CurrentAtom
= Symbol
;
502 Frag
.setAtom(CurrentAtom
);
506 this->MCObjectStreamer::finishImpl();
509 MCStreamer
*llvm::createMachOStreamer(MCContext
&Context
,
510 std::unique_ptr
<MCAsmBackend
> &&MAB
,
511 std::unique_ptr
<MCObjectWriter
> &&OW
,
512 std::unique_ptr
<MCCodeEmitter
> &&CE
,
513 bool RelaxAll
, bool DWARFMustBeAtTheEnd
,
514 bool LabelSections
) {
516 new MCMachOStreamer(Context
, std::move(MAB
), std::move(OW
), std::move(CE
),
517 DWARFMustBeAtTheEnd
, LabelSections
);
518 const Triple
&Target
= Context
.getTargetTriple();
519 S
->emitVersionForTarget(Target
, Context
.getObjectFileInfo()->getSDKVersion());
521 S
->getAssembler().setRelaxAll(true);