//===- MCMachOStreamer.cpp - MachO Streamer -------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
#include "llvm/ADT/DenseMap.h"
#include "llvm/ADT/SmallString.h"
#include "llvm/ADT/SmallVector.h"
#include "llvm/ADT/StringRef.h"
#include "llvm/ADT/Triple.h"
#include "llvm/MC/MCAsmBackend.h"
#include "llvm/MC/MCAssembler.h"
#include "llvm/MC/MCCodeEmitter.h"
#include "llvm/MC/MCContext.h"
#include "llvm/MC/MCDirectives.h"
#include "llvm/MC/MCExpr.h"
#include "llvm/MC/MCFixup.h"
#include "llvm/MC/MCFragment.h"
#include "llvm/MC/MCInst.h"
#include "llvm/MC/MCLinkerOptimizationHint.h"
#include "llvm/MC/MCObjectFileInfo.h"
#include "llvm/MC/MCObjectStreamer.h"
#include "llvm/MC/MCObjectWriter.h"
#include "llvm/MC/MCSection.h"
#include "llvm/MC/MCSectionMachO.h"
#include "llvm/MC/MCStreamer.h"
#include "llvm/MC/MCSymbol.h"
#include "llvm/MC/MCSymbolMachO.h"
#include "llvm/MC/MCValue.h"
#include "llvm/Support/Casting.h"
#include "llvm/Support/ErrorHandling.h"
#include "llvm/Support/TargetRegistry.h"
#include "llvm/Support/raw_ostream.h"
#include <cassert>
#include <cstdint>
#include <memory>
#include <string>
#include <utility>
#include <vector>

using namespace llvm;
44 class MCMachOStreamer
: public MCObjectStreamer
{
46 /// LabelSections - true if each section change should emit a linker local
47 /// label for use in relocations for assembler local references. Obviates the
48 /// need for local relocations. False by default.
51 bool DWARFMustBeAtTheEnd
;
52 bool CreatedADWARFSection
;
54 /// HasSectionLabel - map of which sections have already had a non-local
55 /// label emitted to them. Used so we don't emit extraneous linker local
56 /// labels in the middle of the section.
57 DenseMap
<const MCSection
*, bool> HasSectionLabel
;
59 void EmitInstToData(const MCInst
&Inst
, const MCSubtargetInfo
&STI
) override
;
61 void EmitDataRegion(DataRegionData::KindTy Kind
);
62 void EmitDataRegionEnd();
65 MCMachOStreamer(MCContext
&Context
, std::unique_ptr
<MCAsmBackend
> MAB
,
66 std::unique_ptr
<MCObjectWriter
> OW
,
67 std::unique_ptr
<MCCodeEmitter
> Emitter
,
68 bool DWARFMustBeAtTheEnd
, bool label
)
69 : MCObjectStreamer(Context
, std::move(MAB
), std::move(OW
),
71 LabelSections(label
), DWARFMustBeAtTheEnd(DWARFMustBeAtTheEnd
),
72 CreatedADWARFSection(false) {}
75 void reset() override
{
76 CreatedADWARFSection
= false;
77 HasSectionLabel
.clear();
78 MCObjectStreamer::reset();
81 /// @name MCStreamer Interface
84 void ChangeSection(MCSection
*Sect
, const MCExpr
*Subsect
) override
;
85 void EmitLabel(MCSymbol
*Symbol
, SMLoc Loc
= SMLoc()) override
;
86 void EmitAssignment(MCSymbol
*Symbol
, const MCExpr
*Value
) override
;
87 void EmitEHSymAttributes(const MCSymbol
*Symbol
, MCSymbol
*EHSymbol
) override
;
88 void EmitAssemblerFlag(MCAssemblerFlag Flag
) override
;
89 void EmitLinkerOptions(ArrayRef
<std::string
> Options
) override
;
90 void EmitDataRegion(MCDataRegionType Kind
) override
;
91 void EmitVersionMin(MCVersionMinType Kind
, unsigned Major
, unsigned Minor
,
92 unsigned Update
, VersionTuple SDKVersion
) override
;
93 void EmitBuildVersion(unsigned Platform
, unsigned Major
, unsigned Minor
,
94 unsigned Update
, VersionTuple SDKVersion
) override
;
95 void EmitThumbFunc(MCSymbol
*Func
) override
;
96 bool EmitSymbolAttribute(MCSymbol
*Symbol
, MCSymbolAttr Attribute
) override
;
97 void EmitSymbolDesc(MCSymbol
*Symbol
, unsigned DescValue
) override
;
98 void EmitCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
99 unsigned ByteAlignment
) override
;
101 void EmitLocalCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
102 unsigned ByteAlignment
) override
;
103 void EmitZerofill(MCSection
*Section
, MCSymbol
*Symbol
= nullptr,
104 uint64_t Size
= 0, unsigned ByteAlignment
= 0,
105 SMLoc Loc
= SMLoc()) override
;
106 void EmitTBSSSymbol(MCSection
*Section
, MCSymbol
*Symbol
, uint64_t Size
,
107 unsigned ByteAlignment
= 0) override
;
109 void EmitIdent(StringRef IdentString
) override
{
110 llvm_unreachable("macho doesn't support this directive");
113 void EmitLOHDirective(MCLOHType Kind
, const MCLOHArgs
&Args
) override
{
114 getAssembler().getLOHContainer().addDirective(Kind
, Args
);
117 void FinishImpl() override
;
120 } // end anonymous namespace.
122 static bool canGoAfterDWARF(const MCSectionMachO
&MSec
) {
123 // These sections are created by the assembler itself after the end of
125 StringRef SegName
= MSec
.getSegmentName();
126 StringRef SecName
= MSec
.getSectionName();
128 if (SegName
== "__LD" && SecName
== "__compact_unwind")
131 if (SegName
== "__IMPORT") {
132 if (SecName
== "__jump_table")
135 if (SecName
== "__pointers")
139 if (SegName
== "__TEXT" && SecName
== "__eh_frame")
142 if (SegName
== "__DATA" && (SecName
== "__nl_symbol_ptr" ||
143 SecName
== "__thread_ptr"))
149 void MCMachOStreamer::ChangeSection(MCSection
*Section
,
150 const MCExpr
*Subsection
) {
151 // Change the section normally.
152 bool Created
= changeSectionImpl(Section
, Subsection
);
153 const MCSectionMachO
&MSec
= *cast
<MCSectionMachO
>(Section
);
154 StringRef SegName
= MSec
.getSegmentName();
155 if (SegName
== "__DWARF")
156 CreatedADWARFSection
= true;
157 else if (Created
&& DWARFMustBeAtTheEnd
&& !canGoAfterDWARF(MSec
))
158 assert(!CreatedADWARFSection
&& "Creating regular section after DWARF");
160 // Output a linker-local symbol so we don't need section-relative local
161 // relocations. The linker hates us when we do that.
162 if (LabelSections
&& !HasSectionLabel
[Section
] &&
163 !Section
->getBeginSymbol()) {
164 MCSymbol
*Label
= getContext().createLinkerPrivateTempSymbol();
165 Section
->setBeginSymbol(Label
);
166 HasSectionLabel
[Section
] = true;
170 void MCMachOStreamer::EmitEHSymAttributes(const MCSymbol
*Symbol
,
171 MCSymbol
*EHSymbol
) {
172 getAssembler().registerSymbol(*Symbol
);
173 if (Symbol
->isExternal())
174 EmitSymbolAttribute(EHSymbol
, MCSA_Global
);
175 if (cast
<MCSymbolMachO
>(Symbol
)->isWeakDefinition())
176 EmitSymbolAttribute(EHSymbol
, MCSA_WeakDefinition
);
177 if (Symbol
->isPrivateExtern())
178 EmitSymbolAttribute(EHSymbol
, MCSA_PrivateExtern
);
181 void MCMachOStreamer::EmitLabel(MCSymbol
*Symbol
, SMLoc Loc
) {
182 // We have to create a new fragment if this is an atom defining symbol,
183 // fragments cannot span atoms.
184 if (getAssembler().isSymbolLinkerVisible(*Symbol
))
185 insert(new MCDataFragment());
187 MCObjectStreamer::EmitLabel(Symbol
, Loc
);
189 // This causes the reference type flag to be cleared. Darwin 'as' was "trying"
190 // to clear the weak reference and weak definition bits too, but the
191 // implementation was buggy. For now we just try to match 'as', for
194 // FIXME: Cleanup this code, these bits should be emitted based on semantic
195 // properties, not on the order of definition, etc.
196 cast
<MCSymbolMachO
>(Symbol
)->clearReferenceType();
199 void MCMachOStreamer::EmitAssignment(MCSymbol
*Symbol
, const MCExpr
*Value
) {
202 if (Value
->evaluateAsRelocatable(Res
, nullptr, nullptr)) {
203 if (const MCSymbolRefExpr
*SymAExpr
= Res
.getSymA()) {
204 const MCSymbol
&SymA
= SymAExpr
->getSymbol();
205 if (!Res
.getSymB() && (SymA
.getName() == "" || Res
.getConstant() != 0))
206 cast
<MCSymbolMachO
>(Symbol
)->setAltEntry();
209 MCObjectStreamer::EmitAssignment(Symbol
, Value
);
// Private helper: opens a data region of the given kind. It creates a
// temporary start symbol and appends a DataRegionData record {Kind, Start,
// nullptr} to the assembler's data-region list; the null third field is the
// not-yet-known end symbol (EmitDataRegionEnd() asserts on and fills in
// Data.End).
// NOTE(review): this listing jumps from its embedded line 214 to 216 and has
// no closing brace. Nothing visible here places Start into the output stream,
// so a statement is presumably missing -- confirm against the complete file.
212 void MCMachOStreamer::EmitDataRegion(DataRegionData::KindTy Kind
) {
213 // Create a temporary label to mark the start of the data region.
214 MCSymbol
*Start
= getContext().createTempSymbol();
216 // Record the region for the object writer to use.
217 DataRegionData Data
= { Kind
, Start
, nullptr };
218 std::vector
<DataRegionData
> &Regions
= getAssembler().getDataRegions();
219 Regions
.push_back(Data
);
// Private helper: closes the most recently opened data region by storing a
// fresh temporary symbol in its End field. Asserts that a region exists and
// that it has not already been closed.
// NOTE(review): the listing stops after its embedded line 228 (no closing
// brace, and nothing visible places Data.End into the output stream) -- the
// tail of this function is presumably missing; confirm against the complete
// file.
222 void MCMachOStreamer::EmitDataRegionEnd() {
223 std::vector
<DataRegionData
> &Regions
= getAssembler().getDataRegions();
224 assert(!Regions
.empty() && "Mismatched .end_data_region!");
// Only the last recorded region can still be open.
225 DataRegionData
&Data
= Regions
.back();
226 assert(!Data
.End
&& "Mismatched .end_data_region!");
227 // Create a temporary label to mark the end of the data region.
228 Data
.End
= getContext().createTempSymbol();
232 void MCMachOStreamer::EmitAssemblerFlag(MCAssemblerFlag Flag
) {
233 // Let the target do whatever target specific stuff it needs to do.
234 getAssembler().getBackend().handleAssemblerFlag(Flag
);
235 // Do any generic stuff we need to do.
237 case MCAF_SyntaxUnified
: return; // no-op here.
238 case MCAF_Code16
: return; // Change parsing mode; no-op here.
239 case MCAF_Code32
: return; // Change parsing mode; no-op here.
240 case MCAF_Code64
: return; // Change parsing mode; no-op here.
241 case MCAF_SubsectionsViaSymbols
:
242 getAssembler().setSubsectionsViaSymbols(true);
247 void MCMachOStreamer::EmitLinkerOptions(ArrayRef
<std::string
> Options
) {
248 getAssembler().getLinkerOptions().push_back(Options
);
251 void MCMachOStreamer::EmitDataRegion(MCDataRegionType Kind
) {
253 case MCDR_DataRegion
:
254 EmitDataRegion(DataRegionData::Data
);
256 case MCDR_DataRegionJT8
:
257 EmitDataRegion(DataRegionData::JumpTable8
);
259 case MCDR_DataRegionJT16
:
260 EmitDataRegion(DataRegionData::JumpTable16
);
262 case MCDR_DataRegionJT32
:
263 EmitDataRegion(DataRegionData::JumpTable32
);
265 case MCDR_DataRegionEnd
:
271 void MCMachOStreamer::EmitVersionMin(MCVersionMinType Kind
, unsigned Major
,
272 unsigned Minor
, unsigned Update
,
273 VersionTuple SDKVersion
) {
274 getAssembler().setVersionMin(Kind
, Major
, Minor
, Update
, SDKVersion
);
277 void MCMachOStreamer::EmitBuildVersion(unsigned Platform
, unsigned Major
,
278 unsigned Minor
, unsigned Update
,
279 VersionTuple SDKVersion
) {
280 getAssembler().setBuildVersion((MachO::PlatformType
)Platform
, Major
, Minor
,
284 void MCMachOStreamer::EmitThumbFunc(MCSymbol
*Symbol
) {
285 // Remember that the function is a thumb function. Fixup and relocation
286 // values will need adjusted.
287 getAssembler().setIsThumbFunc(Symbol
);
288 cast
<MCSymbolMachO
>(Symbol
)->setThumbFunc();
// Applies a symbol attribute to Sym (viewed as an MCSymbolMachO) and returns a
// bool. MCSA_IndirectSymbol is handled up front by recording an
// IndirectSymbolData entry for the current section; every other attribute
// first registers the symbol with the assembler and is then dispatched by
// case label.
// NOTE(review): this listing has lost many lines of the function -- the
// `switch` header, several case labels, every `break`/`return`, and the
// closing braces (see the gaps in the embedded line numbers). The comments
// added below describe only what is visible; confirm control flow and return
// values against the complete file.
291 bool MCMachOStreamer::EmitSymbolAttribute(MCSymbol
*Sym
,
292 MCSymbolAttr Attribute
) {
293 MCSymbolMachO
*Symbol
= cast
<MCSymbolMachO
>(Sym
);
295 // Indirect symbols are handled differently, to match how 'as' handles
296 // them. This makes writing matching .o files easier.
297 if (Attribute
== MCSA_IndirectSymbol
) {
298 // Note that we intentionally cannot use the symbol data here; this is
299 // important for matching the string table that 'as' generates.
300 IndirectSymbolData ISD
;
// NOTE(review): embedded line 301 is missing; only ISD.Section is visibly
// set before ISD is pushed.
302 ISD
.Section
= getCurrentSectionOnly();
303 getAssembler().getIndirectSymbols().push_back(ISD
);
// NOTE(review): embedded lines 304-306 are missing (end of the `if` block).
307 // Adding a symbol attribute always introduces the symbol, note that an
308 // important side effect of calling registerSymbol here is to register
309 // the symbol with the assembler.
310 getAssembler().registerSymbol(*Symbol
);
312 // The implementation of symbol attributes is designed to match 'as', but it
313 // leaves much to desired. It doesn't really make sense to arbitrarily add and
314 // remove flags, but 'as' allows this (in particular, see .desc).
316 // In the future it might be worth trying to make these operations more well
// NOTE(review): embedded lines 317-319 are missing; the `switch` statement
// that owns the case labels below presumably starts here.
320 case MCSA_ELF_TypeFunction
:
321 case MCSA_ELF_TypeIndFunction
:
322 case MCSA_ELF_TypeObject
:
323 case MCSA_ELF_TypeTLS
:
324 case MCSA_ELF_TypeCommon
:
325 case MCSA_ELF_TypeNoType
:
326 case MCSA_ELF_TypeGnuUniqueObject
:
328 case MCSA_IndirectSymbol
:
// NOTE(review): embedded lines 329-336 are missing; the label that owns the
// two statements below is not visible.
337 Symbol
->setExternal(true);
338 // This effectively clears the undefined lazy bit, in Darwin 'as', although
339 // it isn't very consistent because it implements this as part of symbol
342 // FIXME: Cleanup this code, these bits should be emitted based on semantic
343 // properties, not on the order of definition, etc.
344 Symbol
->setReferenceTypeUndefinedLazy(false);
347 case MCSA_LazyReference
:
348 // FIXME: This requires -dynamic.
349 Symbol
->setNoDeadStrip();
// The lazy-reference bit is only set while the symbol is still undefined.
350 if (Symbol
->isUndefined())
351 Symbol
->setReferenceTypeUndefinedLazy(true);
354 // Since .reference sets the no dead strip bit, it is equivalent to
355 // .no_dead_strip in practice.
357 case MCSA_NoDeadStrip
:
358 Symbol
->setNoDeadStrip();
361 case MCSA_SymbolResolver
:
362 Symbol
->setSymbolResolver();
// NOTE(review): the case label for the setAltEntry() call below (embedded
// line 365) is not visible.
366 Symbol
->setAltEntry();
369 case MCSA_PrivateExtern
:
370 Symbol
->setExternal(true);
371 Symbol
->setPrivateExtern(true);
374 case MCSA_WeakReference
:
375 // FIXME: This requires -dynamic.
376 if (Symbol
->isUndefined())
377 Symbol
->setWeakReference();
380 case MCSA_WeakDefinition
:
381 // FIXME: 'as' enforces that this is defined and global. The manual claims
382 // it has to be in a coalesced section, but this isn't enforced.
383 Symbol
->setWeakDefinition();
386 case MCSA_WeakDefAutoPrivate
:
// Sets both the weak-definition and the weak-reference bit.
387 Symbol
->setWeakDefinition();
388 Symbol
->setWeakReference();
// NOTE(review): embedded lines 389-398 are missing (rest of the switch, the
// final return and the closing brace).
399 void MCMachOStreamer::EmitSymbolDesc(MCSymbol
*Symbol
, unsigned DescValue
) {
400 // Encode the 'desc' value into the lowest implementation defined bits.
401 getAssembler().registerSymbol(*Symbol
);
402 cast
<MCSymbolMachO
>(Symbol
)->setDesc(DescValue
);
405 void MCMachOStreamer::EmitCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
406 unsigned ByteAlignment
) {
407 // FIXME: Darwin 'as' does appear to allow redef of a .comm by itself.
408 assert(Symbol
->isUndefined() && "Cannot define a symbol twice!");
410 getAssembler().registerSymbol(*Symbol
);
411 Symbol
->setExternal(true);
412 Symbol
->setCommon(Size
, ByteAlignment
);
415 void MCMachOStreamer::EmitLocalCommonSymbol(MCSymbol
*Symbol
, uint64_t Size
,
416 unsigned ByteAlignment
) {
417 // '.lcomm' is equivalent to '.zerofill'.
418 return EmitZerofill(getContext().getObjectFileInfo()->getDataBSSSection(),
419 Symbol
, Size
, ByteAlignment
);
// Handles the zerofill request for Section. A section that is not virtual is
// rejected: an error is reported at Loc through the context and the function
// returns early. Otherwise the visible code switches to Section and emits
// alignment padding of ByteAlignment with fill value 0.
// NOTE(review): this listing has lost several lines of the function -- the end
// of the parameter list (embedded line 424; `Loc` is used below but its
// declaration is not visible), the end of the error branch (433-436), the
// guard implied by the "symbol may not be present" comment (440) and
// everything after the alignment call (442-446). Confirm against the complete
// file before relying on this description.
422 void MCMachOStreamer::EmitZerofill(MCSection
*Section
, MCSymbol
*Symbol
,
423 uint64_t Size
, unsigned ByteAlignment
,
425 // On darwin all virtual sections have zerofill type. Disallow the usage of
426 // .zerofill in non-virtual functions. If something similar is needed, use
428 if (!Section
->isVirtualSection()) {
429 getContext().reportError(
430 Loc
, "The usage of .zerofill is restricted to sections of "
431 "ZEROFILL type. Use .zero or .space instead.");
432 return; // Early returning here shouldn't harm. EmitZeros should work on any
437 SwitchSection(Section
);
439 // The symbol may not be present, which only creates the section.
441 EmitValueToAlignment(ByteAlignment
, 0, 1, 0);
448 // This should always be called with the thread local bss section. Like the
449 // .zerofill directive this doesn't actually switch sections on us.
450 void MCMachOStreamer::EmitTBSSSymbol(MCSection
*Section
, MCSymbol
*Symbol
,
451 uint64_t Size
, unsigned ByteAlignment
) {
452 EmitZerofill(Section
, Symbol
, Size
, ByteAlignment
);
455 void MCMachOStreamer::EmitInstToData(const MCInst
&Inst
,
456 const MCSubtargetInfo
&STI
) {
457 MCDataFragment
*DF
= getOrCreateDataFragment();
459 SmallVector
<MCFixup
, 4> Fixups
;
460 SmallString
<256> Code
;
461 raw_svector_ostream
VecOS(Code
);
462 getAssembler().getEmitter().encodeInstruction(Inst
, VecOS
, Fixups
, STI
);
464 // Add the fixups and data.
465 for (MCFixup
&Fixup
: Fixups
) {
466 Fixup
.setOffset(Fixup
.getOffset() + DF
->getContents().size());
467 DF
->getFixups().push_back(Fixup
);
469 DF
->setHasInstructions(STI
);
470 DF
->getContents().append(Code
.begin(), Code
.end());
473 void MCMachOStreamer::FinishImpl() {
474 EmitFrames(&getAssembler().getBackend());
476 // We have to set the fragment atom associations so we can relax properly for
479 // First, scan the symbol table to build a lookup table from fragments to
481 DenseMap
<const MCFragment
*, const MCSymbol
*> DefiningSymbolMap
;
482 for (const MCSymbol
&Symbol
: getAssembler().symbols()) {
483 if (getAssembler().isSymbolLinkerVisible(Symbol
) && Symbol
.isInSection() &&
484 !Symbol
.isVariable()) {
485 // An atom defining symbol should never be internal to a fragment.
486 assert(Symbol
.getOffset() == 0 &&
487 "Invalid offset in atom defining symbol!");
488 DefiningSymbolMap
[Symbol
.getFragment()] = &Symbol
;
492 // Set the fragment atom associations by tracking the last seen atom defining
494 for (MCSection
&Sec
: getAssembler()) {
495 const MCSymbol
*CurrentAtom
= nullptr;
496 for (MCFragment
&Frag
: Sec
) {
497 if (const MCSymbol
*Symbol
= DefiningSymbolMap
.lookup(&Frag
))
498 CurrentAtom
= Symbol
;
499 Frag
.setAtom(CurrentAtom
);
503 this->MCObjectStreamer::FinishImpl();
506 MCStreamer
*llvm::createMachOStreamer(MCContext
&Context
,
507 std::unique_ptr
<MCAsmBackend
> &&MAB
,
508 std::unique_ptr
<MCObjectWriter
> &&OW
,
509 std::unique_ptr
<MCCodeEmitter
> &&CE
,
510 bool RelaxAll
, bool DWARFMustBeAtTheEnd
,
511 bool LabelSections
) {
513 new MCMachOStreamer(Context
, std::move(MAB
), std::move(OW
), std::move(CE
),
514 DWARFMustBeAtTheEnd
, LabelSections
);
515 const Triple
&Target
= Context
.getObjectFileInfo()->getTargetTriple();
516 S
->EmitVersionForTarget(Target
, Context
.getObjectFileInfo()->getSDKVersion());
518 S
->getAssembler().setRelaxAll(true);