1 //===- Relocations.cpp ----------------------------------------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "Relocations.h"
10 #include "ConcatOutputSection.h"
12 #include "SyntheticSections.h"
15 #include "lld/Common/ErrorHandler.h"
19 using namespace lld::macho
;
21 static_assert(sizeof(void *) != 8 || sizeof(Reloc
) == 24,
22 "Try to minimize Reloc's size; we create many instances");
24 InputSection
*Reloc::getReferentInputSection() const {
25 if (const auto *sym
= referent
.dyn_cast
<Symbol
*>()) {
26 if (const auto *d
= dyn_cast
<Defined
>(sym
))
30 return referent
.get
<InputSection
*>();
34 StringRef
Reloc::getReferentString() const {
35 if (auto *isec
= referent
.dyn_cast
<InputSection
*>()) {
36 const auto *cisec
= dyn_cast
<CStringInputSection
>(isec
);
37 assert(cisec
&& "referent must be a CStringInputSection");
38 return cisec
->getStringRefAtOffset(addend
);
41 auto *sym
= dyn_cast
<Defined
>(referent
.get
<Symbol
*>());
42 assert(sym
&& "referent must be a Defined symbol");
44 auto *symIsec
= sym
->isec();
45 auto symOffset
= sym
->value
+ addend
;
47 if (auto *s
= dyn_cast_or_null
<CStringInputSection
>(symIsec
))
48 return s
->getStringRefAtOffset(symOffset
);
50 if (isa
<ConcatInputSection
>(symIsec
)) {
51 auto strData
= symIsec
->data
.slice(symOffset
);
52 const char *pszData
= reinterpret_cast<const char *>(strData
.data());
53 return StringRef(pszData
, strnlen(pszData
, strData
.size()));
56 llvm_unreachable("unknown reference section in getReferentString");
59 bool macho::validateSymbolRelocation(const Symbol
*sym
,
60 const InputSection
*isec
, const Reloc
&r
) {
61 const RelocAttrs
&relocAttrs
= target
->getRelocAttrs(r
.type
);
63 auto message
= [&](const Twine
&diagnostic
) {
65 return (isec
->getLocation(r
.offset
) + ": " + relocAttrs
.name
+
66 " relocation " + diagnostic
)
70 if (relocAttrs
.hasAttr(RelocAttrBits::TLV
) != sym
->isTlv())
71 error(message(Twine("requires that symbol ") + sym
->getName() + " " +
72 (sym
->isTlv() ? "not " : "") + "be thread-local"));
77 // Given an offset in the output buffer, figure out which ConcatInputSection (if
78 // any) maps to it. At the same time, update the offset such that it is relative
79 // to the InputSection rather than to the output buffer.
81 // Obtaining the InputSection allows us to have better error diagnostics.
82 // However, many of our relocation-handling methods do not take the InputSection
83 // as a parameter. Since we are already passing the buffer offsets to our Target
84 // methods, this function allows us to emit better errors without threading an
85 // additional InputSection argument through the call stack.
87 // This is implemented as a slow linear search through OutputSegments,
88 // OutputSections, and finally the InputSections themselves. However, this
89 // function should be called only on error paths, so some overhead is fine.
90 InputSection
*macho::offsetToInputSection(uint64_t *off
) {
91 for (OutputSegment
*seg
: outputSegments
) {
92 if (*off
< seg
->fileOff
|| *off
>= seg
->fileOff
+ seg
->fileSize
)
95 const std::vector
<OutputSection
*> §ions
= seg
->getSections();
97 for (; osecIdx
< sections
.size(); ++osecIdx
)
98 if (*off
< sections
[osecIdx
]->fileOff
)
101 // We should be only calling this function on offsets that belong to
102 // ConcatOutputSections.
103 auto *osec
= cast
<ConcatOutputSection
>(sections
[osecIdx
- 1]);
104 *off
-= osec
->fileOff
;
107 for (; isecIdx
< osec
->inputs
.size(); ++isecIdx
) {
108 const ConcatInputSection
*isec
= osec
->inputs
[isecIdx
];
109 if (*off
< isec
->outSecOff
)
113 ConcatInputSection
*isec
= osec
->inputs
[isecIdx
- 1];
114 *off
-= isec
->outSecOff
;
120 void macho::reportRangeError(void *loc
, const Reloc
&r
, const Twine
&v
,
121 uint8_t bits
, int64_t min
, uint64_t max
) {
123 uint64_t off
= reinterpret_cast<const uint8_t *>(loc
) - in
.bufferStart
;
124 const InputSection
*isec
= offsetToInputSection(&off
);
125 std::string locStr
= isec
? isec
->getLocation(off
) : "(invalid location)";
126 if (auto *sym
= r
.referent
.dyn_cast
<Symbol
*>())
127 hint
= "; references " + toString(*sym
);
128 error(locStr
+ ": relocation " + target
->getRelocAttrs(r
.type
).name
+
129 " is out of range: " + v
+ " is not in [" + Twine(min
) + ", " +
130 Twine(max
) + "]" + hint
);
133 void macho::reportRangeError(void *loc
, SymbolDiagnostic d
, const Twine
&v
,
134 uint8_t bits
, int64_t min
, uint64_t max
) {
135 // FIXME: should we use `loc` somehow to provide a better error message?
138 hint
= "; references " + toString(*d
.symbol
);
139 error(d
.reason
+ " is out of range: " + v
+ " is not in [" + Twine(min
) +
140 ", " + Twine(max
) + "]" + hint
);
143 const RelocAttrs
macho::invalidRelocAttrs
{"INVALID", RelocAttrBits::_0
};