1 //===- lib/MC/MCWin64EH.cpp - MCWin64EH implementation --------------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "llvm/MC/MCWin64EH.h"
10 #include "llvm/ADT/Twine.h"
11 #include "llvm/MC/MCContext.h"
12 #include "llvm/MC/MCExpr.h"
13 #include "llvm/MC/MCObjectFileInfo.h"
14 #include "llvm/MC/MCObjectStreamer.h"
15 #include "llvm/MC/MCSectionCOFF.h"
16 #include "llvm/MC/MCStreamer.h"
17 #include "llvm/MC/MCSymbol.h"
18 #include "llvm/Support/Win64EH.h"
22 // NOTE: All relocations generated here are 4-byte image-relative.
24 static uint8_t CountOfUnwindCodes(std::vector
<WinEH::Instruction
> &Insns
) {
26 for (const auto &I
: Insns
) {
27 switch (static_cast<Win64EH::UnwindOpcodes
>(I
.Operation
)) {
29 llvm_unreachable("Unsupported unwind code");
30 case Win64EH::UOP_PushNonVol
:
31 case Win64EH::UOP_AllocSmall
:
32 case Win64EH::UOP_SetFPReg
:
33 case Win64EH::UOP_PushMachFrame
:
36 case Win64EH::UOP_SaveNonVol
:
37 case Win64EH::UOP_SaveXMM128
:
40 case Win64EH::UOP_SaveNonVolBig
:
41 case Win64EH::UOP_SaveXMM128Big
:
44 case Win64EH::UOP_AllocLarge
:
45 Count
+= (I
.Offset
> 512 * 1024 - 8) ? 3 : 2;
52 static void EmitAbsDifference(MCStreamer
&Streamer
, const MCSymbol
*LHS
,
53 const MCSymbol
*RHS
) {
54 MCContext
&Context
= Streamer
.getContext();
56 MCBinaryExpr::createSub(MCSymbolRefExpr::create(LHS
, Context
),
57 MCSymbolRefExpr::create(RHS
, Context
), Context
);
58 Streamer
.emitValue(Diff
, 1);
61 static void EmitUnwindCode(MCStreamer
&streamer
, const MCSymbol
*begin
,
62 WinEH::Instruction
&inst
) {
65 b2
= (inst
.Operation
& 0x0F);
66 switch (static_cast<Win64EH::UnwindOpcodes
>(inst
.Operation
)) {
68 llvm_unreachable("Unsupported unwind code");
69 case Win64EH::UOP_PushNonVol
:
70 EmitAbsDifference(streamer
, inst
.Label
, begin
);
71 b2
|= (inst
.Register
& 0x0F) << 4;
72 streamer
.emitInt8(b2
);
74 case Win64EH::UOP_AllocLarge
:
75 EmitAbsDifference(streamer
, inst
.Label
, begin
);
76 if (inst
.Offset
> 512 * 1024 - 8) {
78 streamer
.emitInt8(b2
);
79 w
= inst
.Offset
& 0xFFF8;
80 streamer
.emitInt16(w
);
81 w
= inst
.Offset
>> 16;
83 streamer
.emitInt8(b2
);
86 streamer
.emitInt16(w
);
88 case Win64EH::UOP_AllocSmall
:
89 b2
|= (((inst
.Offset
- 8) >> 3) & 0x0F) << 4;
90 EmitAbsDifference(streamer
, inst
.Label
, begin
);
91 streamer
.emitInt8(b2
);
93 case Win64EH::UOP_SetFPReg
:
94 EmitAbsDifference(streamer
, inst
.Label
, begin
);
95 streamer
.emitInt8(b2
);
97 case Win64EH::UOP_SaveNonVol
:
98 case Win64EH::UOP_SaveXMM128
:
99 b2
|= (inst
.Register
& 0x0F) << 4;
100 EmitAbsDifference(streamer
, inst
.Label
, begin
);
101 streamer
.emitInt8(b2
);
102 w
= inst
.Offset
>> 3;
103 if (inst
.Operation
== Win64EH::UOP_SaveXMM128
)
105 streamer
.emitInt16(w
);
107 case Win64EH::UOP_SaveNonVolBig
:
108 case Win64EH::UOP_SaveXMM128Big
:
109 b2
|= (inst
.Register
& 0x0F) << 4;
110 EmitAbsDifference(streamer
, inst
.Label
, begin
);
111 streamer
.emitInt8(b2
);
112 if (inst
.Operation
== Win64EH::UOP_SaveXMM128Big
)
113 w
= inst
.Offset
& 0xFFF0;
115 w
= inst
.Offset
& 0xFFF8;
116 streamer
.emitInt16(w
);
117 w
= inst
.Offset
>> 16;
118 streamer
.emitInt16(w
);
120 case Win64EH::UOP_PushMachFrame
:
121 if (inst
.Offset
== 1)
123 EmitAbsDifference(streamer
, inst
.Label
, begin
);
124 streamer
.emitInt8(b2
);
129 static void EmitSymbolRefWithOfs(MCStreamer
&streamer
,
130 const MCSymbol
*Base
,
131 const MCSymbol
*Other
) {
132 MCContext
&Context
= streamer
.getContext();
133 const MCSymbolRefExpr
*BaseRef
= MCSymbolRefExpr::create(Base
, Context
);
134 const MCSymbolRefExpr
*OtherRef
= MCSymbolRefExpr::create(Other
, Context
);
135 const MCExpr
*Ofs
= MCBinaryExpr::createSub(OtherRef
, BaseRef
, Context
);
136 const MCSymbolRefExpr
*BaseRefRel
= MCSymbolRefExpr::create(Base
,
137 MCSymbolRefExpr::VK_COFF_IMGREL32
,
139 streamer
.emitValue(MCBinaryExpr::createAdd(BaseRefRel
, Ofs
, Context
), 4);
142 static void EmitRuntimeFunction(MCStreamer
&streamer
,
143 const WinEH::FrameInfo
*info
) {
144 MCContext
&context
= streamer
.getContext();
146 streamer
.emitValueToAlignment(4);
147 EmitSymbolRefWithOfs(streamer
, info
->Function
, info
->Begin
);
148 EmitSymbolRefWithOfs(streamer
, info
->Function
, info
->End
);
149 streamer
.emitValue(MCSymbolRefExpr::create(info
->Symbol
,
150 MCSymbolRefExpr::VK_COFF_IMGREL32
,
154 static void EmitUnwindInfo(MCStreamer
&streamer
, WinEH::FrameInfo
*info
) {
155 // If this UNWIND_INFO already has a symbol, it's already been emitted.
159 MCContext
&context
= streamer
.getContext();
160 MCSymbol
*Label
= context
.createTempSymbol();
162 streamer
.emitValueToAlignment(4);
163 streamer
.emitLabel(Label
);
164 info
->Symbol
= Label
;
166 // Upper 3 bits are the version number (currently 1).
167 uint8_t flags
= 0x01;
168 if (info
->ChainedParent
)
169 flags
|= Win64EH::UNW_ChainInfo
<< 3;
171 if (info
->HandlesUnwind
)
172 flags
|= Win64EH::UNW_TerminateHandler
<< 3;
173 if (info
->HandlesExceptions
)
174 flags
|= Win64EH::UNW_ExceptionHandler
<< 3;
176 streamer
.emitInt8(flags
);
179 EmitAbsDifference(streamer
, info
->PrologEnd
, info
->Begin
);
181 streamer
.emitInt8(0);
183 uint8_t numCodes
= CountOfUnwindCodes(info
->Instructions
);
184 streamer
.emitInt8(numCodes
);
187 if (info
->LastFrameInst
>= 0) {
188 WinEH::Instruction
&frameInst
= info
->Instructions
[info
->LastFrameInst
];
189 assert(frameInst
.Operation
== Win64EH::UOP_SetFPReg
);
190 frame
= (frameInst
.Register
& 0x0F) | (frameInst
.Offset
& 0xF0);
192 streamer
.emitInt8(frame
);
194 // Emit unwind instructions (in reverse order).
195 uint8_t numInst
= info
->Instructions
.size();
196 for (uint8_t c
= 0; c
< numInst
; ++c
) {
197 WinEH::Instruction inst
= info
->Instructions
.back();
198 info
->Instructions
.pop_back();
199 EmitUnwindCode(streamer
, info
->Begin
, inst
);
202 // For alignment purposes, the instruction array will always have an even
203 // number of entries, with the final entry potentially unused (in which case
204 // the array will be one longer than indicated by the count of unwind codes
207 streamer
.emitInt16(0);
210 if (flags
& (Win64EH::UNW_ChainInfo
<< 3))
211 EmitRuntimeFunction(streamer
, info
->ChainedParent
);
213 ((Win64EH::UNW_TerminateHandler
|Win64EH::UNW_ExceptionHandler
) << 3))
214 streamer
.emitValue(MCSymbolRefExpr::create(info
->ExceptionHandler
,
215 MCSymbolRefExpr::VK_COFF_IMGREL32
,
217 else if (numCodes
== 0) {
218 // The minimum size of an UNWIND_INFO struct is 8 bytes. If we're not
219 // a chained unwind info, if there is no handler, and if there are fewer
220 // than 2 slots used in the unwind code array, we have to pad to 8 bytes.
221 streamer
.emitInt32(0);
225 void llvm::Win64EH::UnwindEmitter::Emit(MCStreamer
&Streamer
) const {
226 // Emit the unwind info structs first.
227 for (const auto &CFI
: Streamer
.getWinFrameInfos()) {
228 MCSection
*XData
= Streamer
.getAssociatedXDataSection(CFI
->TextSection
);
229 Streamer
.SwitchSection(XData
);
230 ::EmitUnwindInfo(Streamer
, CFI
.get());
233 // Now emit RUNTIME_FUNCTION entries.
234 for (const auto &CFI
: Streamer
.getWinFrameInfos()) {
235 MCSection
*PData
= Streamer
.getAssociatedPDataSection(CFI
->TextSection
);
236 Streamer
.SwitchSection(PData
);
237 EmitRuntimeFunction(Streamer
, CFI
.get());
241 void llvm::Win64EH::UnwindEmitter::EmitUnwindInfo(MCStreamer
&Streamer
,
242 WinEH::FrameInfo
*info
,
243 bool HandlerData
) const {
244 // Switch sections (the static function above is meant to be called from
245 // here and from Emit().
246 MCSection
*XData
= Streamer
.getAssociatedXDataSection(info
->TextSection
);
247 Streamer
.SwitchSection(XData
);
249 ::EmitUnwindInfo(Streamer
, info
);
252 static int64_t GetAbsDifference(MCStreamer
&Streamer
, const MCSymbol
*LHS
,
253 const MCSymbol
*RHS
) {
254 MCContext
&Context
= Streamer
.getContext();
256 MCBinaryExpr::createSub(MCSymbolRefExpr::create(LHS
, Context
),
257 MCSymbolRefExpr::create(RHS
, Context
), Context
);
258 MCObjectStreamer
*OS
= (MCObjectStreamer
*)(&Streamer
);
259 // It should normally be possible to calculate the length of a function
260 // at this point, but it might not be possible in the presence of certain
261 // unusual constructs, like an inline asm with an alignment directive.
263 if (!Diff
->evaluateAsAbsolute(value
, OS
->getAssembler()))
264 report_fatal_error("Failed to evaluate function length in SEH unwind info");
268 static uint32_t ARM64CountOfUnwindCodes(ArrayRef
<WinEH::Instruction
> Insns
) {
270 for (const auto &I
: Insns
) {
271 switch (static_cast<Win64EH::UnwindOpcodes
>(I
.Operation
)) {
273 llvm_unreachable("Unsupported ARM64 unwind code");
274 case Win64EH::UOP_AllocSmall
:
277 case Win64EH::UOP_AllocMedium
:
280 case Win64EH::UOP_AllocLarge
:
283 case Win64EH::UOP_SaveR19R20X
:
286 case Win64EH::UOP_SaveFPLRX
:
289 case Win64EH::UOP_SaveFPLR
:
292 case Win64EH::UOP_SaveReg
:
295 case Win64EH::UOP_SaveRegP
:
298 case Win64EH::UOP_SaveRegPX
:
301 case Win64EH::UOP_SaveRegX
:
304 case Win64EH::UOP_SaveLRPair
:
307 case Win64EH::UOP_SaveFReg
:
310 case Win64EH::UOP_SaveFRegP
:
313 case Win64EH::UOP_SaveFRegX
:
316 case Win64EH::UOP_SaveFRegPX
:
319 case Win64EH::UOP_SetFP
:
322 case Win64EH::UOP_AddFP
:
325 case Win64EH::UOP_Nop
:
328 case Win64EH::UOP_End
:
331 case Win64EH::UOP_SaveNext
:
334 case Win64EH::UOP_TrapFrame
:
337 case Win64EH::UOP_PushMachFrame
:
340 case Win64EH::UOP_Context
:
343 case Win64EH::UOP_ClearUnwoundToCall
:
351 // Unwind opcode encodings and restrictions are documented at
352 // https://docs.microsoft.com/en-us/cpp/build/arm64-exception-handling
353 static void ARM64EmitUnwindCode(MCStreamer
&streamer
, const MCSymbol
*begin
,
354 WinEH::Instruction
&inst
) {
356 switch (static_cast<Win64EH::UnwindOpcodes
>(inst
.Operation
)) {
358 llvm_unreachable("Unsupported ARM64 unwind code");
359 case Win64EH::UOP_AllocSmall
:
360 b
= (inst
.Offset
>> 4) & 0x1F;
361 streamer
.emitInt8(b
);
363 case Win64EH::UOP_AllocMedium
: {
364 uint16_t hw
= (inst
.Offset
>> 4) & 0x7FF;
367 streamer
.emitInt8(b
);
369 streamer
.emitInt8(b
);
372 case Win64EH::UOP_AllocLarge
: {
375 streamer
.emitInt8(b
);
376 w
= inst
.Offset
>> 4;
377 b
= (w
& 0x00FF0000) >> 16;
378 streamer
.emitInt8(b
);
379 b
= (w
& 0x0000FF00) >> 8;
380 streamer
.emitInt8(b
);
382 streamer
.emitInt8(b
);
385 case Win64EH::UOP_SetFP
:
387 streamer
.emitInt8(b
);
389 case Win64EH::UOP_AddFP
:
391 streamer
.emitInt8(b
);
392 b
= (inst
.Offset
>> 3);
393 streamer
.emitInt8(b
);
395 case Win64EH::UOP_Nop
:
397 streamer
.emitInt8(b
);
399 case Win64EH::UOP_SaveR19R20X
:
401 b
|= (inst
.Offset
>> 3) & 0x1F;
402 streamer
.emitInt8(b
);
404 case Win64EH::UOP_SaveFPLRX
:
406 b
|= ((inst
.Offset
- 1) >> 3) & 0x3F;
407 streamer
.emitInt8(b
);
409 case Win64EH::UOP_SaveFPLR
:
411 b
|= (inst
.Offset
>> 3) & 0x3F;
412 streamer
.emitInt8(b
);
414 case Win64EH::UOP_SaveReg
:
415 assert(inst
.Register
>= 19 && "Saved reg must be >= 19");
416 reg
= inst
.Register
- 19;
417 b
= 0xD0 | ((reg
& 0xC) >> 2);
418 streamer
.emitInt8(b
);
419 b
= ((reg
& 0x3) << 6) | (inst
.Offset
>> 3);
420 streamer
.emitInt8(b
);
422 case Win64EH::UOP_SaveRegX
:
423 assert(inst
.Register
>= 19 && "Saved reg must be >= 19");
424 reg
= inst
.Register
- 19;
425 b
= 0xD4 | ((reg
& 0x8) >> 3);
426 streamer
.emitInt8(b
);
427 b
= ((reg
& 0x7) << 5) | ((inst
.Offset
>> 3) - 1);
428 streamer
.emitInt8(b
);
430 case Win64EH::UOP_SaveRegP
:
431 assert(inst
.Register
>= 19 && "Saved registers must be >= 19");
432 reg
= inst
.Register
- 19;
433 b
= 0xC8 | ((reg
& 0xC) >> 2);
434 streamer
.emitInt8(b
);
435 b
= ((reg
& 0x3) << 6) | (inst
.Offset
>> 3);
436 streamer
.emitInt8(b
);
438 case Win64EH::UOP_SaveRegPX
:
439 assert(inst
.Register
>= 19 && "Saved registers must be >= 19");
440 reg
= inst
.Register
- 19;
441 b
= 0xCC | ((reg
& 0xC) >> 2);
442 streamer
.emitInt8(b
);
443 b
= ((reg
& 0x3) << 6) | ((inst
.Offset
>> 3) - 1);
444 streamer
.emitInt8(b
);
446 case Win64EH::UOP_SaveLRPair
:
447 assert(inst
.Register
>= 19 && "Saved reg must be >= 19");
448 reg
= inst
.Register
- 19;
449 assert((reg
% 2) == 0 && "Saved reg must be 19+2*X");
451 b
= 0xD6 | ((reg
& 0x7) >> 2);
452 streamer
.emitInt8(b
);
453 b
= ((reg
& 0x3) << 6) | (inst
.Offset
>> 3);
454 streamer
.emitInt8(b
);
456 case Win64EH::UOP_SaveFReg
:
457 assert(inst
.Register
>= 8 && "Saved dreg must be >= 8");
458 reg
= inst
.Register
- 8;
459 b
= 0xDC | ((reg
& 0x4) >> 2);
460 streamer
.emitInt8(b
);
461 b
= ((reg
& 0x3) << 6) | (inst
.Offset
>> 3);
462 streamer
.emitInt8(b
);
464 case Win64EH::UOP_SaveFRegX
:
465 assert(inst
.Register
>= 8 && "Saved dreg must be >= 8");
466 reg
= inst
.Register
- 8;
468 streamer
.emitInt8(b
);
469 b
= ((reg
& 0x7) << 5) | ((inst
.Offset
>> 3) - 1);
470 streamer
.emitInt8(b
);
472 case Win64EH::UOP_SaveFRegP
:
473 assert(inst
.Register
>= 8 && "Saved dregs must be >= 8");
474 reg
= inst
.Register
- 8;
475 b
= 0xD8 | ((reg
& 0x4) >> 2);
476 streamer
.emitInt8(b
);
477 b
= ((reg
& 0x3) << 6) | (inst
.Offset
>> 3);
478 streamer
.emitInt8(b
);
480 case Win64EH::UOP_SaveFRegPX
:
481 assert(inst
.Register
>= 8 && "Saved dregs must be >= 8");
482 reg
= inst
.Register
- 8;
483 b
= 0xDA | ((reg
& 0x4) >> 2);
484 streamer
.emitInt8(b
);
485 b
= ((reg
& 0x3) << 6) | ((inst
.Offset
>> 3) - 1);
486 streamer
.emitInt8(b
);
488 case Win64EH::UOP_End
:
490 streamer
.emitInt8(b
);
492 case Win64EH::UOP_SaveNext
:
494 streamer
.emitInt8(b
);
496 case Win64EH::UOP_TrapFrame
:
498 streamer
.emitInt8(b
);
500 case Win64EH::UOP_PushMachFrame
:
502 streamer
.emitInt8(b
);
504 case Win64EH::UOP_Context
:
506 streamer
.emitInt8(b
);
508 case Win64EH::UOP_ClearUnwoundToCall
:
510 streamer
.emitInt8(b
);
515 // Returns the epilog symbol of an epilog with the exact same unwind code
516 // sequence, if it exists. Otherwise, returns nulltpr.
517 // EpilogInstrs - Unwind codes for the current epilog.
518 // Epilogs - Epilogs that potentialy match the current epilog.
520 FindMatchingEpilog(const std::vector
<WinEH::Instruction
>& EpilogInstrs
,
521 const std::vector
<MCSymbol
*>& Epilogs
,
522 const WinEH::FrameInfo
*info
) {
523 for (auto *EpilogStart
: Epilogs
) {
524 auto InstrsIter
= info
->EpilogMap
.find(EpilogStart
);
525 assert(InstrsIter
!= info
->EpilogMap
.end() &&
526 "Epilog not found in EpilogMap");
527 const auto &Instrs
= InstrsIter
->second
;
529 if (Instrs
.size() != EpilogInstrs
.size())
533 for (unsigned i
= 0; i
< Instrs
.size(); ++i
)
534 if (Instrs
[i
].Operation
!= EpilogInstrs
[i
].Operation
||
535 Instrs
[i
].Offset
!= EpilogInstrs
[i
].Offset
||
536 Instrs
[i
].Register
!= EpilogInstrs
[i
].Register
) {
547 static void simplifyOpcodes(std::vector
<WinEH::Instruction
> &Instructions
,
549 unsigned PrevOffset
= -1;
550 unsigned PrevRegister
= -1;
552 auto VisitInstruction
= [&](WinEH::Instruction
&Inst
) {
553 // Convert 2-byte opcodes into equivalent 1-byte ones.
554 if (Inst
.Operation
== Win64EH::UOP_SaveRegP
&& Inst
.Register
== 29) {
555 Inst
.Operation
= Win64EH::UOP_SaveFPLR
;
557 } else if (Inst
.Operation
== Win64EH::UOP_SaveRegPX
&&
558 Inst
.Register
== 29) {
559 Inst
.Operation
= Win64EH::UOP_SaveFPLRX
;
561 } else if (Inst
.Operation
== Win64EH::UOP_SaveRegPX
&&
562 Inst
.Register
== 19 && Inst
.Offset
<= 248) {
563 Inst
.Operation
= Win64EH::UOP_SaveR19R20X
;
565 } else if (Inst
.Operation
== Win64EH::UOP_AddFP
&& Inst
.Offset
== 0) {
566 Inst
.Operation
= Win64EH::UOP_SetFP
;
567 } else if (Inst
.Operation
== Win64EH::UOP_SaveRegP
&&
568 Inst
.Register
== PrevRegister
+ 2 &&
569 Inst
.Offset
== PrevOffset
+ 16) {
570 Inst
.Operation
= Win64EH::UOP_SaveNext
;
573 // Intentionally not creating UOP_SaveNext for float register pairs,
574 // as current versions of Windows (up to at least 20.04) is buggy
575 // regarding SaveNext for float pairs.
577 // Update info about the previous instruction, for detecting if
578 // the next one can be made a UOP_SaveNext
579 if (Inst
.Operation
== Win64EH::UOP_SaveR19R20X
) {
582 } else if (Inst
.Operation
== Win64EH::UOP_SaveRegPX
) {
584 PrevRegister
= Inst
.Register
;
585 } else if (Inst
.Operation
== Win64EH::UOP_SaveRegP
) {
586 PrevOffset
= Inst
.Offset
;
587 PrevRegister
= Inst
.Register
;
588 } else if (Inst
.Operation
== Win64EH::UOP_SaveNext
) {
597 // Iterate over instructions in a forward order (for prologues),
598 // backwards for epilogues (i.e. always reverse compared to how the
599 // opcodes are stored).
601 for (auto It
= Instructions
.rbegin(); It
!= Instructions
.rend(); It
++)
602 VisitInstruction(*It
);
604 for (WinEH::Instruction
&Inst
: Instructions
)
605 VisitInstruction(Inst
);
609 static int checkPackedEpilog(MCStreamer
&streamer
, WinEH::FrameInfo
*info
,
610 int PrologCodeBytes
) {
611 // Can only pack if there's one single epilog
612 if (info
->EpilogMap
.size() != 1)
615 const std::vector
<WinEH::Instruction
> &Epilog
=
616 info
->EpilogMap
.begin()->second
;
618 // Can pack if the epilog is a subset of the prolog but not vice versa
619 if (Epilog
.size() > info
->Instructions
.size())
622 // Check that the epilog actually is a perfect match for the end (backwrds)
624 for (int I
= Epilog
.size() - 1; I
>= 0; I
--) {
625 if (info
->Instructions
[I
] != Epilog
[Epilog
.size() - 1 - I
])
629 // Check that the epilog actually is at the very end of the function,
630 // otherwise it can't be packed.
631 uint32_t DistanceFromEnd
= (uint32_t)GetAbsDifference(
632 streamer
, info
->FuncletOrFuncEnd
, info
->EpilogMap
.begin()->first
);
633 if (DistanceFromEnd
/ 4 != Epilog
.size())
636 int Offset
= Epilog
.size() == info
->Instructions
.size()
638 : ARM64CountOfUnwindCodes(ArrayRef
<WinEH::Instruction
>(
639 &info
->Instructions
[Epilog
.size()],
640 info
->Instructions
.size() - Epilog
.size()));
642 // Check that the offset and prolog size fits in the first word; it's
643 // unclear whether the epilog count in the extension word can be taken
644 // as packed epilog offset.
645 if (Offset
> 31 || PrologCodeBytes
> 124)
648 info
->EpilogMap
.clear();
652 static bool tryPackedUnwind(WinEH::FrameInfo
*info
, uint32_t FuncLength
,
653 int PackedEpilogOffset
) {
654 if (PackedEpilogOffset
== 0) {
655 // Fully symmetric prolog and epilog, should be ok for packed format.
656 // For CR=3, the corresponding synthesized epilog actually lacks the
657 // SetFP opcode, but unwinding should work just fine despite that
658 // (if at the SetFP opcode, the unwinder considers it as part of the
659 // function body and just unwinds the full prolog instead).
660 } else if (PackedEpilogOffset
== 1) {
661 // One single case of differences between prolog and epilog is allowed:
662 // The epilog can lack a single SetFP that is the last opcode in the
663 // prolog, for the CR=3 case.
664 if (info
->Instructions
.back().Operation
!= Win64EH::UOP_SetFP
)
667 // Too much difference between prolog and epilog.
670 unsigned RegI
= 0, RegF
= 0;
671 int Predecrement
= 0;
682 bool StandaloneLR
= false, FPLRPair
= false;
685 // Iterate over the prolog and check that all opcodes exactly match
686 // the canonical order and form. A more lax check could verify that
687 // all saved registers are in the expected locations, but not enforce
688 // the order - that would work fine when unwinding from within
689 // functions, but not be exactly right if unwinding happens within
691 for (const WinEH::Instruction
&Inst
: info
->Instructions
) {
692 switch (Inst
.Operation
) {
693 case Win64EH::UOP_End
:
694 if (Location
!= Start
)
698 case Win64EH::UOP_SaveR19R20X
:
699 if (Location
!= Start2
)
701 Predecrement
= Inst
.Offset
;
705 case Win64EH::UOP_SaveRegX
:
706 if (Location
!= Start2
)
708 Predecrement
= Inst
.Offset
;
709 if (Inst
.Register
== 19)
711 else if (Inst
.Register
== 30)
715 // Odd register; can't be any further int registers.
716 Location
= FloatRegs
;
718 case Win64EH::UOP_SaveRegPX
:
719 // Can't have this in a canonical prologue. Either this has been
720 // canonicalized into SaveR19R20X or SaveFPLRX, or it's an unsupported
722 // It can't be canonicalized into SaveR19R20X if the offset is
723 // larger than 248 bytes, but even with the maximum case with
724 // RegI=10/RegF=8/CR=1/H=1, we end up with SavSZ = 216, which should
725 // fit into SaveR19R20X.
726 // The unwinding opcodes can't describe the otherwise seemingly valid
727 // case for RegI=1 CR=1, that would start with a
728 // "stp x19, lr, [sp, #-...]!" as that fits neither SaveRegPX nor
731 case Win64EH::UOP_SaveRegP
:
732 if (Location
!= IntRegs
|| Inst
.Offset
!= 8 * RegI
||
733 Inst
.Register
!= 19 + RegI
)
737 case Win64EH::UOP_SaveReg
:
738 if (Location
!= IntRegs
|| Inst
.Offset
!= 8 * RegI
)
740 if (Inst
.Register
== 19 + RegI
)
742 else if (Inst
.Register
== 30)
746 // Odd register; can't be any further int registers.
747 Location
= FloatRegs
;
749 case Win64EH::UOP_SaveLRPair
:
750 if (Location
!= IntRegs
|| Inst
.Offset
!= 8 * RegI
||
751 Inst
.Register
!= 19 + RegI
)
755 Location
= FloatRegs
;
757 case Win64EH::UOP_SaveFRegX
:
758 // Packed unwind can't handle prologs that only save one single
761 case Win64EH::UOP_SaveFReg
:
762 if (Location
!= FloatRegs
|| RegF
== 0 || Inst
.Register
!= 8 + RegF
||
763 Inst
.Offset
!= 8 * (RegI
+ (StandaloneLR
? 1 : 0) + RegF
))
766 Location
= InputArgs
;
768 case Win64EH::UOP_SaveFRegPX
:
769 if (Location
!= Start2
|| Inst
.Register
!= 8)
771 Predecrement
= Inst
.Offset
;
773 Location
= FloatRegs
;
775 case Win64EH::UOP_SaveFRegP
:
776 if ((Location
!= IntRegs
&& Location
!= FloatRegs
) ||
777 Inst
.Register
!= 8 + RegF
||
778 Inst
.Offset
!= 8 * (RegI
+ (StandaloneLR
? 1 : 0) + RegF
))
781 Location
= FloatRegs
;
783 case Win64EH::UOP_SaveNext
:
784 if (Location
== IntRegs
)
786 else if (Location
== FloatRegs
)
791 case Win64EH::UOP_Nop
:
792 if (Location
!= IntRegs
&& Location
!= FloatRegs
&& Location
!= InputArgs
)
794 Location
= InputArgs
;
797 case Win64EH::UOP_AllocSmall
:
798 case Win64EH::UOP_AllocMedium
:
799 if (Location
!= Start2
&& Location
!= IntRegs
&& Location
!= FloatRegs
&&
800 Location
!= InputArgs
&& Location
!= StackAdjust
)
802 // Can have either a single decrement, or a pair of decrements with
803 // 4080 and another decrement.
804 if (StackOffset
== 0)
805 StackOffset
= Inst
.Offset
;
806 else if (StackOffset
!= 4080)
809 StackOffset
+= Inst
.Offset
;
810 Location
= StackAdjust
;
812 case Win64EH::UOP_SaveFPLRX
:
813 // Not allowing FPLRX after StackAdjust; if a StackAdjust is used, it
814 // should be followed by a FPLR instead.
815 if (Location
!= Start2
&& Location
!= IntRegs
&& Location
!= FloatRegs
&&
816 Location
!= InputArgs
)
818 StackOffset
= Inst
.Offset
;
819 Location
= FrameRecord
;
822 case Win64EH::UOP_SaveFPLR
:
823 // This can only follow after a StackAdjust
824 if (Location
!= StackAdjust
|| Inst
.Offset
!= 0)
826 Location
= FrameRecord
;
829 case Win64EH::UOP_SetFP
:
830 if (Location
!= FrameRecord
)
836 if (RegI
> 10 || RegF
> 8)
838 if (StandaloneLR
&& FPLRPair
)
840 if (FPLRPair
&& Location
!= End
)
842 if (Nops
!= 0 && Nops
!= 4)
845 int IntSZ
= 8 * RegI
;
848 int FpSZ
= 8 * RegF
; // RegF not yet decremented
849 int SavSZ
= (IntSZ
+ FpSZ
+ 8 * 8 * H
+ 0xF) & ~0xF;
850 if (Predecrement
!= SavSZ
)
852 if (FPLRPair
&& StackOffset
< 16)
854 if (StackOffset
% 16)
856 uint32_t FrameSize
= (StackOffset
+ SavSZ
) / 16;
857 if (FrameSize
> 0x1FF)
859 assert(RegF
!= 1 && "One single float reg not allowed");
861 RegF
--; // Convert from actual number of registers, to value stored
862 assert(FuncLength
<= 0x7FF && "FuncLength should have been checked earlier");
863 int Flag
= 0x01; // Function segments not supported yet
864 int CR
= FPLRPair
? 3 : StandaloneLR
? 1 : 0;
865 info
->PackedInfo
|= Flag
<< 0;
866 info
->PackedInfo
|= (FuncLength
& 0x7FF) << 2;
867 info
->PackedInfo
|= (RegF
& 0x7) << 13;
868 info
->PackedInfo
|= (RegI
& 0xF) << 16;
869 info
->PackedInfo
|= (H
& 0x1) << 20;
870 info
->PackedInfo
|= (CR
& 0x3) << 21;
871 info
->PackedInfo
|= (FrameSize
& 0x1FF) << 23;
875 // Populate the .xdata section. The format of .xdata on ARM64 is documented at
876 // https://docs.microsoft.com/en-us/cpp/build/arm64-exception-handling
877 static void ARM64EmitUnwindInfo(MCStreamer
&streamer
, WinEH::FrameInfo
*info
,
878 bool TryPacked
= true) {
879 // If this UNWIND_INFO already has a symbol, it's already been emitted.
882 // If there's no unwind info here (not even a terminating UOP_End), the
883 // unwind info is considered bogus and skipped. If this was done in
884 // response to an explicit .seh_handlerdata, the associated trailing
885 // handler data is left orphaned in the xdata section.
887 info
->EmitAttempted
= true;
890 if (info
->EmitAttempted
) {
891 // If we tried to emit unwind info before (due to an explicit
892 // .seh_handlerdata directive), but skipped it (because there was no
893 // valid information to emit at the time), and it later got valid unwind
894 // opcodes, we can't emit it here, because the trailing handler data
895 // was already emitted elsewhere in the xdata section.
896 streamer
.getContext().reportError(
897 SMLoc(), "Earlier .seh_handlerdata for " + info
->Function
->getName() +
898 " skipped due to no unwind info at the time "
899 "(.seh_handlerdata too early?), but the function later "
900 "did get unwind info that can't be emitted");
904 simplifyOpcodes(info
->Instructions
, false);
905 for (auto &I
: info
->EpilogMap
)
906 simplifyOpcodes(I
.second
, true);
908 MCContext
&context
= streamer
.getContext();
909 MCSymbol
*Label
= context
.createTempSymbol();
911 streamer
.emitValueToAlignment(4);
912 streamer
.emitLabel(Label
);
913 info
->Symbol
= Label
;
915 int64_t RawFuncLength
;
916 if (!info
->FuncletOrFuncEnd
) {
917 report_fatal_error("FuncletOrFuncEnd not set");
919 // FIXME: GetAbsDifference tries to compute the length of the function
920 // immediately, before the whole file is emitted, but in general
921 // that's impossible: the size in bytes of certain assembler directives
922 // like .align and .fill is not known until the whole file is parsed and
923 // relaxations are applied. Currently, GetAbsDifference fails with a fatal
924 // error in that case. (We mostly don't hit this because inline assembly
925 // specifying those directives is rare, and we don't normally try to
926 // align loops on AArch64.)
928 // There are two potential approaches to delaying the computation. One,
929 // we could emit something like ".word (endfunc-beginfunc)/4+0x10800000",
930 // as long as we have some conservative estimate we could use to prove
931 // that we don't need to split the unwind data. Emitting the constant
932 // is straightforward, but there's no existing code for estimating the
933 // size of the function.
935 // The other approach would be to use a dedicated, relaxable fragment,
936 // which could grow to accommodate splitting the unwind data if
937 // necessary. This is more straightforward, since it automatically works
938 // without any new infrastructure, and it's consistent with how we handle
939 // relaxation in other contexts. But it would require some refactoring
940 // to move parts of the pdata/xdata emission into the implementation of
941 // a fragment. We could probably continue to encode the unwind codes
942 // here, but we'd have to emit the pdata, the xdata header, and the
943 // epilogue scopes later, since they depend on whether the we need to
944 // split the unwind data.
945 RawFuncLength
= GetAbsDifference(streamer
, info
->FuncletOrFuncEnd
,
948 if (RawFuncLength
> 0xFFFFF)
949 report_fatal_error("SEH unwind data splitting not yet implemented");
950 uint32_t FuncLength
= (uint32_t)RawFuncLength
/ 4;
951 uint32_t PrologCodeBytes
= ARM64CountOfUnwindCodes(info
->Instructions
);
952 uint32_t TotalCodeBytes
= PrologCodeBytes
;
954 int PackedEpilogOffset
= checkPackedEpilog(streamer
, info
, PrologCodeBytes
);
956 if (PackedEpilogOffset
>= 0 && !info
->HandlesExceptions
&&
957 FuncLength
<= 0x7ff && TryPacked
) {
958 // Matching prolog/epilog and no exception handlers; check if the
959 // prolog matches the patterns that can be described by the packed
962 // info->Symbol was already set even if we didn't actually write any
963 // unwind info there. Keep using that as indicator that this unwind
964 // info has been generated already.
966 if (tryPackedUnwind(info
, FuncLength
, PackedEpilogOffset
))
971 MapVector
<MCSymbol
*, uint32_t> EpilogInfo
;
972 // Epilogs processed so far.
973 std::vector
<MCSymbol
*> AddedEpilogs
;
975 for (auto &I
: info
->EpilogMap
) {
976 MCSymbol
*EpilogStart
= I
.first
;
977 auto &EpilogInstrs
= I
.second
;
978 uint32_t CodeBytes
= ARM64CountOfUnwindCodes(EpilogInstrs
);
980 MCSymbol
* MatchingEpilog
=
981 FindMatchingEpilog(EpilogInstrs
, AddedEpilogs
, info
);
982 if (MatchingEpilog
) {
983 assert(EpilogInfo
.find(MatchingEpilog
) != EpilogInfo
.end() &&
984 "Duplicate epilog not found");
985 EpilogInfo
[EpilogStart
] = EpilogInfo
.lookup(MatchingEpilog
);
986 // Clear the unwind codes in the EpilogMap, so that they don't get output
987 // in the logic below.
988 EpilogInstrs
.clear();
990 EpilogInfo
[EpilogStart
] = TotalCodeBytes
;
991 TotalCodeBytes
+= CodeBytes
;
992 AddedEpilogs
.push_back(EpilogStart
);
996 // Code Words, Epilog count, E, X, Vers, Function Length
998 uint32_t CodeWords
= TotalCodeBytes
/ 4;
999 uint32_t CodeWordsMod
= TotalCodeBytes
% 4;
1002 uint32_t EpilogCount
=
1003 PackedEpilogOffset
>= 0 ? PackedEpilogOffset
: info
->EpilogMap
.size();
1004 bool ExtensionWord
= EpilogCount
> 31 || TotalCodeBytes
> 124;
1005 if (!ExtensionWord
) {
1006 row1
|= (EpilogCount
& 0x1F) << 22;
1007 row1
|= (CodeWords
& 0x1F) << 27;
1009 if (info
->HandlesExceptions
) // X
1011 if (PackedEpilogOffset
>= 0) // E
1013 row1
|= FuncLength
& 0x3FFFF;
1014 streamer
.emitInt32(row1
);
1016 // Extended Code Words, Extended Epilog Count
1017 if (ExtensionWord
) {
1018 // FIXME: We should be able to split unwind info into multiple sections.
1019 // FIXME: We should share epilog codes across epilogs, where possible,
1020 // which would make this issue show up less frequently.
1021 if (CodeWords
> 0xFF || EpilogCount
> 0xFFFF)
1022 report_fatal_error("SEH unwind data splitting not yet implemented");
1023 uint32_t row2
= 0x0;
1024 row2
|= (CodeWords
& 0xFF) << 16;
1025 row2
|= (EpilogCount
& 0xFFFF);
1026 streamer
.emitInt32(row2
);
1029 // Epilog Start Index, Epilog Start Offset
1030 for (auto &I
: EpilogInfo
) {
1031 MCSymbol
*EpilogStart
= I
.first
;
1032 uint32_t EpilogIndex
= I
.second
;
1033 uint32_t EpilogOffset
=
1034 (uint32_t)GetAbsDifference(streamer
, EpilogStart
, info
->Begin
);
1037 uint32_t row3
= EpilogOffset
;
1038 row3
|= (EpilogIndex
& 0x3FF) << 22;
1039 streamer
.emitInt32(row3
);
1042 // Emit prolog unwind instructions (in reverse order).
1043 uint8_t numInst
= info
->Instructions
.size();
1044 for (uint8_t c
= 0; c
< numInst
; ++c
) {
1045 WinEH::Instruction inst
= info
->Instructions
.back();
1046 info
->Instructions
.pop_back();
1047 ARM64EmitUnwindCode(streamer
, info
->Begin
, inst
);
1050 // Emit epilog unwind instructions
1051 for (auto &I
: info
->EpilogMap
) {
1052 auto &EpilogInstrs
= I
.second
;
1053 for (uint32_t i
= 0; i
< EpilogInstrs
.size(); i
++) {
1054 WinEH::Instruction inst
= EpilogInstrs
[i
];
1055 ARM64EmitUnwindCode(streamer
, info
->Begin
, inst
);
1059 int32_t BytesMod
= CodeWords
* 4 - TotalCodeBytes
;
1060 assert(BytesMod
>= 0);
1061 for (int i
= 0; i
< BytesMod
; i
++)
1062 streamer
.emitInt8(0xE3);
1064 if (info
->HandlesExceptions
)
1066 MCSymbolRefExpr::create(info
->ExceptionHandler
,
1067 MCSymbolRefExpr::VK_COFF_IMGREL32
, context
),
1071 static void ARM64EmitRuntimeFunction(MCStreamer
&streamer
,
1072 const WinEH::FrameInfo
*info
) {
1073 MCContext
&context
= streamer
.getContext();
1075 streamer
.emitValueToAlignment(4);
1076 EmitSymbolRefWithOfs(streamer
, info
->Function
, info
->Begin
);
1077 if (info
->PackedInfo
)
1078 streamer
.emitInt32(info
->PackedInfo
);
1081 MCSymbolRefExpr::create(info
->Symbol
, MCSymbolRefExpr::VK_COFF_IMGREL32
,
1086 void llvm::Win64EH::ARM64UnwindEmitter::Emit(MCStreamer
&Streamer
) const {
1087 // Emit the unwind info structs first.
1088 for (const auto &CFI
: Streamer
.getWinFrameInfos()) {
1089 WinEH::FrameInfo
*Info
= CFI
.get();
1092 MCSection
*XData
= Streamer
.getAssociatedXDataSection(CFI
->TextSection
);
1093 Streamer
.SwitchSection(XData
);
1094 ARM64EmitUnwindInfo(Streamer
, Info
);
1097 // Now emit RUNTIME_FUNCTION entries.
1098 for (const auto &CFI
: Streamer
.getWinFrameInfos()) {
1099 WinEH::FrameInfo
*Info
= CFI
.get();
1100 // ARM64EmitUnwindInfo above clears the info struct, so we can't check
1101 // empty here. But if a Symbol is set, we should create the corresponding
1105 MCSection
*PData
= Streamer
.getAssociatedPDataSection(CFI
->TextSection
);
1106 Streamer
.SwitchSection(PData
);
1107 ARM64EmitRuntimeFunction(Streamer
, Info
);
1111 void llvm::Win64EH::ARM64UnwindEmitter::EmitUnwindInfo(MCStreamer
&Streamer
,
1112 WinEH::FrameInfo
*info
,
1113 bool HandlerData
) const {
1114 // Called if there's an .seh_handlerdata directive before the end of the
1115 // function. This forces writing the xdata record already here - and
1116 // in this case, the function isn't actually ended already, but the xdata
1117 // record needs to know the function length. In these cases, if the funclet
1118 // end hasn't been marked yet, the xdata function length won't cover the
1119 // whole function, only up to this point.
1120 if (!info
->FuncletOrFuncEnd
) {
1121 Streamer
.SwitchSection(info
->TextSection
);
1122 info
->FuncletOrFuncEnd
= Streamer
.emitCFILabel();
1124 // Switch sections (the static function above is meant to be called from
1125 // here and from Emit().
1126 MCSection
*XData
= Streamer
.getAssociatedXDataSection(info
->TextSection
);
1127 Streamer
.SwitchSection(XData
);
1128 ARM64EmitUnwindInfo(Streamer
, info
, /* TryPacked = */ !HandlerData
);