1 //=== WebAssemblyLateEHPrepare.cpp - WebAssembly Exception Preparation -===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// \brief Does various transformations for exception handling.
12 //===----------------------------------------------------------------------===//
14 #include "MCTargetDesc/WebAssemblyMCTargetDesc.h"
15 #include "WebAssembly.h"
16 #include "WebAssemblySubtarget.h"
17 #include "WebAssemblyUtilities.h"
18 #include "llvm/ADT/SmallPtrSet.h"
19 #include "llvm/CodeGen/MachineFunctionPass.h"
20 #include "llvm/CodeGen/MachineInstrBuilder.h"
21 #include "llvm/CodeGen/WasmEHFuncInfo.h"
22 #include "llvm/MC/MCAsmInfo.h"
23 #include "llvm/Support/Debug.h"
24 #include "llvm/Target/TargetMachine.h"
27 #define DEBUG_TYPE "wasm-late-eh-prepare"
30 class WebAssemblyLateEHPrepare final
: public MachineFunctionPass
{
31 StringRef
getPassName() const override
{
32 return "WebAssembly Late Prepare Exception";
35 bool runOnMachineFunction(MachineFunction
&MF
) override
;
36 bool removeUnreachableEHPads(MachineFunction
&MF
);
37 void recordCatchRetBBs(MachineFunction
&MF
);
38 bool hoistCatches(MachineFunction
&MF
);
39 bool addCatchAlls(MachineFunction
&MF
);
40 bool addCatchRefsAndThrowRefs(MachineFunction
&MF
);
41 bool replaceFuncletReturns(MachineFunction
&MF
);
42 bool removeUnnecessaryUnreachables(MachineFunction
&MF
);
43 bool restoreStackPointer(MachineFunction
&MF
);
45 MachineBasicBlock
*getMatchingEHPad(MachineInstr
*MI
);
46 SmallPtrSet
<MachineBasicBlock
*, 8> CatchRetBBs
;
49 static char ID
; // Pass identification, replacement for typeid
50 WebAssemblyLateEHPrepare() : MachineFunctionPass(ID
) {}
52 } // end anonymous namespace
54 char WebAssemblyLateEHPrepare::ID
= 0;
55 INITIALIZE_PASS(WebAssemblyLateEHPrepare
, DEBUG_TYPE
,
56 "WebAssembly Late Exception Preparation", false, false)
58 FunctionPass
*llvm::createWebAssemblyLateEHPrepare() {
59 return new WebAssemblyLateEHPrepare();
62 // Returns the nearest EH pad that dominates this instruction. This does not use
63 // dominator analysis; it just does BFS on its predecessors until arriving at an
64 // EH pad. This assumes valid EH scopes so the first EH pad it arrives in all
65 // possible search paths should be the same.
66 // Returns nullptr in case it does not find any EH pad in the search, or finds
67 // multiple different EH pads.
69 WebAssemblyLateEHPrepare::getMatchingEHPad(MachineInstr
*MI
) {
70 MachineFunction
*MF
= MI
->getParent()->getParent();
71 SmallVector
<MachineBasicBlock
*, 2> WL
;
72 SmallPtrSet
<MachineBasicBlock
*, 2> Visited
;
73 WL
.push_back(MI
->getParent());
74 MachineBasicBlock
*EHPad
= nullptr;
76 MachineBasicBlock
*MBB
= WL
.pop_back_val();
77 if (!Visited
.insert(MBB
).second
)
80 if (EHPad
&& EHPad
!= MBB
)
85 if (MBB
== &MF
->front())
87 for (auto *Pred
: MBB
->predecessors())
88 if (!CatchRetBBs
.count(Pred
)) // We don't go into child scopes
94 // Erase the specified BBs if the BB does not have any remaining predecessors,
95 // and also all its dead children.
96 template <typename Container
>
97 static void eraseDeadBBsAndChildren(const Container
&MBBs
) {
98 SmallVector
<MachineBasicBlock
*, 8> WL(MBBs
.begin(), MBBs
.end());
99 SmallPtrSet
<MachineBasicBlock
*, 8> Deleted
;
100 while (!WL
.empty()) {
101 MachineBasicBlock
*MBB
= WL
.pop_back_val();
102 if (Deleted
.count(MBB
) || !MBB
->pred_empty())
104 SmallVector
<MachineBasicBlock
*, 4> Succs(MBB
->successors());
105 WL
.append(MBB
->succ_begin(), MBB
->succ_end());
106 for (auto *Succ
: Succs
)
107 MBB
->removeSuccessor(Succ
);
108 // To prevent deleting the same BB multiple times, which can happen when
109 // 'MBBs' contain both a parent and a child
111 MBB
->eraseFromParent();
115 bool WebAssemblyLateEHPrepare::runOnMachineFunction(MachineFunction
&MF
) {
116 LLVM_DEBUG(dbgs() << "********** Late EH Prepare **********\n"
117 "********** Function: "
118 << MF
.getName() << '\n');
120 if (MF
.getTarget().getMCAsmInfo()->getExceptionHandlingType() !=
121 ExceptionHandling::Wasm
)
124 bool Changed
= false;
125 if (MF
.getFunction().hasPersonalityFn()) {
126 Changed
|= removeUnreachableEHPads(MF
);
127 recordCatchRetBBs(MF
);
128 Changed
|= hoistCatches(MF
);
129 Changed
|= addCatchAlls(MF
);
130 Changed
|= replaceFuncletReturns(MF
);
131 if (WebAssembly::WasmEnableExnref
)
132 Changed
|= addCatchRefsAndThrowRefs(MF
);
134 Changed
|= removeUnnecessaryUnreachables(MF
);
135 if (MF
.getFunction().hasPersonalityFn())
136 Changed
|= restoreStackPointer(MF
);
140 // Remove unreachable EH pads and its children. If they remain, CFG
141 // stackification can be tricky.
142 bool WebAssemblyLateEHPrepare::removeUnreachableEHPads(MachineFunction
&MF
) {
143 SmallVector
<MachineBasicBlock
*, 4> ToDelete
;
145 if (MBB
.isEHPad() && MBB
.pred_empty())
146 ToDelete
.push_back(&MBB
);
147 eraseDeadBBsAndChildren(ToDelete
);
148 return !ToDelete
.empty();
151 // Record which BB ends with catchret instruction, because this will be replaced
152 // with 'br's later. This set of catchret BBs is necessary in 'getMatchingEHPad'
154 void WebAssemblyLateEHPrepare::recordCatchRetBBs(MachineFunction
&MF
) {
156 for (auto &MBB
: MF
) {
157 auto Pos
= MBB
.getFirstTerminator();
158 if (Pos
== MBB
.end())
160 MachineInstr
*TI
= &*Pos
;
161 if (TI
->getOpcode() == WebAssembly::CATCHRET
)
162 CatchRetBBs
.insert(&MBB
);
166 // Hoist catch instructions to the beginning of their matching EH pad BBs in
168 // (1) catch instruction is not the first instruction in EH pad.
170 // some_other_instruction
173 // (2) catch instruction is in a non-EH pad BB. For example,
178 bool WebAssemblyLateEHPrepare::hoistCatches(MachineFunction
&MF
) {
179 bool Changed
= false;
180 SmallVector
<MachineInstr
*, 16> Catches
;
183 if (WebAssembly::isCatch(MI
.getOpcode()))
184 Catches
.push_back(&MI
);
186 for (auto *Catch
: Catches
) {
187 MachineBasicBlock
*EHPad
= getMatchingEHPad(Catch
);
188 assert(EHPad
&& "No matching EH pad for catch");
189 auto InsertPos
= EHPad
->begin();
190 // Skip EH_LABELs in the beginning of an EH pad if present. We don't use
191 // these labels at the moment, but other targets also seem to have an
192 // EH_LABEL instruction in the beginning of an EH pad.
193 while (InsertPos
!= EHPad
->end() && InsertPos
->isEHLabel())
195 if (InsertPos
== Catch
)
198 EHPad
->insert(InsertPos
, Catch
->removeFromParent());
203 // Add catch_all to beginning of cleanup pads.
204 bool WebAssemblyLateEHPrepare::addCatchAlls(MachineFunction
&MF
) {
205 bool Changed
= false;
206 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
208 for (auto &MBB
: MF
) {
211 auto InsertPos
= MBB
.begin();
212 // Skip EH_LABELs in the beginning of an EH pad if present.
213 while (InsertPos
!= MBB
.end() && InsertPos
->isEHLabel())
215 // This runs after hoistCatches(), so we assume that if there is a catch,
216 // that should be the first non-EH-label instruction in an EH pad.
217 if (InsertPos
== MBB
.end() ||
218 !WebAssembly::isCatch(InsertPos
->getOpcode())) {
220 unsigned CatchAllOpcode
= WebAssembly::WasmEnableExnref
221 ? WebAssembly::CATCH_ALL
222 : WebAssembly::CATCH_ALL_LEGACY
;
223 BuildMI(MBB
, InsertPos
,
224 InsertPos
== MBB
.end() ? DebugLoc() : InsertPos
->getDebugLoc(),
225 TII
.get(CatchAllOpcode
));
231 // Replace pseudo-instructions catchret and cleanupret with br and rethrow
233 bool WebAssemblyLateEHPrepare::replaceFuncletReturns(MachineFunction
&MF
) {
234 bool Changed
= false;
235 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
237 for (auto &MBB
: MF
) {
238 auto Pos
= MBB
.getFirstTerminator();
239 if (Pos
== MBB
.end())
241 MachineInstr
*TI
= &*Pos
;
243 switch (TI
->getOpcode()) {
244 case WebAssembly::CATCHRET
: {
245 // Replace a catchret with a branch
246 MachineBasicBlock
*TBB
= TI
->getOperand(0).getMBB();
247 if (!MBB
.isLayoutSuccessor(TBB
))
248 BuildMI(MBB
, TI
, TI
->getDebugLoc(), TII
.get(WebAssembly::BR
))
250 TI
->eraseFromParent();
254 case WebAssembly::RETHROW
:
255 // These RETHROWs here were lowered from llvm.wasm.rethrow() intrinsics,
256 // generated in Clang for when an exception is not caught by the given
257 // type (e.g. catch (int)).
259 // RETHROW's BB argument is the EH pad where the exception to rethrow has
260 // been caught. (Until this point, RETHROW has just a '0' as a placeholder
261 // argument.) For these llvm.wasm.rethrow()s, we can safely assume the
262 // exception comes from the nearest dominating EH pad, because catch.start
263 // EH pad is structured like this:
267 // %matches = compare ehselector with typeid
268 // br i1 %matches, label %catch, label %rethrow
271 // ;; rethrows the exception caught in 'catch.start'
272 // call @llvm.wasm.rethrow()
273 TI
->removeOperand(0);
274 TI
->addOperand(MachineOperand::CreateMBB(getMatchingEHPad(TI
)));
277 case WebAssembly::CLEANUPRET
: {
278 // CLEANUPRETs have the EH pad BB the exception to rethrow has been caught
279 // as an argument. Use it and change the instruction opcode to 'RETHROW'
280 // to make rethrowing instructions consistent.
282 // This is because we cannot safely assume that it is always the nearest
283 // dominating EH pad, in case there are code transformations such as
285 BuildMI(MBB
, TI
, TI
->getDebugLoc(), TII
.get(WebAssembly::RETHROW
))
286 .addMBB(TI
->getOperand(0).getMBB());
287 TI
->eraseFromParent();
296 // Add CATCH_REF and CATCH_ALL_REF pseudo instructions to EH pads, and convert
297 // RETHROWs to THROW_REFs.
298 bool WebAssemblyLateEHPrepare::addCatchRefsAndThrowRefs(MachineFunction
&MF
) {
299 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
300 auto &MRI
= MF
.getRegInfo();
301 DenseMap
<MachineBasicBlock
*, SmallVector
<MachineInstr
*, 2>> EHPadToRethrows
;
303 // Create a map of <EH pad, a vector of RETHROWs rethrowing its exception>
306 if (MI
.getOpcode() == WebAssembly::RETHROW
)
307 EHPadToRethrows
[MI
.getOperand(0).getMBB()].push_back(&MI
);
308 if (EHPadToRethrows
.empty())
311 // Convert CATCH into CATCH_REF and CATCH_ALL into CATCH_ALL_REF, when the
312 // caught exception is rethrown. And convert RETHROWs to THROW_REFs.
313 for (auto &[EHPad
, Rethrows
] : EHPadToRethrows
) {
314 auto *Catch
= WebAssembly::findCatch(EHPad
);
315 auto *InsertPos
= Catch
->getIterator()->getNextNode();
316 auto ExnReg
= MRI
.createVirtualRegister(&WebAssembly::EXNREFRegClass
);
317 if (Catch
->getOpcode() == WebAssembly::CATCH
) {
318 MachineInstrBuilder MIB
= BuildMI(*EHPad
, InsertPos
, Catch
->getDebugLoc(),
319 TII
.get(WebAssembly::CATCH_REF
));
320 // Copy defs (= extracted values) from the old CATCH to the new CATCH_REF
321 for (const auto &Def
: Catch
->defs())
322 MIB
.addDef(Def
.getReg());
323 MIB
.addDef(ExnReg
); // Attach the exnref def after extracted values
324 // Copy the tag symbol (The only use operand a CATCH can have is the tag
326 for (const auto &Use
: Catch
->uses()) {
327 MIB
.addExternalSymbol(Use
.getSymbolName());
330 } else if (Catch
->getOpcode() == WebAssembly::CATCH_ALL
) {
331 BuildMI(*EHPad
, InsertPos
, Catch
->getDebugLoc(),
332 TII
.get(WebAssembly::CATCH_ALL_REF
))
337 Catch
->eraseFromParent();
339 for (auto *Rethrow
: Rethrows
) {
340 auto InsertPos
= std::next(Rethrow
->getIterator());
341 BuildMI(*Rethrow
->getParent(), InsertPos
, Rethrow
->getDebugLoc(),
342 TII
.get(WebAssembly::THROW_REF
))
344 Rethrow
->eraseFromParent();
351 // Remove unnecessary unreachables after a throw/rethrow/throw_ref.
352 bool WebAssemblyLateEHPrepare::removeUnnecessaryUnreachables(
353 MachineFunction
&MF
) {
354 bool Changed
= false;
355 for (auto &MBB
: MF
) {
356 for (auto &MI
: MBB
) {
357 if (MI
.getOpcode() != WebAssembly::THROW
&&
358 MI
.getOpcode() != WebAssembly::RETHROW
&&
359 MI
.getOpcode() != WebAssembly::THROW_REF
)
363 // The instruction after the throw should be an unreachable or a branch to
364 // another BB that should eventually lead to an unreachable. Delete it
365 // because throw itself is a terminator, and also delete successors if
367 MBB
.erase(std::next(MI
.getIterator()), MBB
.end());
368 SmallVector
<MachineBasicBlock
*, 8> Succs(MBB
.successors());
369 for (auto *Succ
: Succs
)
370 if (!Succ
->isEHPad())
371 MBB
.removeSuccessor(Succ
);
372 eraseDeadBBsAndChildren(Succs
);
379 // After the stack is unwound due to a thrown exception, the __stack_pointer
380 // global can point to an invalid address. This inserts instructions that
381 // restore __stack_pointer global.
382 bool WebAssemblyLateEHPrepare::restoreStackPointer(MachineFunction
&MF
) {
383 const auto *FrameLowering
= static_cast<const WebAssemblyFrameLowering
*>(
384 MF
.getSubtarget().getFrameLowering());
385 if (!FrameLowering
->needsPrologForEH(MF
))
387 bool Changed
= false;
389 for (auto &MBB
: MF
) {
394 // Insert __stack_pointer restoring instructions at the beginning of each EH
395 // pad, after the catch instruction. Here it is safe to assume that SP32
396 // holds the latest value of __stack_pointer, because the only exception for
397 // this case is when a function uses the red zone, but that only happens
398 // with leaf functions, and we don't restore __stack_pointer in leaf
400 auto InsertPos
= MBB
.begin();
401 // Skip EH_LABELs in the beginning of an EH pad if present.
402 while (InsertPos
!= MBB
.end() && InsertPos
->isEHLabel())
404 assert(InsertPos
!= MBB
.end() &&
405 WebAssembly::isCatch(InsertPos
->getOpcode()) &&
406 "catch/catch_all should be present in every EH pad at this point");
407 ++InsertPos
; // Skip the catch instruction
408 FrameLowering
->writeSPToGlobal(FrameLowering
->getSPReg(MF
), MF
, MBB
,
409 InsertPos
, MBB
.begin()->getDebugLoc());