1 //=== WebAssemblyLateEHPrepare.cpp - WebAssembly Exception Preparation -===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// \brief Does various transformations for exception handling.
12 //===----------------------------------------------------------------------===//
14 #include "MCTargetDesc/WebAssemblyMCTargetDesc.h"
15 #include "WebAssembly.h"
16 #include "WebAssemblySubtarget.h"
17 #include "WebAssemblyUtilities.h"
18 #include "llvm/ADT/SmallSet.h"
19 #include "llvm/CodeGen/MachineInstrBuilder.h"
20 #include "llvm/CodeGen/WasmEHFuncInfo.h"
21 #include "llvm/MC/MCAsmInfo.h"
24 #define DEBUG_TYPE "wasm-exception-prepare"
27 class WebAssemblyLateEHPrepare final
: public MachineFunctionPass
{
28 StringRef
getPassName() const override
{
29 return "WebAssembly Late Prepare Exception";
32 bool runOnMachineFunction(MachineFunction
&MF
) override
;
33 bool removeUnnecessaryUnreachables(MachineFunction
&MF
);
34 bool replaceFuncletReturns(MachineFunction
&MF
);
35 bool addCatches(MachineFunction
&MF
);
36 bool addExceptionExtraction(MachineFunction
&MF
);
37 bool restoreStackPointer(MachineFunction
&MF
);
40 static char ID
; // Pass identification, replacement for typeid
41 WebAssemblyLateEHPrepare() : MachineFunctionPass(ID
) {}
43 } // end anonymous namespace
45 char WebAssemblyLateEHPrepare::ID
= 0;
46 INITIALIZE_PASS(WebAssemblyLateEHPrepare
, DEBUG_TYPE
,
47 "WebAssembly Late Exception Preparation", false, false)
49 FunctionPass
*llvm::createWebAssemblyLateEHPrepare() {
50 return new WebAssemblyLateEHPrepare();
53 // Returns the nearest EH pad that dominates this instruction. This does not use
54 // dominator analysis; it just does BFS on its predecessors until arriving at an
55 // EH pad. This assumes valid EH scopes so the first EH pad it arrives in all
56 // possible search paths should be the same.
57 // Returns nullptr in case it does not find any EH pad in the search, or finds
58 // multiple different EH pads.
59 static MachineBasicBlock
*getMatchingEHPad(MachineInstr
*MI
) {
60 MachineFunction
*MF
= MI
->getParent()->getParent();
61 SmallVector
<MachineBasicBlock
*, 2> WL
;
62 SmallPtrSet
<MachineBasicBlock
*, 2> Visited
;
63 WL
.push_back(MI
->getParent());
64 MachineBasicBlock
*EHPad
= nullptr;
66 MachineBasicBlock
*MBB
= WL
.pop_back_val();
67 if (Visited
.count(MBB
))
71 if (EHPad
&& EHPad
!= MBB
)
76 if (MBB
== &MF
->front())
78 WL
.append(MBB
->pred_begin(), MBB
->pred_end());
83 // Erase the specified BBs if the BB does not have any remaining predecessors,
84 // and also all its dead children.
85 template <typename Container
>
86 static void eraseDeadBBsAndChildren(const Container
&MBBs
) {
87 SmallVector
<MachineBasicBlock
*, 8> WL(MBBs
.begin(), MBBs
.end());
89 MachineBasicBlock
*MBB
= WL
.pop_back_val();
90 if (!MBB
->pred_empty())
92 SmallVector
<MachineBasicBlock
*, 4> Succs(MBB
->succ_begin(),
94 WL
.append(MBB
->succ_begin(), MBB
->succ_end());
95 for (auto *Succ
: Succs
)
96 MBB
->removeSuccessor(Succ
);
97 MBB
->eraseFromParent();
101 bool WebAssemblyLateEHPrepare::runOnMachineFunction(MachineFunction
&MF
) {
102 LLVM_DEBUG(dbgs() << "********** Late EH Prepare **********\n"
103 "********** Function: "
104 << MF
.getName() << '\n');
106 if (MF
.getTarget().getMCAsmInfo()->getExceptionHandlingType() !=
107 ExceptionHandling::Wasm
)
110 bool Changed
= false;
111 Changed
|= removeUnnecessaryUnreachables(MF
);
112 if (!MF
.getFunction().hasPersonalityFn())
114 Changed
|= replaceFuncletReturns(MF
);
115 Changed
|= addCatches(MF
);
116 Changed
|= addExceptionExtraction(MF
);
117 Changed
|= restoreStackPointer(MF
);
121 bool WebAssemblyLateEHPrepare::removeUnnecessaryUnreachables(
122 MachineFunction
&MF
) {
123 bool Changed
= false;
124 for (auto &MBB
: MF
) {
125 for (auto &MI
: MBB
) {
126 if (MI
.getOpcode() != WebAssembly::THROW
&&
127 MI
.getOpcode() != WebAssembly::RETHROW
)
131 // The instruction after the throw should be an unreachable or a branch to
132 // another BB that should eventually lead to an unreachable. Delete it
133 // because throw itself is a terminator, and also delete successors if
135 MBB
.erase(std::next(MachineBasicBlock::iterator(MI
)), MBB
.end());
136 SmallVector
<MachineBasicBlock
*, 8> Succs(MBB
.succ_begin(),
138 for (auto *Succ
: Succs
)
139 MBB
.removeSuccessor(Succ
);
140 eraseDeadBBsAndChildren(Succs
);
147 bool WebAssemblyLateEHPrepare::replaceFuncletReturns(MachineFunction
&MF
) {
148 bool Changed
= false;
149 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
151 for (auto &MBB
: MF
) {
152 auto Pos
= MBB
.getFirstTerminator();
153 if (Pos
== MBB
.end())
155 MachineInstr
*TI
= &*Pos
;
157 switch (TI
->getOpcode()) {
158 case WebAssembly::CATCHRET
: {
159 // Replace a catchret with a branch
160 MachineBasicBlock
*TBB
= TI
->getOperand(0).getMBB();
161 if (!MBB
.isLayoutSuccessor(TBB
))
162 BuildMI(MBB
, TI
, TI
->getDebugLoc(), TII
.get(WebAssembly::BR
))
164 TI
->eraseFromParent();
168 case WebAssembly::CLEANUPRET
: {
169 // Replace a cleanupret with a rethrow
170 BuildMI(MBB
, TI
, TI
->getDebugLoc(), TII
.get(WebAssembly::RETHROW
));
171 TI
->eraseFromParent();
180 // Add catch instruction to beginning of catchpads and cleanuppads.
181 bool WebAssemblyLateEHPrepare::addCatches(MachineFunction
&MF
) {
182 bool Changed
= false;
183 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
184 MachineRegisterInfo
&MRI
= MF
.getRegInfo();
185 for (auto &MBB
: MF
) {
189 MRI
.createVirtualRegister(&WebAssembly::EXCEPT_REFRegClass
);
190 BuildMI(MBB
, MBB
.begin(), MBB
.begin()->getDebugLoc(),
191 TII
.get(WebAssembly::CATCH
), DstReg
);
197 // Wasm uses 'br_on_exn' instruction to check the tag of an exception. It takes
198 // except_ref type object returned by 'catch', and branches to the destination
199 // if it matches a given tag. We currently use __cpp_exception symbol to
200 // represent the tag for all C++ exceptions.
202 // block $l (result i32)
204 // ;; except_ref $e is on the stack at this point
205 // br_on_exn $l $e ;; branch to $l with $e's arguments
208 // ;; Here we expect the extracted values are on top of the wasm value stack
209 // ... Handle exception using values ...
211 // br_on_exn takes an except_ref object and branches if it matches the given
212 // tag. There can be multiple br_on_exn instructions if we want to match for
213 // another tag, but for now we only test for __cpp_exception tag, and if it does
214 // not match, i.e., it is a foreign exception, we rethrow it.
216 // In the destination BB that's the target of br_on_exn, extracted exception
217 // values (in C++'s case a single i32, which represents an exception pointer)
218 // are placed on top of the wasm stack. Because we can't model wasm stack in
219 // LLVM instruction, we use 'extract_exception' pseudo instruction to retrieve
220 // it. The pseudo instruction will be deleted later.
221 bool WebAssemblyLateEHPrepare::addExceptionExtraction(MachineFunction
&MF
) {
222 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
223 auto *EHInfo
= MF
.getWasmEHFuncInfo();
224 SmallVector
<MachineInstr
*, 16> ExtractInstrs
;
225 for (auto &MBB
: MF
) {
226 for (auto &MI
: MBB
) {
227 if (MI
.getOpcode() == WebAssembly::EXTRACT_EXCEPTION_I32
) {
228 if (MI
.getOperand(0).isDead())
229 MI
.eraseFromParent();
231 ExtractInstrs
.push_back(&MI
);
235 if (ExtractInstrs
.empty())
238 // Find terminate pads.
239 SmallSet
<MachineBasicBlock
*, 8> TerminatePads
;
240 for (auto &MBB
: MF
) {
241 for (auto &MI
: MBB
) {
243 const MachineOperand
&CalleeOp
= MI
.getOperand(0);
244 if (CalleeOp
.isGlobal() && CalleeOp
.getGlobal()->getName() ==
245 WebAssembly::ClangCallTerminateFn
)
246 TerminatePads
.insert(getMatchingEHPad(&MI
));
251 for (auto *Extract
: ExtractInstrs
) {
252 MachineBasicBlock
*EHPad
= getMatchingEHPad(Extract
);
253 assert(EHPad
&& "No matching EH pad for extract_exception");
254 MachineInstr
*Catch
= &*EHPad
->begin();
255 if (Catch
->getNextNode() != Extract
)
256 EHPad
->insert(Catch
->getNextNode(), Extract
->removeFromParent());
260 // %exnref:except_ref = catch
261 // %exn:i32 = extract_exception
266 // %exnref:except_ref = catch
267 // br_on_exn %thenbb, $__cpp_exception, %exnref
272 // %exn:i32 = extract_exception
274 unsigned ExnRefReg
= Catch
->getOperand(0).getReg();
275 auto *ThenMBB
= MF
.CreateMachineBasicBlock();
276 auto *ElseMBB
= MF
.CreateMachineBasicBlock();
277 MF
.insert(std::next(MachineFunction::iterator(EHPad
)), ElseMBB
);
278 MF
.insert(std::next(MachineFunction::iterator(ElseMBB
)), ThenMBB
);
279 ThenMBB
->splice(ThenMBB
->end(), EHPad
, Extract
, EHPad
->end());
280 ThenMBB
->transferSuccessors(EHPad
);
281 EHPad
->addSuccessor(ThenMBB
);
282 EHPad
->addSuccessor(ElseMBB
);
284 DebugLoc DL
= Extract
->getDebugLoc();
285 const char *CPPExnSymbol
= MF
.createExternalSymbolName("__cpp_exception");
286 BuildMI(EHPad
, DL
, TII
.get(WebAssembly::BR_ON_EXN
))
288 .addExternalSymbol(CPPExnSymbol
, WebAssemblyII::MO_SYMBOL_EVENT
)
290 BuildMI(EHPad
, DL
, TII
.get(WebAssembly::BR
)).addMBB(ElseMBB
);
292 // When this is a terminate pad with __clang_call_terminate() call, we don't
293 // rethrow it anymore and call __clang_call_terminate() with a nullptr
294 // argument, which will call std::terminate().
298 // %exnref:except_ref = catch
299 // %exn:i32 = extract_exception
300 // call @__clang_call_terminate(%exn)
305 // %exnref:except_ref = catch
306 // br_on_exn %thenbb, $__cpp_exception, %exnref
309 // call @__clang_call_terminate(0)
312 // %exn:i32 = extract_exception
313 // call @__clang_call_terminate(%exn)
315 if (TerminatePads
.count(EHPad
)) {
316 Function
*ClangCallTerminateFn
=
317 MF
.getFunction().getParent()->getFunction(
318 WebAssembly::ClangCallTerminateFn
);
319 assert(ClangCallTerminateFn
&&
320 "There is no __clang_call_terminate() function");
321 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::CALL_VOID
))
322 .addGlobalAddress(ClangCallTerminateFn
)
324 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::UNREACHABLE
));
327 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::RETHROW
));
328 if (EHInfo
->hasEHPadUnwindDest(EHPad
))
329 EHInfo
->setThrowUnwindDest(ElseMBB
, EHInfo
->getEHPadUnwindDest(EHPad
));
336 // After the stack is unwound due to a thrown exception, the __stack_pointer
337 // global can point to an invalid address. This inserts instructions that
338 // restore __stack_pointer global.
339 bool WebAssemblyLateEHPrepare::restoreStackPointer(MachineFunction
&MF
) {
340 const auto *FrameLowering
= static_cast<const WebAssemblyFrameLowering
*>(
341 MF
.getSubtarget().getFrameLowering());
342 if (!FrameLowering
->needsPrologForEH(MF
))
344 bool Changed
= false;
346 for (auto &MBB
: MF
) {
351 // Insert __stack_pointer restoring instructions at the beginning of each EH
352 // pad, after the catch instruction. Here it is safe to assume that SP32
353 // holds the latest value of __stack_pointer, because the only exception for
354 // this case is when a function uses the red zone, but that only happens
355 // with leaf functions, and we don't restore __stack_pointer in leaf
357 auto InsertPos
= MBB
.begin();
358 if (MBB
.begin()->getOpcode() == WebAssembly::CATCH
)
360 FrameLowering
->writeSPToGlobal(WebAssembly::SP32
, MF
, MBB
, InsertPos
,
361 MBB
.begin()->getDebugLoc());