1 //=== WebAssemblyLateEHPrepare.cpp - WebAssembly Exception Preparation -===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
10 /// \brief Does various transformations for exception handling.
12 //===----------------------------------------------------------------------===//
14 #include "MCTargetDesc/WebAssemblyMCTargetDesc.h"
15 #include "WebAssembly.h"
16 #include "WebAssemblySubtarget.h"
17 #include "WebAssemblyUtilities.h"
18 #include "llvm/ADT/SmallSet.h"
19 #include "llvm/CodeGen/MachineInstrBuilder.h"
20 #include "llvm/CodeGen/WasmEHFuncInfo.h"
21 #include "llvm/MC/MCAsmInfo.h"
24 #define DEBUG_TYPE "wasm-late-eh-prepare"
27 class WebAssemblyLateEHPrepare final
: public MachineFunctionPass
{
28 StringRef
getPassName() const override
{
29 return "WebAssembly Late Prepare Exception";
32 bool runOnMachineFunction(MachineFunction
&MF
) override
;
33 bool addCatches(MachineFunction
&MF
);
34 bool replaceFuncletReturns(MachineFunction
&MF
);
35 bool removeUnnecessaryUnreachables(MachineFunction
&MF
);
36 bool addExceptionExtraction(MachineFunction
&MF
);
37 bool restoreStackPointer(MachineFunction
&MF
);
40 static char ID
; // Pass identification, replacement for typeid
41 WebAssemblyLateEHPrepare() : MachineFunctionPass(ID
) {}
43 } // end anonymous namespace
45 char WebAssemblyLateEHPrepare::ID
= 0;
46 INITIALIZE_PASS(WebAssemblyLateEHPrepare
, DEBUG_TYPE
,
47 "WebAssembly Late Exception Preparation", false, false)
49 FunctionPass
*llvm::createWebAssemblyLateEHPrepare() {
50 return new WebAssemblyLateEHPrepare();
53 // Returns the nearest EH pad that dominates this instruction. This does not use
54 // dominator analysis; it just does BFS on its predecessors until arriving at an
55 // EH pad. This assumes valid EH scopes so the first EH pad it arrives in all
56 // possible search paths should be the same.
57 // Returns nullptr in case it does not find any EH pad in the search, or finds
58 // multiple different EH pads.
59 static MachineBasicBlock
*getMatchingEHPad(MachineInstr
*MI
) {
60 MachineFunction
*MF
= MI
->getParent()->getParent();
61 SmallVector
<MachineBasicBlock
*, 2> WL
;
62 SmallPtrSet
<MachineBasicBlock
*, 2> Visited
;
63 WL
.push_back(MI
->getParent());
64 MachineBasicBlock
*EHPad
= nullptr;
66 MachineBasicBlock
*MBB
= WL
.pop_back_val();
67 if (Visited
.count(MBB
))
71 if (EHPad
&& EHPad
!= MBB
)
76 if (MBB
== &MF
->front())
78 WL
.append(MBB
->pred_begin(), MBB
->pred_end());
83 // Erase the specified BBs if the BB does not have any remaining predecessors,
84 // and also all its dead children.
85 template <typename Container
>
86 static void eraseDeadBBsAndChildren(const Container
&MBBs
) {
87 SmallVector
<MachineBasicBlock
*, 8> WL(MBBs
.begin(), MBBs
.end());
89 MachineBasicBlock
*MBB
= WL
.pop_back_val();
90 if (!MBB
->pred_empty())
92 SmallVector
<MachineBasicBlock
*, 4> Succs(MBB
->succ_begin(),
94 WL
.append(MBB
->succ_begin(), MBB
->succ_end());
95 for (auto *Succ
: Succs
)
96 MBB
->removeSuccessor(Succ
);
97 MBB
->eraseFromParent();
101 bool WebAssemblyLateEHPrepare::runOnMachineFunction(MachineFunction
&MF
) {
102 LLVM_DEBUG(dbgs() << "********** Late EH Prepare **********\n"
103 "********** Function: "
104 << MF
.getName() << '\n');
106 if (MF
.getTarget().getMCAsmInfo()->getExceptionHandlingType() !=
107 ExceptionHandling::Wasm
)
110 bool Changed
= false;
111 if (MF
.getFunction().hasPersonalityFn()) {
112 Changed
|= addCatches(MF
);
113 Changed
|= replaceFuncletReturns(MF
);
115 Changed
|= removeUnnecessaryUnreachables(MF
);
116 if (MF
.getFunction().hasPersonalityFn()) {
117 Changed
|= addExceptionExtraction(MF
);
118 Changed
|= restoreStackPointer(MF
);
123 // Add catch instruction to beginning of catchpads and cleanuppads.
124 bool WebAssemblyLateEHPrepare::addCatches(MachineFunction
&MF
) {
125 bool Changed
= false;
126 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
127 MachineRegisterInfo
&MRI
= MF
.getRegInfo();
128 for (auto &MBB
: MF
) {
131 auto InsertPos
= MBB
.begin();
132 if (InsertPos
->isEHLabel()) // EH pad starts with an EH label
134 Register DstReg
= MRI
.createVirtualRegister(&WebAssembly::EXNREFRegClass
);
135 BuildMI(MBB
, InsertPos
, MBB
.begin()->getDebugLoc(),
136 TII
.get(WebAssembly::CATCH
), DstReg
);
142 bool WebAssemblyLateEHPrepare::replaceFuncletReturns(MachineFunction
&MF
) {
143 bool Changed
= false;
144 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
146 for (auto &MBB
: MF
) {
147 auto Pos
= MBB
.getFirstTerminator();
148 if (Pos
== MBB
.end())
150 MachineInstr
*TI
= &*Pos
;
152 switch (TI
->getOpcode()) {
153 case WebAssembly::CATCHRET
: {
154 // Replace a catchret with a branch
155 MachineBasicBlock
*TBB
= TI
->getOperand(0).getMBB();
156 if (!MBB
.isLayoutSuccessor(TBB
))
157 BuildMI(MBB
, TI
, TI
->getDebugLoc(), TII
.get(WebAssembly::BR
))
159 TI
->eraseFromParent();
163 case WebAssembly::CLEANUPRET
:
164 case WebAssembly::RETHROW_IN_CATCH
: {
165 // Replace a cleanupret/rethrow_in_catch with a rethrow
166 auto *EHPad
= getMatchingEHPad(TI
);
167 auto CatchPos
= EHPad
->begin();
168 if (CatchPos
->isEHLabel()) // EH pad starts with an EH label
170 MachineInstr
*Catch
= &*CatchPos
;
171 Register ExnReg
= Catch
->getOperand(0).getReg();
172 BuildMI(MBB
, TI
, TI
->getDebugLoc(), TII
.get(WebAssembly::RETHROW
))
174 TI
->eraseFromParent();
183 bool WebAssemblyLateEHPrepare::removeUnnecessaryUnreachables(
184 MachineFunction
&MF
) {
185 bool Changed
= false;
186 for (auto &MBB
: MF
) {
187 for (auto &MI
: MBB
) {
188 if (MI
.getOpcode() != WebAssembly::THROW
&&
189 MI
.getOpcode() != WebAssembly::RETHROW
)
193 // The instruction after the throw should be an unreachable or a branch to
194 // another BB that should eventually lead to an unreachable. Delete it
195 // because throw itself is a terminator, and also delete successors if
197 MBB
.erase(std::next(MI
.getIterator()), MBB
.end());
198 SmallVector
<MachineBasicBlock
*, 8> Succs(MBB
.succ_begin(),
200 for (auto *Succ
: Succs
)
201 if (!Succ
->isEHPad())
202 MBB
.removeSuccessor(Succ
);
203 eraseDeadBBsAndChildren(Succs
);
210 // Wasm uses 'br_on_exn' instruction to check the tag of an exception. It takes
211 // exnref type object returned by 'catch', and branches to the destination if it
212 // matches a given tag. We currently use __cpp_exception symbol to represent the
213 // tag for all C++ exceptions.
215 // block $l (result i32)
217 // ;; exnref $e is on the stack at this point
218 // br_on_exn $l $e ;; branch to $l with $e's arguments
221 // ;; Here we expect the extracted values are on top of the wasm value stack
222 // ... Handle exception using values ...
224 // br_on_exn takes an exnref object and branches if it matches the given tag.
225 // There can be multiple br_on_exn instructions if we want to match for another
226 // tag, but for now we only test for __cpp_exception tag, and if it does not
227 // match, i.e., it is a foreign exception, we rethrow it.
229 // In the destination BB that's the target of br_on_exn, extracted exception
230 // values (in C++'s case a single i32, which represents an exception pointer)
231 // are placed on top of the wasm stack. Because we can't model wasm stack in
232 // LLVM instruction, we use 'extract_exception' pseudo instruction to retrieve
233 // it. The pseudo instruction will be deleted later.
234 bool WebAssemblyLateEHPrepare::addExceptionExtraction(MachineFunction
&MF
) {
235 const auto &TII
= *MF
.getSubtarget
<WebAssemblySubtarget
>().getInstrInfo();
236 MachineRegisterInfo
&MRI
= MF
.getRegInfo();
237 auto *EHInfo
= MF
.getWasmEHFuncInfo();
238 SmallVector
<MachineInstr
*, 16> ExtractInstrs
;
239 SmallVector
<MachineInstr
*, 8> ToDelete
;
240 for (auto &MBB
: MF
) {
241 for (auto &MI
: MBB
) {
242 if (MI
.getOpcode() == WebAssembly::EXTRACT_EXCEPTION_I32
) {
243 if (MI
.getOperand(0).isDead())
244 ToDelete
.push_back(&MI
);
246 ExtractInstrs
.push_back(&MI
);
250 bool Changed
= !ToDelete
.empty() || !ExtractInstrs
.empty();
251 for (auto *MI
: ToDelete
)
252 MI
->eraseFromParent();
253 if (ExtractInstrs
.empty())
256 // Find terminate pads.
257 SmallSet
<MachineBasicBlock
*, 8> TerminatePads
;
258 for (auto &MBB
: MF
) {
259 for (auto &MI
: MBB
) {
261 const MachineOperand
&CalleeOp
= MI
.getOperand(0);
262 if (CalleeOp
.isGlobal() && CalleeOp
.getGlobal()->getName() ==
263 WebAssembly::ClangCallTerminateFn
)
264 TerminatePads
.insert(getMatchingEHPad(&MI
));
269 for (auto *Extract
: ExtractInstrs
) {
270 MachineBasicBlock
*EHPad
= getMatchingEHPad(Extract
);
271 assert(EHPad
&& "No matching EH pad for extract_exception");
272 auto CatchPos
= EHPad
->begin();
273 if (CatchPos
->isEHLabel()) // EH pad starts with an EH label
275 MachineInstr
*Catch
= &*CatchPos
;
277 if (Catch
->getNextNode() != Extract
)
278 EHPad
->insert(Catch
->getNextNode(), Extract
->removeFromParent());
282 // %exnref:exnref = catch
283 // %exn:i32 = extract_exception
288 // %exnref:exnref = catch
289 // br_on_exn %thenbb, $__cpp_exception, %exnref
294 // %exn:i32 = extract_exception
296 Register ExnReg
= Catch
->getOperand(0).getReg();
297 auto *ThenMBB
= MF
.CreateMachineBasicBlock();
298 auto *ElseMBB
= MF
.CreateMachineBasicBlock();
299 MF
.insert(std::next(MachineFunction::iterator(EHPad
)), ElseMBB
);
300 MF
.insert(std::next(MachineFunction::iterator(ElseMBB
)), ThenMBB
);
301 ThenMBB
->splice(ThenMBB
->end(), EHPad
, Extract
, EHPad
->end());
302 ThenMBB
->transferSuccessors(EHPad
);
303 EHPad
->addSuccessor(ThenMBB
);
304 EHPad
->addSuccessor(ElseMBB
);
306 DebugLoc DL
= Extract
->getDebugLoc();
307 const char *CPPExnSymbol
= MF
.createExternalSymbolName("__cpp_exception");
308 BuildMI(EHPad
, DL
, TII
.get(WebAssembly::BR_ON_EXN
))
310 .addExternalSymbol(CPPExnSymbol
)
312 BuildMI(EHPad
, DL
, TII
.get(WebAssembly::BR
)).addMBB(ElseMBB
);
314 // When this is a terminate pad with __clang_call_terminate() call, we don't
315 // rethrow it anymore and call __clang_call_terminate() with a nullptr
316 // argument, which will call std::terminate().
320 // %exnref:exnref = catch
321 // %exn:i32 = extract_exception
322 // call @__clang_call_terminate(%exn)
327 // %exnref:exnref = catch
328 // br_on_exn %thenbb, $__cpp_exception, %exnref
331 // call @__clang_call_terminate(0)
334 // %exn:i32 = extract_exception
335 // call @__clang_call_terminate(%exn)
337 if (TerminatePads
.count(EHPad
)) {
338 Function
*ClangCallTerminateFn
=
339 MF
.getFunction().getParent()->getFunction(
340 WebAssembly::ClangCallTerminateFn
);
341 assert(ClangCallTerminateFn
&&
342 "There is no __clang_call_terminate() function");
343 Register Reg
= MRI
.createVirtualRegister(&WebAssembly::I32RegClass
);
344 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::CONST_I32
), Reg
).addImm(0);
345 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::CALL_VOID
))
346 .addGlobalAddress(ClangCallTerminateFn
)
348 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::UNREACHABLE
));
351 BuildMI(ElseMBB
, DL
, TII
.get(WebAssembly::RETHROW
)).addReg(ExnReg
);
352 if (EHInfo
->hasEHPadUnwindDest(EHPad
))
353 ElseMBB
->addSuccessor(EHInfo
->getEHPadUnwindDest(EHPad
));
360 // After the stack is unwound due to a thrown exception, the __stack_pointer
361 // global can point to an invalid address. This inserts instructions that
362 // restore __stack_pointer global.
363 bool WebAssemblyLateEHPrepare::restoreStackPointer(MachineFunction
&MF
) {
364 const auto *FrameLowering
= static_cast<const WebAssemblyFrameLowering
*>(
365 MF
.getSubtarget().getFrameLowering());
366 if (!FrameLowering
->needsPrologForEH(MF
))
368 bool Changed
= false;
370 for (auto &MBB
: MF
) {
375 // Insert __stack_pointer restoring instructions at the beginning of each EH
376 // pad, after the catch instruction. Here it is safe to assume that SP32
377 // holds the latest value of __stack_pointer, because the only exception for
378 // this case is when a function uses the red zone, but that only happens
379 // with leaf functions, and we don't restore __stack_pointer in leaf
381 auto InsertPos
= MBB
.begin();
382 if (InsertPos
->isEHLabel()) // EH pad starts with an EH label
384 if (InsertPos
->getOpcode() == WebAssembly::CATCH
)
386 FrameLowering
->writeSPToGlobal(WebAssembly::SP32
, MF
, MBB
, InsertPos
,
387 MBB
.begin()->getDebugLoc());