//===-- WebAssemblyCFGStackify.cpp - CFG Stackification -------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// \file
/// This file implements a CFG stacking pass.
///
/// This pass inserts BLOCK, LOOP, and TRY markers to mark the start of scopes,
/// since scope boundaries serve as the labels for WebAssembly's control
/// transfers.
///
/// This is sufficient to convert arbitrary CFGs into a form that works on
/// WebAssembly, provided that all loops are single-entry.
///
/// In case we use exceptions, this pass also fixes mismatches in unwind
/// destinations created during transforming CFG into wasm structured format.
21e76fa9ecSHeejin Ahn /// 22950a13cfSDan Gohman //===----------------------------------------------------------------------===// 23950a13cfSDan Gohman 246bda14b3SChandler Carruth #include "WebAssembly.h" 25e76fa9ecSHeejin Ahn #include "WebAssemblyExceptionInfo.h" 26ed0f1138SDan Gohman #include "WebAssemblyMachineFunctionInfo.h" 27276f9e8cSHeejin Ahn #include "WebAssemblySortRegion.h" 28950a13cfSDan Gohman #include "WebAssemblySubtarget.h" 294fc4e42dSDan Gohman #include "WebAssemblyUtilities.h" 30c4ac74fbSHeejin Ahn #include "llvm/ADT/Statistic.h" 3132807932SDan Gohman #include "llvm/CodeGen/MachineDominators.h" 32950a13cfSDan Gohman #include "llvm/CodeGen/MachineInstrBuilder.h" 33904cd3e0SReid Kleckner #include "llvm/CodeGen/MachineLoopInfo.h" 34e76fa9ecSHeejin Ahn #include "llvm/MC/MCAsmInfo.h" 35fe0006c8SSimon Pilgrim #include "llvm/Target/TargetMachine.h" 36950a13cfSDan Gohman using namespace llvm; 37276f9e8cSHeejin Ahn using WebAssembly::SortRegionInfo; 38950a13cfSDan Gohman 39950a13cfSDan Gohman #define DEBUG_TYPE "wasm-cfg-stackify" 40950a13cfSDan Gohman 41*ed41945fSHeejin Ahn STATISTIC(NumCallUnwindMismatches, "Number of call unwind mismatches found"); 42c4ac74fbSHeejin Ahn 43950a13cfSDan Gohman namespace { 44950a13cfSDan Gohman class WebAssemblyCFGStackify final : public MachineFunctionPass { 45117296c0SMehdi Amini StringRef getPassName() const override { return "WebAssembly CFG Stackify"; } 46950a13cfSDan Gohman 47950a13cfSDan Gohman void getAnalysisUsage(AnalysisUsage &AU) const override { 4832807932SDan Gohman AU.addRequired<MachineDominatorTree>(); 49950a13cfSDan Gohman AU.addRequired<MachineLoopInfo>(); 50e76fa9ecSHeejin Ahn AU.addRequired<WebAssemblyExceptionInfo>(); 51950a13cfSDan Gohman MachineFunctionPass::getAnalysisUsage(AU); 52950a13cfSDan Gohman } 53950a13cfSDan Gohman 54950a13cfSDan Gohman bool runOnMachineFunction(MachineFunction &MF) override; 55950a13cfSDan Gohman 56e76fa9ecSHeejin Ahn // For each block whose label represents the end of a 
scope, record the block 57e76fa9ecSHeejin Ahn // which holds the beginning of the scope. This will allow us to quickly skip 58e76fa9ecSHeejin Ahn // over scoped regions when walking blocks. 59e76fa9ecSHeejin Ahn SmallVector<MachineBasicBlock *, 8> ScopeTops; 601cc52357SHeejin Ahn void updateScopeTops(MachineBasicBlock *Begin, MachineBasicBlock *End) { 611cc52357SHeejin Ahn int EndNo = End->getNumber(); 621cc52357SHeejin Ahn if (!ScopeTops[EndNo] || ScopeTops[EndNo]->getNumber() > Begin->getNumber()) 631cc52357SHeejin Ahn ScopeTops[EndNo] = Begin; 641cc52357SHeejin Ahn } 65e76fa9ecSHeejin Ahn 66c4ac74fbSHeejin Ahn // Placing markers. 67e76fa9ecSHeejin Ahn void placeMarkers(MachineFunction &MF); 68e76fa9ecSHeejin Ahn void placeBlockMarker(MachineBasicBlock &MBB); 69e76fa9ecSHeejin Ahn void placeLoopMarker(MachineBasicBlock &MBB); 70e76fa9ecSHeejin Ahn void placeTryMarker(MachineBasicBlock &MBB); 71*ed41945fSHeejin Ahn 72*ed41945fSHeejin Ahn // Exception handling related functions 73*ed41945fSHeejin Ahn bool fixCallUnwindMismatches(MachineFunction &MF); 74*ed41945fSHeejin Ahn bool fixCatchUnwindMismatches(MachineFunction &MF); 75*ed41945fSHeejin Ahn void addTryDelegate(MachineInstr *RangeBegin, MachineInstr *RangeEnd, 76*ed41945fSHeejin Ahn MachineBasicBlock *DelegateDest); 77*ed41945fSHeejin Ahn void recalculateScopeTops(MachineFunction &MF); 78cf699b45SHeejin Ahn void removeUnnecessaryInstrs(MachineFunction &MF); 79*ed41945fSHeejin Ahn 80*ed41945fSHeejin Ahn // Wrap-up 81*ed41945fSHeejin Ahn unsigned getDepth(const SmallVectorImpl<const MachineBasicBlock *> &Stack, 82*ed41945fSHeejin Ahn const MachineBasicBlock *MBB); 83e76fa9ecSHeejin Ahn void rewriteDepthImmediates(MachineFunction &MF); 84e76fa9ecSHeejin Ahn void fixEndsAtEndOfFunction(MachineFunction &MF); 85*ed41945fSHeejin Ahn void cleanupFunctionData(MachineFunction &MF); 86e76fa9ecSHeejin Ahn 87*ed41945fSHeejin Ahn // For each BLOCK|LOOP|TRY, the corresponding END_(BLOCK|LOOP|TRY) or DELEGATE 
88*ed41945fSHeejin Ahn // (in case of TRY). 89e76fa9ecSHeejin Ahn DenseMap<const MachineInstr *, MachineInstr *> BeginToEnd; 90*ed41945fSHeejin Ahn // For each END_(BLOCK|LOOP|TRY) or DELEGATE, the corresponding 91*ed41945fSHeejin Ahn // BLOCK|LOOP|TRY. 92e76fa9ecSHeejin Ahn DenseMap<const MachineInstr *, MachineInstr *> EndToBegin; 93e76fa9ecSHeejin Ahn // <TRY marker, EH pad> map 94e76fa9ecSHeejin Ahn DenseMap<const MachineInstr *, MachineBasicBlock *> TryToEHPad; 95e76fa9ecSHeejin Ahn // <EH pad, TRY marker> map 96e76fa9ecSHeejin Ahn DenseMap<const MachineBasicBlock *, MachineInstr *> EHPadToTry; 97e76fa9ecSHeejin Ahn 98*ed41945fSHeejin Ahn // We need an appendix block to place 'end_loop' or 'end_try' marker when the 99*ed41945fSHeejin Ahn // loop / exception bottom block is the last block in a function 100c4ac74fbSHeejin Ahn MachineBasicBlock *AppendixBB = nullptr; 101c4ac74fbSHeejin Ahn MachineBasicBlock *getAppendixBlock(MachineFunction &MF) { 102c4ac74fbSHeejin Ahn if (!AppendixBB) { 103c4ac74fbSHeejin Ahn AppendixBB = MF.CreateMachineBasicBlock(); 104c4ac74fbSHeejin Ahn // Give it a fake predecessor so that AsmPrinter prints its label. 105c4ac74fbSHeejin Ahn AppendixBB->addSuccessor(AppendixBB); 106c4ac74fbSHeejin Ahn MF.push_back(AppendixBB); 107c4ac74fbSHeejin Ahn } 108c4ac74fbSHeejin Ahn return AppendixBB; 109c4ac74fbSHeejin Ahn } 110c4ac74fbSHeejin Ahn 111*ed41945fSHeejin Ahn // Before running rewriteDepthImmediates function, 'delegate' has a BB as its 112*ed41945fSHeejin Ahn // destination operand. getFakeCallerBlock() returns a fake BB that will be 113*ed41945fSHeejin Ahn // used for the operand when 'delegate' needs to rethrow to the caller. This 114*ed41945fSHeejin Ahn // will be rewritten as an immediate value that is the number of block depths 115*ed41945fSHeejin Ahn // + 1 in rewriteDepthImmediates, and this fake BB will be removed at the end 116*ed41945fSHeejin Ahn // of the pass. 
117*ed41945fSHeejin Ahn MachineBasicBlock *FakeCallerBB = nullptr; 118*ed41945fSHeejin Ahn MachineBasicBlock *getFakeCallerBlock(MachineFunction &MF) { 119*ed41945fSHeejin Ahn if (!FakeCallerBB) 120*ed41945fSHeejin Ahn FakeCallerBB = MF.CreateMachineBasicBlock(); 121*ed41945fSHeejin Ahn return FakeCallerBB; 122*ed41945fSHeejin Ahn } 123*ed41945fSHeejin Ahn 124cf699b45SHeejin Ahn // Helper functions to register / unregister scope information created by 125cf699b45SHeejin Ahn // marker instructions. 126e76fa9ecSHeejin Ahn void registerScope(MachineInstr *Begin, MachineInstr *End); 127e76fa9ecSHeejin Ahn void registerTryScope(MachineInstr *Begin, MachineInstr *End, 128e76fa9ecSHeejin Ahn MachineBasicBlock *EHPad); 129cf699b45SHeejin Ahn void unregisterScope(MachineInstr *Begin); 130e76fa9ecSHeejin Ahn 131950a13cfSDan Gohman public: 132950a13cfSDan Gohman static char ID; // Pass identification, replacement for typeid 133950a13cfSDan Gohman WebAssemblyCFGStackify() : MachineFunctionPass(ID) {} 134e76fa9ecSHeejin Ahn ~WebAssemblyCFGStackify() override { releaseMemory(); } 135e76fa9ecSHeejin Ahn void releaseMemory() override; 136950a13cfSDan Gohman }; 137950a13cfSDan Gohman } // end anonymous namespace 138950a13cfSDan Gohman 139950a13cfSDan Gohman char WebAssemblyCFGStackify::ID = 0; 14040926451SJacob Gravelle INITIALIZE_PASS(WebAssemblyCFGStackify, DEBUG_TYPE, 141c4ac74fbSHeejin Ahn "Insert BLOCK/LOOP/TRY markers for WebAssembly scopes", false, 142f208f631SHeejin Ahn false) 14340926451SJacob Gravelle 144950a13cfSDan Gohman FunctionPass *llvm::createWebAssemblyCFGStackify() { 145950a13cfSDan Gohman return new WebAssemblyCFGStackify(); 146950a13cfSDan Gohman } 147950a13cfSDan Gohman 148b3aa1ecaSDan Gohman /// Test whether Pred has any terminators explicitly branching to MBB, as 149b3aa1ecaSDan Gohman /// opposed to falling through. Note that it's possible (eg. 
in unoptimized 150b3aa1ecaSDan Gohman /// code) for a branch instruction to both branch to a block and fallthrough 151b3aa1ecaSDan Gohman /// to it, so we check the actual branch operands to see if there are any 152b3aa1ecaSDan Gohman /// explicit mentions. 15318c56a07SHeejin Ahn static bool explicitlyBranchesTo(MachineBasicBlock *Pred, 15435e4a289SDan Gohman MachineBasicBlock *MBB) { 155b3aa1ecaSDan Gohman for (MachineInstr &MI : Pred->terminators()) 156b3aa1ecaSDan Gohman for (MachineOperand &MO : MI.explicit_operands()) 157b3aa1ecaSDan Gohman if (MO.isMBB() && MO.getMBB() == MBB) 158b3aa1ecaSDan Gohman return true; 159b3aa1ecaSDan Gohman return false; 160b3aa1ecaSDan Gohman } 161b3aa1ecaSDan Gohman 162e76fa9ecSHeejin Ahn // Returns an iterator to the earliest position possible within the MBB, 163e76fa9ecSHeejin Ahn // satisfying the restrictions given by BeforeSet and AfterSet. BeforeSet 164e76fa9ecSHeejin Ahn // contains instructions that should go before the marker, and AfterSet contains 165e76fa9ecSHeejin Ahn // ones that should go after the marker. In this function, AfterSet is only 166e76fa9ecSHeejin Ahn // used for sanity checking. 
1671cc52357SHeejin Ahn template <typename Container> 168e76fa9ecSHeejin Ahn static MachineBasicBlock::iterator 1691cc52357SHeejin Ahn getEarliestInsertPos(MachineBasicBlock *MBB, const Container &BeforeSet, 1701cc52357SHeejin Ahn const Container &AfterSet) { 171e76fa9ecSHeejin Ahn auto InsertPos = MBB->end(); 172e76fa9ecSHeejin Ahn while (InsertPos != MBB->begin()) { 173e76fa9ecSHeejin Ahn if (BeforeSet.count(&*std::prev(InsertPos))) { 174e76fa9ecSHeejin Ahn #ifndef NDEBUG 175e76fa9ecSHeejin Ahn // Sanity check 176e76fa9ecSHeejin Ahn for (auto Pos = InsertPos, E = MBB->begin(); Pos != E; --Pos) 177e76fa9ecSHeejin Ahn assert(!AfterSet.count(&*std::prev(Pos))); 178e76fa9ecSHeejin Ahn #endif 179e76fa9ecSHeejin Ahn break; 180e76fa9ecSHeejin Ahn } 181e76fa9ecSHeejin Ahn --InsertPos; 182e76fa9ecSHeejin Ahn } 183e76fa9ecSHeejin Ahn return InsertPos; 184e76fa9ecSHeejin Ahn } 185e76fa9ecSHeejin Ahn 186e76fa9ecSHeejin Ahn // Returns an iterator to the latest position possible within the MBB, 187e76fa9ecSHeejin Ahn // satisfying the restrictions given by BeforeSet and AfterSet. BeforeSet 188e76fa9ecSHeejin Ahn // contains instructions that should go before the marker, and AfterSet contains 189e76fa9ecSHeejin Ahn // ones that should go after the marker. In this function, BeforeSet is only 190e76fa9ecSHeejin Ahn // used for sanity checking. 
1911cc52357SHeejin Ahn template <typename Container> 192e76fa9ecSHeejin Ahn static MachineBasicBlock::iterator 1931cc52357SHeejin Ahn getLatestInsertPos(MachineBasicBlock *MBB, const Container &BeforeSet, 1941cc52357SHeejin Ahn const Container &AfterSet) { 195e76fa9ecSHeejin Ahn auto InsertPos = MBB->begin(); 196e76fa9ecSHeejin Ahn while (InsertPos != MBB->end()) { 197e76fa9ecSHeejin Ahn if (AfterSet.count(&*InsertPos)) { 198e76fa9ecSHeejin Ahn #ifndef NDEBUG 199e76fa9ecSHeejin Ahn // Sanity check 200e76fa9ecSHeejin Ahn for (auto Pos = InsertPos, E = MBB->end(); Pos != E; ++Pos) 201e76fa9ecSHeejin Ahn assert(!BeforeSet.count(&*Pos)); 202e76fa9ecSHeejin Ahn #endif 203e76fa9ecSHeejin Ahn break; 204e76fa9ecSHeejin Ahn } 205e76fa9ecSHeejin Ahn ++InsertPos; 206e76fa9ecSHeejin Ahn } 207e76fa9ecSHeejin Ahn return InsertPos; 208e76fa9ecSHeejin Ahn } 209e76fa9ecSHeejin Ahn 210e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::registerScope(MachineInstr *Begin, 211e76fa9ecSHeejin Ahn MachineInstr *End) { 212e76fa9ecSHeejin Ahn BeginToEnd[Begin] = End; 213e76fa9ecSHeejin Ahn EndToBegin[End] = Begin; 214e76fa9ecSHeejin Ahn } 215e76fa9ecSHeejin Ahn 216*ed41945fSHeejin Ahn // When 'End' is not an 'end_try' but 'delegate, EHPad is nullptr. 
217e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::registerTryScope(MachineInstr *Begin, 218e76fa9ecSHeejin Ahn MachineInstr *End, 219e76fa9ecSHeejin Ahn MachineBasicBlock *EHPad) { 220e76fa9ecSHeejin Ahn registerScope(Begin, End); 221e76fa9ecSHeejin Ahn TryToEHPad[Begin] = EHPad; 222e76fa9ecSHeejin Ahn EHPadToTry[EHPad] = Begin; 223e76fa9ecSHeejin Ahn } 224e76fa9ecSHeejin Ahn 225cf699b45SHeejin Ahn void WebAssemblyCFGStackify::unregisterScope(MachineInstr *Begin) { 226cf699b45SHeejin Ahn assert(BeginToEnd.count(Begin)); 227cf699b45SHeejin Ahn MachineInstr *End = BeginToEnd[Begin]; 228cf699b45SHeejin Ahn assert(EndToBegin.count(End)); 229cf699b45SHeejin Ahn BeginToEnd.erase(Begin); 230cf699b45SHeejin Ahn EndToBegin.erase(End); 231cf699b45SHeejin Ahn MachineBasicBlock *EHPad = TryToEHPad.lookup(Begin); 232cf699b45SHeejin Ahn if (EHPad) { 233cf699b45SHeejin Ahn assert(EHPadToTry.count(EHPad)); 234cf699b45SHeejin Ahn TryToEHPad.erase(Begin); 235cf699b45SHeejin Ahn EHPadToTry.erase(EHPad); 236cf699b45SHeejin Ahn } 237cf699b45SHeejin Ahn } 238cf699b45SHeejin Ahn 23932807932SDan Gohman /// Insert a BLOCK marker for branches to MBB (if needed). 240c4ac74fbSHeejin Ahn // TODO Consider a more generalized way of handling block (and also loop and 241c4ac74fbSHeejin Ahn // try) signatures when we implement the multi-value proposal later. 
242e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::placeBlockMarker(MachineBasicBlock &MBB) { 24344a5a4b1SHeejin Ahn assert(!MBB.isEHPad()); 244e76fa9ecSHeejin Ahn MachineFunction &MF = *MBB.getParent(); 245e76fa9ecSHeejin Ahn auto &MDT = getAnalysis<MachineDominatorTree>(); 246e76fa9ecSHeejin Ahn const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo(); 247e76fa9ecSHeejin Ahn const auto &MFI = *MF.getInfo<WebAssemblyFunctionInfo>(); 248e76fa9ecSHeejin Ahn 2498fe7e86bSDan Gohman // First compute the nearest common dominator of all forward non-fallthrough 2508fe7e86bSDan Gohman // predecessors so that we minimize the time that the BLOCK is on the stack, 2518fe7e86bSDan Gohman // which reduces overall stack height. 25232807932SDan Gohman MachineBasicBlock *Header = nullptr; 25332807932SDan Gohman bool IsBranchedTo = false; 25432807932SDan Gohman int MBBNumber = MBB.getNumber(); 255e76fa9ecSHeejin Ahn for (MachineBasicBlock *Pred : MBB.predecessors()) { 25632807932SDan Gohman if (Pred->getNumber() < MBBNumber) { 25732807932SDan Gohman Header = Header ? MDT.findNearestCommonDominator(Header, Pred) : Pred; 25852e240a0SHeejin Ahn if (explicitlyBranchesTo(Pred, &MBB)) 25932807932SDan Gohman IsBranchedTo = true; 26032807932SDan Gohman } 261e76fa9ecSHeejin Ahn } 26232807932SDan Gohman if (!Header) 26332807932SDan Gohman return; 26432807932SDan Gohman if (!IsBranchedTo) 26532807932SDan Gohman return; 26632807932SDan Gohman 2678fe7e86bSDan Gohman assert(&MBB != &MF.front() && "Header blocks shouldn't have predecessors"); 2685c644c9bSHeejin Ahn MachineBasicBlock *LayoutPred = MBB.getPrevNode(); 2698fe7e86bSDan Gohman 2708fe7e86bSDan Gohman // If the nearest common dominator is inside a more deeply nested context, 2718fe7e86bSDan Gohman // walk out to the nearest scope which isn't more deeply nested. 
2728fe7e86bSDan Gohman for (MachineFunction::iterator I(LayoutPred), E(Header); I != E; --I) { 2738fe7e86bSDan Gohman if (MachineBasicBlock *ScopeTop = ScopeTops[I->getNumber()]) { 2748fe7e86bSDan Gohman if (ScopeTop->getNumber() > Header->getNumber()) { 2758fe7e86bSDan Gohman // Skip over an intervening scope. 2765c644c9bSHeejin Ahn I = std::next(ScopeTop->getIterator()); 2778fe7e86bSDan Gohman } else { 2788fe7e86bSDan Gohman // We found a scope level at an appropriate depth. 2798fe7e86bSDan Gohman Header = ScopeTop; 2808fe7e86bSDan Gohman break; 2818fe7e86bSDan Gohman } 2828fe7e86bSDan Gohman } 2838fe7e86bSDan Gohman } 2848fe7e86bSDan Gohman 2858fe7e86bSDan Gohman // Decide where in Header to put the BLOCK. 286e76fa9ecSHeejin Ahn 287e76fa9ecSHeejin Ahn // Instructions that should go before the BLOCK. 288e76fa9ecSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> BeforeSet; 289e76fa9ecSHeejin Ahn // Instructions that should go after the BLOCK. 290e76fa9ecSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> AfterSet; 291e76fa9ecSHeejin Ahn for (const auto &MI : *Header) { 29244a5a4b1SHeejin Ahn // If there is a previously placed LOOP marker and the bottom block of the 29344a5a4b1SHeejin Ahn // loop is above MBB, it should be after the BLOCK, because the loop is 29444a5a4b1SHeejin Ahn // nested in this BLOCK. Otherwise it should be before the BLOCK. 
29544a5a4b1SHeejin Ahn if (MI.getOpcode() == WebAssembly::LOOP) { 29644a5a4b1SHeejin Ahn auto *LoopBottom = BeginToEnd[&MI]->getParent()->getPrevNode(); 29744a5a4b1SHeejin Ahn if (MBB.getNumber() > LoopBottom->getNumber()) 298e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 299e76fa9ecSHeejin Ahn #ifndef NDEBUG 300e76fa9ecSHeejin Ahn else 301e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 302e76fa9ecSHeejin Ahn #endif 303e76fa9ecSHeejin Ahn } 304e76fa9ecSHeejin Ahn 305834debffSHeejin Ahn // If there is a previously placed BLOCK/TRY marker and its corresponding 306834debffSHeejin Ahn // END marker is before the current BLOCK's END marker, that should be 307834debffSHeejin Ahn // placed after this BLOCK. Otherwise it should be placed before this BLOCK 308834debffSHeejin Ahn // marker. 30944a5a4b1SHeejin Ahn if (MI.getOpcode() == WebAssembly::BLOCK || 310834debffSHeejin Ahn MI.getOpcode() == WebAssembly::TRY) { 311834debffSHeejin Ahn if (BeginToEnd[&MI]->getParent()->getNumber() <= MBB.getNumber()) 312e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 313834debffSHeejin Ahn #ifndef NDEBUG 314834debffSHeejin Ahn else 315834debffSHeejin Ahn BeforeSet.insert(&MI); 316834debffSHeejin Ahn #endif 317834debffSHeejin Ahn } 318e76fa9ecSHeejin Ahn 319e76fa9ecSHeejin Ahn #ifndef NDEBUG 320e76fa9ecSHeejin Ahn // All END_(BLOCK|LOOP|TRY) markers should be before the BLOCK. 321e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::END_BLOCK || 322e76fa9ecSHeejin Ahn MI.getOpcode() == WebAssembly::END_LOOP || 323e76fa9ecSHeejin Ahn MI.getOpcode() == WebAssembly::END_TRY) 324e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 325e76fa9ecSHeejin Ahn #endif 326e76fa9ecSHeejin Ahn 327e76fa9ecSHeejin Ahn // Terminators should go after the BLOCK. 328e76fa9ecSHeejin Ahn if (MI.isTerminator()) 329e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 330e76fa9ecSHeejin Ahn } 331e76fa9ecSHeejin Ahn 332e76fa9ecSHeejin Ahn // Local expression tree should go after the BLOCK. 
333e76fa9ecSHeejin Ahn for (auto I = Header->getFirstTerminator(), E = Header->begin(); I != E; 334e76fa9ecSHeejin Ahn --I) { 335409b4391SYury Delendik if (std::prev(I)->isDebugInstr() || std::prev(I)->isPosition()) 336409b4391SYury Delendik continue; 337e76fa9ecSHeejin Ahn if (WebAssembly::isChild(*std::prev(I), MFI)) 338e76fa9ecSHeejin Ahn AfterSet.insert(&*std::prev(I)); 339e76fa9ecSHeejin Ahn else 340e76fa9ecSHeejin Ahn break; 34132807932SDan Gohman } 34232807932SDan Gohman 3438fe7e86bSDan Gohman // Add the BLOCK. 3442cb27072SThomas Lively WebAssembly::BlockType ReturnType = WebAssembly::BlockType::Void; 34518c56a07SHeejin Ahn auto InsertPos = getLatestInsertPos(Header, BeforeSet, AfterSet); 34692401cc1SHeejin Ahn MachineInstr *Begin = 34792401cc1SHeejin Ahn BuildMI(*Header, InsertPos, Header->findDebugLoc(InsertPos), 3482726b88cSDan Gohman TII.get(WebAssembly::BLOCK)) 349d6f48786SHeejin Ahn .addImm(int64_t(ReturnType)); 3501d68e80fSDan Gohman 351e76fa9ecSHeejin Ahn // Decide where in Header to put the END_BLOCK. 352e76fa9ecSHeejin Ahn BeforeSet.clear(); 353e76fa9ecSHeejin Ahn AfterSet.clear(); 354e76fa9ecSHeejin Ahn for (auto &MI : MBB) { 355e76fa9ecSHeejin Ahn #ifndef NDEBUG 356e76fa9ecSHeejin Ahn // END_BLOCK should precede existing LOOP and TRY markers. 357e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::LOOP || 358e76fa9ecSHeejin Ahn MI.getOpcode() == WebAssembly::TRY) 359e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 360e76fa9ecSHeejin Ahn #endif 361e76fa9ecSHeejin Ahn 362e76fa9ecSHeejin Ahn // If there is a previously placed END_LOOP marker and the header of the 363e76fa9ecSHeejin Ahn // loop is above this block's header, the END_LOOP should be placed after 364e76fa9ecSHeejin Ahn // the BLOCK, because the loop contains this block. Otherwise the END_LOOP 365e76fa9ecSHeejin Ahn // should be placed before the BLOCK. The same for END_TRY. 
366e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::END_LOOP || 367e76fa9ecSHeejin Ahn MI.getOpcode() == WebAssembly::END_TRY) { 368e76fa9ecSHeejin Ahn if (EndToBegin[&MI]->getParent()->getNumber() >= Header->getNumber()) 369e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 370e76fa9ecSHeejin Ahn #ifndef NDEBUG 371e76fa9ecSHeejin Ahn else 372e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 373e76fa9ecSHeejin Ahn #endif 374e76fa9ecSHeejin Ahn } 375e76fa9ecSHeejin Ahn } 376e76fa9ecSHeejin Ahn 3771d68e80fSDan Gohman // Mark the end of the block. 37818c56a07SHeejin Ahn InsertPos = getEarliestInsertPos(&MBB, BeforeSet, AfterSet); 37910b31358SDerek Schuff MachineInstr *End = BuildMI(MBB, InsertPos, MBB.findPrevDebugLoc(InsertPos), 3802726b88cSDan Gohman TII.get(WebAssembly::END_BLOCK)); 381e76fa9ecSHeejin Ahn registerScope(Begin, End); 3828fe7e86bSDan Gohman 3838fe7e86bSDan Gohman // Track the farthest-spanning scope that ends at this point. 3841cc52357SHeejin Ahn updateScopeTops(Header, &MBB); 385950a13cfSDan Gohman } 386950a13cfSDan Gohman 3878fe7e86bSDan Gohman /// Insert a LOOP marker for a loop starting at MBB (if it's a loop header). 388e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::placeLoopMarker(MachineBasicBlock &MBB) { 389e76fa9ecSHeejin Ahn MachineFunction &MF = *MBB.getParent(); 390e76fa9ecSHeejin Ahn const auto &MLI = getAnalysis<MachineLoopInfo>(); 391276f9e8cSHeejin Ahn const auto &WEI = getAnalysis<WebAssemblyExceptionInfo>(); 392276f9e8cSHeejin Ahn SortRegionInfo SRI(MLI, WEI); 393e76fa9ecSHeejin Ahn const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo(); 394e76fa9ecSHeejin Ahn 3958fe7e86bSDan Gohman MachineLoop *Loop = MLI.getLoopFor(&MBB); 3968fe7e86bSDan Gohman if (!Loop || Loop->getHeader() != &MBB) 3978fe7e86bSDan Gohman return; 3988fe7e86bSDan Gohman 3998fe7e86bSDan Gohman // The operand of a LOOP is the first block after the loop. If the loop is the 4008fe7e86bSDan Gohman // bottom of the function, insert a dummy block at the end. 
401276f9e8cSHeejin Ahn MachineBasicBlock *Bottom = SRI.getBottom(Loop); 4025c644c9bSHeejin Ahn auto Iter = std::next(Bottom->getIterator()); 403e3e4a5ffSDan Gohman if (Iter == MF.end()) { 404c4ac74fbSHeejin Ahn getAppendixBlock(MF); 4055c644c9bSHeejin Ahn Iter = std::next(Bottom->getIterator()); 406e3e4a5ffSDan Gohman } 4078fe7e86bSDan Gohman MachineBasicBlock *AfterLoop = &*Iter; 408f6857223SDan Gohman 409e76fa9ecSHeejin Ahn // Decide where in Header to put the LOOP. 410e76fa9ecSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> BeforeSet; 411e76fa9ecSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> AfterSet; 412e76fa9ecSHeejin Ahn for (const auto &MI : MBB) { 413e76fa9ecSHeejin Ahn // LOOP marker should be after any existing loop that ends here. Otherwise 414e76fa9ecSHeejin Ahn // we assume the instruction belongs to the loop. 415e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::END_LOOP) 416e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 417e76fa9ecSHeejin Ahn #ifndef NDEBUG 418e76fa9ecSHeejin Ahn else 419e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 420e76fa9ecSHeejin Ahn #endif 421e76fa9ecSHeejin Ahn } 422e76fa9ecSHeejin Ahn 423e76fa9ecSHeejin Ahn // Mark the beginning of the loop. 42418c56a07SHeejin Ahn auto InsertPos = getEarliestInsertPos(&MBB, BeforeSet, AfterSet); 42510b31358SDerek Schuff MachineInstr *Begin = BuildMI(MBB, InsertPos, MBB.findDebugLoc(InsertPos), 4262726b88cSDan Gohman TII.get(WebAssembly::LOOP)) 4272cb27072SThomas Lively .addImm(int64_t(WebAssembly::BlockType::Void)); 4281d68e80fSDan Gohman 429e76fa9ecSHeejin Ahn // Decide where in Header to put the END_LOOP. 
430e76fa9ecSHeejin Ahn BeforeSet.clear(); 431e76fa9ecSHeejin Ahn AfterSet.clear(); 432e76fa9ecSHeejin Ahn #ifndef NDEBUG 433e76fa9ecSHeejin Ahn for (const auto &MI : MBB) 434e76fa9ecSHeejin Ahn // Existing END_LOOP markers belong to parent loops of this loop 435e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::END_LOOP) 436e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 437e76fa9ecSHeejin Ahn #endif 438e76fa9ecSHeejin Ahn 439e76fa9ecSHeejin Ahn // Mark the end of the loop (using arbitrary debug location that branched to 440e76fa9ecSHeejin Ahn // the loop end as its location). 44118c56a07SHeejin Ahn InsertPos = getEarliestInsertPos(AfterLoop, BeforeSet, AfterSet); 44267f74aceSHeejin Ahn DebugLoc EndDL = AfterLoop->pred_empty() 44367f74aceSHeejin Ahn ? DebugLoc() 44467f74aceSHeejin Ahn : (*AfterLoop->pred_rbegin())->findBranchDebugLoc(); 445e76fa9ecSHeejin Ahn MachineInstr *End = 446e76fa9ecSHeejin Ahn BuildMI(*AfterLoop, InsertPos, EndDL, TII.get(WebAssembly::END_LOOP)); 447e76fa9ecSHeejin Ahn registerScope(Begin, End); 4488fe7e86bSDan Gohman 4498fe7e86bSDan Gohman assert((!ScopeTops[AfterLoop->getNumber()] || 4508fe7e86bSDan Gohman ScopeTops[AfterLoop->getNumber()]->getNumber() < MBB.getNumber()) && 451442bfcecSDan Gohman "With block sorting the outermost loop for a block should be first."); 4521cc52357SHeejin Ahn updateScopeTops(&MBB, AfterLoop); 453e3e4a5ffSDan Gohman } 454950a13cfSDan Gohman 455e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::placeTryMarker(MachineBasicBlock &MBB) { 45644a5a4b1SHeejin Ahn assert(MBB.isEHPad()); 457e76fa9ecSHeejin Ahn MachineFunction &MF = *MBB.getParent(); 458e76fa9ecSHeejin Ahn auto &MDT = getAnalysis<MachineDominatorTree>(); 459e76fa9ecSHeejin Ahn const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo(); 460276f9e8cSHeejin Ahn const auto &MLI = getAnalysis<MachineLoopInfo>(); 461e76fa9ecSHeejin Ahn const auto &WEI = getAnalysis<WebAssemblyExceptionInfo>(); 462276f9e8cSHeejin Ahn SortRegionInfo SRI(MLI, WEI); 
463e76fa9ecSHeejin Ahn const auto &MFI = *MF.getInfo<WebAssemblyFunctionInfo>(); 464e76fa9ecSHeejin Ahn 465e76fa9ecSHeejin Ahn // Compute the nearest common dominator of all unwind predecessors 466e76fa9ecSHeejin Ahn MachineBasicBlock *Header = nullptr; 467e76fa9ecSHeejin Ahn int MBBNumber = MBB.getNumber(); 468e76fa9ecSHeejin Ahn for (auto *Pred : MBB.predecessors()) { 469e76fa9ecSHeejin Ahn if (Pred->getNumber() < MBBNumber) { 470e76fa9ecSHeejin Ahn Header = Header ? MDT.findNearestCommonDominator(Header, Pred) : Pred; 47118c56a07SHeejin Ahn assert(!explicitlyBranchesTo(Pred, &MBB) && 472e76fa9ecSHeejin Ahn "Explicit branch to an EH pad!"); 473e76fa9ecSHeejin Ahn } 474e76fa9ecSHeejin Ahn } 475e76fa9ecSHeejin Ahn if (!Header) 476e76fa9ecSHeejin Ahn return; 477e76fa9ecSHeejin Ahn 478e76fa9ecSHeejin Ahn // If this try is at the bottom of the function, insert a dummy block at the 479e76fa9ecSHeejin Ahn // end. 480e76fa9ecSHeejin Ahn WebAssemblyException *WE = WEI.getExceptionFor(&MBB); 481e76fa9ecSHeejin Ahn assert(WE); 482276f9e8cSHeejin Ahn MachineBasicBlock *Bottom = SRI.getBottom(WE); 483e76fa9ecSHeejin Ahn 4845c644c9bSHeejin Ahn auto Iter = std::next(Bottom->getIterator()); 485e76fa9ecSHeejin Ahn if (Iter == MF.end()) { 486c4ac74fbSHeejin Ahn getAppendixBlock(MF); 4875c644c9bSHeejin Ahn Iter = std::next(Bottom->getIterator()); 488e76fa9ecSHeejin Ahn } 48920cf0749SHeejin Ahn MachineBasicBlock *Cont = &*Iter; 490e76fa9ecSHeejin Ahn 49120cf0749SHeejin Ahn assert(Cont != &MF.front()); 4925c644c9bSHeejin Ahn MachineBasicBlock *LayoutPred = Cont->getPrevNode(); 493e76fa9ecSHeejin Ahn 494e76fa9ecSHeejin Ahn // If the nearest common dominator is inside a more deeply nested context, 495e76fa9ecSHeejin Ahn // walk out to the nearest scope which isn't more deeply nested. 
496e76fa9ecSHeejin Ahn for (MachineFunction::iterator I(LayoutPred), E(Header); I != E; --I) { 497e76fa9ecSHeejin Ahn if (MachineBasicBlock *ScopeTop = ScopeTops[I->getNumber()]) { 498e76fa9ecSHeejin Ahn if (ScopeTop->getNumber() > Header->getNumber()) { 499e76fa9ecSHeejin Ahn // Skip over an intervening scope. 5005c644c9bSHeejin Ahn I = std::next(ScopeTop->getIterator()); 501e76fa9ecSHeejin Ahn } else { 502e76fa9ecSHeejin Ahn // We found a scope level at an appropriate depth. 503e76fa9ecSHeejin Ahn Header = ScopeTop; 504e76fa9ecSHeejin Ahn break; 505e76fa9ecSHeejin Ahn } 506e76fa9ecSHeejin Ahn } 507e76fa9ecSHeejin Ahn } 508e76fa9ecSHeejin Ahn 509e76fa9ecSHeejin Ahn // Decide where in Header to put the TRY. 510e76fa9ecSHeejin Ahn 51144a5a4b1SHeejin Ahn // Instructions that should go before the TRY. 512e76fa9ecSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> BeforeSet; 51344a5a4b1SHeejin Ahn // Instructions that should go after the TRY. 514e76fa9ecSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> AfterSet; 515e76fa9ecSHeejin Ahn for (const auto &MI : *Header) { 51644a5a4b1SHeejin Ahn // If there is a previously placed LOOP marker and the bottom block of the 51744a5a4b1SHeejin Ahn // loop is above MBB, it should be after the TRY, because the loop is nested 51844a5a4b1SHeejin Ahn // in this TRY. Otherwise it should be before the TRY. 519e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::LOOP) { 52044a5a4b1SHeejin Ahn auto *LoopBottom = BeginToEnd[&MI]->getParent()->getPrevNode(); 52144a5a4b1SHeejin Ahn if (MBB.getNumber() > LoopBottom->getNumber()) 522e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 523e76fa9ecSHeejin Ahn #ifndef NDEBUG 524e76fa9ecSHeejin Ahn else 525e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 526e76fa9ecSHeejin Ahn #endif 527e76fa9ecSHeejin Ahn } 528e76fa9ecSHeejin Ahn 52944a5a4b1SHeejin Ahn // All previously inserted BLOCK/TRY markers should be after the TRY because 53044a5a4b1SHeejin Ahn // they are all nested trys. 
53144a5a4b1SHeejin Ahn if (MI.getOpcode() == WebAssembly::BLOCK || 53244a5a4b1SHeejin Ahn MI.getOpcode() == WebAssembly::TRY) 533e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 534e76fa9ecSHeejin Ahn 535e76fa9ecSHeejin Ahn #ifndef NDEBUG 53644a5a4b1SHeejin Ahn // All END_(BLOCK/LOOP/TRY) markers should be before the TRY. 53744a5a4b1SHeejin Ahn if (MI.getOpcode() == WebAssembly::END_BLOCK || 53844a5a4b1SHeejin Ahn MI.getOpcode() == WebAssembly::END_LOOP || 539e76fa9ecSHeejin Ahn MI.getOpcode() == WebAssembly::END_TRY) 540e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 541e76fa9ecSHeejin Ahn #endif 542e76fa9ecSHeejin Ahn 543e76fa9ecSHeejin Ahn // Terminators should go after the TRY. 544e76fa9ecSHeejin Ahn if (MI.isTerminator()) 545e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 546e76fa9ecSHeejin Ahn } 547e76fa9ecSHeejin Ahn 5486a37c5d6SHeejin Ahn // If Header unwinds to MBB (= Header contains 'invoke'), the try block should 5496a37c5d6SHeejin Ahn // contain the call within it. So the call should go after the TRY. The 5506a37c5d6SHeejin Ahn // exception is when the header's terminator is a rethrow instruction, in 5516a37c5d6SHeejin Ahn // which case that instruction, not a call instruction before it, is gonna 5526a37c5d6SHeejin Ahn // throw. 5536a37c5d6SHeejin Ahn MachineInstr *ThrowingCall = nullptr; 5546a37c5d6SHeejin Ahn if (MBB.isPredecessor(Header)) { 5556a37c5d6SHeejin Ahn auto TermPos = Header->getFirstTerminator(); 5566a37c5d6SHeejin Ahn if (TermPos == Header->end() || 5576a37c5d6SHeejin Ahn TermPos->getOpcode() != WebAssembly::RETHROW) { 5586a37c5d6SHeejin Ahn for (auto &MI : reverse(*Header)) { 5596a37c5d6SHeejin Ahn if (MI.isCall()) { 5606a37c5d6SHeejin Ahn AfterSet.insert(&MI); 5616a37c5d6SHeejin Ahn ThrowingCall = &MI; 5626a37c5d6SHeejin Ahn // Possibly throwing calls are usually wrapped by EH_LABEL 5636a37c5d6SHeejin Ahn // instructions. We don't want to split them and the call. 
5646a37c5d6SHeejin Ahn if (MI.getIterator() != Header->begin() && 5656a37c5d6SHeejin Ahn std::prev(MI.getIterator())->isEHLabel()) { 5666a37c5d6SHeejin Ahn AfterSet.insert(&*std::prev(MI.getIterator())); 5676a37c5d6SHeejin Ahn ThrowingCall = &*std::prev(MI.getIterator()); 5686a37c5d6SHeejin Ahn } 5696a37c5d6SHeejin Ahn break; 5706a37c5d6SHeejin Ahn } 5716a37c5d6SHeejin Ahn } 5726a37c5d6SHeejin Ahn } 5736a37c5d6SHeejin Ahn } 5746a37c5d6SHeejin Ahn 575e76fa9ecSHeejin Ahn // Local expression tree should go after the TRY. 5766a37c5d6SHeejin Ahn // For BLOCK placement, we start the search from the previous instruction of a 5776a37c5d6SHeejin Ahn // BB's terminator, but in TRY's case, we should start from the previous 5786a37c5d6SHeejin Ahn // instruction of a call that can throw, or a EH_LABEL that precedes the call, 5796a37c5d6SHeejin Ahn // because the return values of the call's previous instructions can be 5806a37c5d6SHeejin Ahn // stackified and consumed by the throwing call. 5816a37c5d6SHeejin Ahn auto SearchStartPt = ThrowingCall ? MachineBasicBlock::iterator(ThrowingCall) 5826a37c5d6SHeejin Ahn : Header->getFirstTerminator(); 5836a37c5d6SHeejin Ahn for (auto I = SearchStartPt, E = Header->begin(); I != E; --I) { 584409b4391SYury Delendik if (std::prev(I)->isDebugInstr() || std::prev(I)->isPosition()) 585409b4391SYury Delendik continue; 586e76fa9ecSHeejin Ahn if (WebAssembly::isChild(*std::prev(I), MFI)) 587e76fa9ecSHeejin Ahn AfterSet.insert(&*std::prev(I)); 588e76fa9ecSHeejin Ahn else 589e76fa9ecSHeejin Ahn break; 590e76fa9ecSHeejin Ahn } 591e76fa9ecSHeejin Ahn 592e76fa9ecSHeejin Ahn // Add the TRY. 
59318c56a07SHeejin Ahn auto InsertPos = getLatestInsertPos(Header, BeforeSet, AfterSet); 594e76fa9ecSHeejin Ahn MachineInstr *Begin = 595e76fa9ecSHeejin Ahn BuildMI(*Header, InsertPos, Header->findDebugLoc(InsertPos), 596e76fa9ecSHeejin Ahn TII.get(WebAssembly::TRY)) 5972cb27072SThomas Lively .addImm(int64_t(WebAssembly::BlockType::Void)); 598e76fa9ecSHeejin Ahn 599e76fa9ecSHeejin Ahn // Decide where in Header to put the END_TRY. 600e76fa9ecSHeejin Ahn BeforeSet.clear(); 601e76fa9ecSHeejin Ahn AfterSet.clear(); 60220cf0749SHeejin Ahn for (const auto &MI : *Cont) { 603e76fa9ecSHeejin Ahn #ifndef NDEBUG 60444a5a4b1SHeejin Ahn // END_TRY should precede existing LOOP and BLOCK markers. 60544a5a4b1SHeejin Ahn if (MI.getOpcode() == WebAssembly::LOOP || 60644a5a4b1SHeejin Ahn MI.getOpcode() == WebAssembly::BLOCK) 607e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 608e76fa9ecSHeejin Ahn 609e76fa9ecSHeejin Ahn // All END_TRY markers placed earlier belong to exceptions that contains 610e76fa9ecSHeejin Ahn // this one. 611e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::END_TRY) 612e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 613e76fa9ecSHeejin Ahn #endif 614e76fa9ecSHeejin Ahn 615e76fa9ecSHeejin Ahn // If there is a previously placed END_LOOP marker and its header is after 616e76fa9ecSHeejin Ahn // where TRY marker is, this loop is contained within the 'catch' part, so 617e76fa9ecSHeejin Ahn // the END_TRY marker should go after that. Otherwise, the whole try-catch 618e76fa9ecSHeejin Ahn // is contained within this loop, so the END_TRY should go before that. 619e76fa9ecSHeejin Ahn if (MI.getOpcode() == WebAssembly::END_LOOP) { 620222718fdSHeejin Ahn // For a LOOP to be after TRY, LOOP's BB should be after TRY's BB; if they 621222718fdSHeejin Ahn // are in the same BB, LOOP is always before TRY. 
622222718fdSHeejin Ahn if (EndToBegin[&MI]->getParent()->getNumber() > Header->getNumber()) 623e76fa9ecSHeejin Ahn BeforeSet.insert(&MI); 624e76fa9ecSHeejin Ahn #ifndef NDEBUG 625e76fa9ecSHeejin Ahn else 626e76fa9ecSHeejin Ahn AfterSet.insert(&MI); 627e76fa9ecSHeejin Ahn #endif 628e76fa9ecSHeejin Ahn } 62944a5a4b1SHeejin Ahn 63044a5a4b1SHeejin Ahn // It is not possible for an END_BLOCK to be already in this block. 631e76fa9ecSHeejin Ahn } 632e76fa9ecSHeejin Ahn 633e76fa9ecSHeejin Ahn // Mark the end of the TRY. 63420cf0749SHeejin Ahn InsertPos = getEarliestInsertPos(Cont, BeforeSet, AfterSet); 635e76fa9ecSHeejin Ahn MachineInstr *End = 63620cf0749SHeejin Ahn BuildMI(*Cont, InsertPos, Bottom->findBranchDebugLoc(), 637e76fa9ecSHeejin Ahn TII.get(WebAssembly::END_TRY)); 638e76fa9ecSHeejin Ahn registerTryScope(Begin, End, &MBB); 639e76fa9ecSHeejin Ahn 64082da1ffcSHeejin Ahn // Track the farthest-spanning scope that ends at this point. We create two 64182da1ffcSHeejin Ahn // mappings: (BB with 'end_try' -> BB with 'try') and (BB with 'catch' -> BB 64282da1ffcSHeejin Ahn // with 'try'). We need to create 'catch' -> 'try' mapping here too because 64382da1ffcSHeejin Ahn // markers should not span across 'catch'. 
// For example, this should not
  // happen:
  //
  //   try
  //     block     --|  (X)
  //   catch         |
  //     end_block --|
  //   end_try
  for (auto *End : {&MBB, Cont})
    updateScopeTops(Header, End);
}

/// Remove instructions made redundant by the TRY / END_TRY markers:
///  1. an unconditional branch at the end of an EH pad's layout predecessor
///     that targets the try's continuation BB, and
///  2. BLOCK / END_BLOCK pairs that immediately wrap a TRY / END_TRY pair and
///     carry the same return type.
void WebAssemblyCFGStackify::removeUnnecessaryInstrs(MachineFunction &MF) {
  const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo();

  // When there is an unconditional branch right before a catch instruction and
  // it branches to the end of end_try marker, we don't need the branch, because
  // if there is no exception, the control flow transfers to that point anyway.
  // bb0:
  //   try
  //     ...
  //     br bb2      <- Not necessary
  // bb1 (ehpad):
  //   catch
  //     ...
  // bb2:            <- Continuation BB
  //   end
  //
  // A more involved case: When the BB where 'end' is located is another EH
  // pad, the Cont (= continuation) BB is that EH pad's 'end' BB. For example,
  // bb0:
  //   try
  //     try
  //       ...
  //       br bb3      <- Not necessary
  // bb1 (ehpad):
  //     catch
  // bb2 (ehpad):
  //     end
  //   catch
  //     ...
  // bb3:            <- Continuation BB
  //   end
  //
  // When the EH pad at hand is bb1, its matching end_try is in bb2. But it is
  // another EH pad, so bb0's continuation BB becomes bb3. So 'br bb3' in the
  // code can be deleted. This is why we run 'while' until 'Cont' is not an EH
  // pad.
  for (auto &MBB : MF) {
    if (!MBB.isEHPad())
      continue;

    MachineBasicBlock *TBB = nullptr, *FBB = nullptr;
    SmallVector<MachineOperand, 4> Cond;
    // The block laid out right before the EH pad; this is the block whose
    // trailing branch may be removed.
    MachineBasicBlock *EHPadLayoutPred = MBB.getPrevNode();

    // Follow the EH pad -> TRY -> end marker chain until the block holding the
    // end marker is no longer an EH pad itself.
    MachineBasicBlock *Cont = &MBB;
    while (Cont->isEHPad()) {
      MachineInstr *Try = EHPadToTry[Cont];
      MachineInstr *EndTry = BeginToEnd[Try];
      // We started from an EH pad, so the end marker cannot be a delegate
      assert(EndTry->getOpcode() != WebAssembly::DELEGATE);
      Cont = EndTry->getParent();
    }

    // analyzeBranch() returns false on success, hence the negation.
    bool Analyzable = !TII.analyzeBranch(*EHPadLayoutPred, TBB, FBB, Cond);
    // This condition means either
    // 1. This BB ends with a single unconditional branch whose destination is
    //    Cont.
    // 2. This BB ends with a conditional branch followed by an unconditional
    //    branch, and the unconditional branch's destination is Cont.
    // In both cases, we want to remove the last (= unconditional) branch.
    if (Analyzable && ((Cond.empty() && TBB && TBB == Cont) ||
                       (!Cond.empty() && FBB && FBB == Cont))) {
      bool ErasedUncondBr = false;
      // Only read by the assert below; silence the unused-variable warning in
      // builds where asserts are compiled out.
      (void)ErasedUncondBr;
      // Walk backwards from the end of the block and erase the first
      // terminator encountered, i.e. the last terminator in the block.
      for (auto I = EHPadLayoutPred->end(), E = EHPadLayoutPred->begin();
           I != E; --I) {
        auto PrevI = std::prev(I);
        if (PrevI->isTerminator()) {
          assert(PrevI->getOpcode() == WebAssembly::BR);
          PrevI->eraseFromParent();
          ErasedUncondBr = true;
          break;
        }
      }
      assert(ErasedUncondBr && "Unconditional branch not erased!");
    }
  }

  // When there are block / end_block markers that overlap with try / end_try
  // markers, and the block and try markers' return types are the same, the
  // block /end_block markers are not necessary, because try / end_try markers
  // also can serve as boundaries for branches.
  // block         <- Not necessary
  //   try
  //     ...
  //   catch
  //     ...
  //   end
  // end           <- Not necessary
  //
  // Candidates are only collected here and erased in a separate loop below, so
  // that no instruction is removed while the blocks are being iterated.
  SmallVector<MachineInstr *, 32> ToDelete;
  for (auto &MBB : MF) {
    for (auto &MI : MBB) {
      if (MI.getOpcode() != WebAssembly::TRY)
        continue;
      MachineInstr *Try = &MI, *EndTry = BeginToEnd[Try];
      // Scopes closed by a 'delegate' are left untouched.
      if (EndTry->getOpcode() == WebAssembly::DELEGATE)
        continue;

      MachineBasicBlock *TryBB = Try->getParent();
      MachineBasicBlock *Cont = EndTry->getParent();
      int64_t RetType = Try->getOperand(0).getImm();
      // Walk outwards in lockstep: B moves backwards from the TRY and E moves
      // forwards from just past the END_TRY, for as long as the instruction
      // before B is a BLOCK with the same return type and E is an END_BLOCK.
      for (auto B = Try->getIterator(), E = std::next(EndTry->getIterator());
           B != TryBB->begin() && E != Cont->end() &&
           std::prev(B)->getOpcode() == WebAssembly::BLOCK &&
           E->getOpcode() == WebAssembly::END_BLOCK &&
           std::prev(B)->getOperand(0).getImm() == RetType;
           --B, ++E) {
        ToDelete.push_back(&*std::prev(B));
        ToDelete.push_back(&*E);
      }
    }
  }
  for (auto *MI : ToDelete) {
    // Only the BLOCK half of each pair is passed to unregisterScope().
    if (MI->getOpcode() == WebAssembly::BLOCK)
      unregisterScope(MI);
    MI->eraseFromParent();
  }
}

// Get the appropriate copy opcode for the given register class.
77583c26eaeSHeejin Ahn static unsigned getCopyOpcode(const TargetRegisterClass *RC) { 77683c26eaeSHeejin Ahn if (RC == &WebAssembly::I32RegClass) 77783c26eaeSHeejin Ahn return WebAssembly::COPY_I32; 77883c26eaeSHeejin Ahn if (RC == &WebAssembly::I64RegClass) 77983c26eaeSHeejin Ahn return WebAssembly::COPY_I64; 78083c26eaeSHeejin Ahn if (RC == &WebAssembly::F32RegClass) 78183c26eaeSHeejin Ahn return WebAssembly::COPY_F32; 78283c26eaeSHeejin Ahn if (RC == &WebAssembly::F64RegClass) 78383c26eaeSHeejin Ahn return WebAssembly::COPY_F64; 78483c26eaeSHeejin Ahn if (RC == &WebAssembly::V128RegClass) 78583c26eaeSHeejin Ahn return WebAssembly::COPY_V128; 78660653e24SHeejin Ahn if (RC == &WebAssembly::FUNCREFRegClass) 78760653e24SHeejin Ahn return WebAssembly::COPY_FUNCREF; 78860653e24SHeejin Ahn if (RC == &WebAssembly::EXTERNREFRegClass) 78960653e24SHeejin Ahn return WebAssembly::COPY_EXTERNREF; 79083c26eaeSHeejin Ahn llvm_unreachable("Unexpected register class"); 79183c26eaeSHeejin Ahn } 79283c26eaeSHeejin Ahn 79361d5c76aSHeejin Ahn // When MBB is split into MBB and Split, we should unstackify defs in MBB that 79461d5c76aSHeejin Ahn // have their uses in Split. 
795*ed41945fSHeejin Ahn static void unstackifyVRegsUsedInSplitBB(MachineBasicBlock &MBB, 796*ed41945fSHeejin Ahn MachineBasicBlock &Split) { 7971cc52357SHeejin Ahn MachineFunction &MF = *MBB.getParent(); 7981cc52357SHeejin Ahn const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo(); 7991cc52357SHeejin Ahn auto &MFI = *MF.getInfo<WebAssemblyFunctionInfo>(); 8001cc52357SHeejin Ahn auto &MRI = MF.getRegInfo(); 8011cc52357SHeejin Ahn 80261d5c76aSHeejin Ahn for (auto &MI : Split) { 80361d5c76aSHeejin Ahn for (auto &MO : MI.explicit_uses()) { 80461d5c76aSHeejin Ahn if (!MO.isReg() || Register::isPhysicalRegister(MO.getReg())) 80561d5c76aSHeejin Ahn continue; 80661d5c76aSHeejin Ahn if (MachineInstr *Def = MRI.getUniqueVRegDef(MO.getReg())) 80761d5c76aSHeejin Ahn if (Def->getParent() == &MBB) 80861d5c76aSHeejin Ahn MFI.unstackifyVReg(MO.getReg()); 80961d5c76aSHeejin Ahn } 81061d5c76aSHeejin Ahn } 81183c26eaeSHeejin Ahn 81283c26eaeSHeejin Ahn // In RegStackify, when a register definition is used multiple times, 81383c26eaeSHeejin Ahn // Reg = INST ... 81483c26eaeSHeejin Ahn // INST ..., Reg, ... 81583c26eaeSHeejin Ahn // INST ..., Reg, ... 81683c26eaeSHeejin Ahn // INST ..., Reg, ... 81783c26eaeSHeejin Ahn // 81883c26eaeSHeejin Ahn // we introduce a TEE, which has the following form: 81983c26eaeSHeejin Ahn // DefReg = INST ... 82083c26eaeSHeejin Ahn // TeeReg, Reg = TEE_... DefReg 82183c26eaeSHeejin Ahn // INST ..., TeeReg, ... 82283c26eaeSHeejin Ahn // INST ..., Reg, ... 82383c26eaeSHeejin Ahn // INST ..., Reg, ... 82483c26eaeSHeejin Ahn // with DefReg and TeeReg stackified but Reg not stackified. 82583c26eaeSHeejin Ahn // 82683c26eaeSHeejin Ahn // But the invariant that TeeReg should be stackified can be violated while we 82783c26eaeSHeejin Ahn // unstackify registers in the split BB above. In this case, we convert TEEs 82883c26eaeSHeejin Ahn // into two COPYs. This COPY will be eventually eliminated in ExplicitLocals. 
82983c26eaeSHeejin Ahn // DefReg = INST ... 83083c26eaeSHeejin Ahn // TeeReg = COPY DefReg 83183c26eaeSHeejin Ahn // Reg = COPY DefReg 83283c26eaeSHeejin Ahn // INST ..., TeeReg, ... 83383c26eaeSHeejin Ahn // INST ..., Reg, ... 83483c26eaeSHeejin Ahn // INST ..., Reg, ... 83583c26eaeSHeejin Ahn for (auto I = MBB.begin(), E = MBB.end(); I != E;) { 83683c26eaeSHeejin Ahn MachineInstr &MI = *I++; 83783c26eaeSHeejin Ahn if (!WebAssembly::isTee(MI.getOpcode())) 83883c26eaeSHeejin Ahn continue; 83983c26eaeSHeejin Ahn Register TeeReg = MI.getOperand(0).getReg(); 84083c26eaeSHeejin Ahn Register Reg = MI.getOperand(1).getReg(); 84183c26eaeSHeejin Ahn Register DefReg = MI.getOperand(2).getReg(); 84283c26eaeSHeejin Ahn if (!MFI.isVRegStackified(TeeReg)) { 84383c26eaeSHeejin Ahn // Now we are not using TEE anymore, so unstackify DefReg too 84483c26eaeSHeejin Ahn MFI.unstackifyVReg(DefReg); 84583c26eaeSHeejin Ahn unsigned CopyOpc = getCopyOpcode(MRI.getRegClass(DefReg)); 84683c26eaeSHeejin Ahn BuildMI(MBB, &MI, MI.getDebugLoc(), TII.get(CopyOpc), TeeReg) 84783c26eaeSHeejin Ahn .addReg(DefReg); 84883c26eaeSHeejin Ahn BuildMI(MBB, &MI, MI.getDebugLoc(), TII.get(CopyOpc), Reg).addReg(DefReg); 84983c26eaeSHeejin Ahn MI.eraseFromParent(); 85083c26eaeSHeejin Ahn } 85183c26eaeSHeejin Ahn } 85261d5c76aSHeejin Ahn } 85361d5c76aSHeejin Ahn 854*ed41945fSHeejin Ahn // Wrap the given range of instruction with try-delegate. RangeBegin and 855*ed41945fSHeejin Ahn // RangeEnd are inclusive. 
856*ed41945fSHeejin Ahn void WebAssemblyCFGStackify::addTryDelegate(MachineInstr *RangeBegin, 857*ed41945fSHeejin Ahn MachineInstr *RangeEnd, 858*ed41945fSHeejin Ahn MachineBasicBlock *DelegateDest) { 859*ed41945fSHeejin Ahn auto *BeginBB = RangeBegin->getParent(); 860*ed41945fSHeejin Ahn auto *EndBB = RangeEnd->getParent(); 861*ed41945fSHeejin Ahn MachineFunction &MF = *BeginBB->getParent(); 862*ed41945fSHeejin Ahn const auto &MFI = *MF.getInfo<WebAssemblyFunctionInfo>(); 863*ed41945fSHeejin Ahn const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo(); 864*ed41945fSHeejin Ahn 865*ed41945fSHeejin Ahn // Local expression tree before the first call of this range should go 866*ed41945fSHeejin Ahn // after the nested TRY. 867*ed41945fSHeejin Ahn SmallPtrSet<const MachineInstr *, 4> AfterSet; 868*ed41945fSHeejin Ahn AfterSet.insert(RangeBegin); 869*ed41945fSHeejin Ahn for (auto I = MachineBasicBlock::iterator(RangeBegin), E = BeginBB->begin(); 870*ed41945fSHeejin Ahn I != E; --I) { 871*ed41945fSHeejin Ahn if (std::prev(I)->isDebugInstr() || std::prev(I)->isPosition()) 872*ed41945fSHeejin Ahn continue; 873*ed41945fSHeejin Ahn if (WebAssembly::isChild(*std::prev(I), MFI)) 874*ed41945fSHeejin Ahn AfterSet.insert(&*std::prev(I)); 875*ed41945fSHeejin Ahn else 876*ed41945fSHeejin Ahn break; 877*ed41945fSHeejin Ahn } 878*ed41945fSHeejin Ahn 879*ed41945fSHeejin Ahn // Create the nested try instruction. 880*ed41945fSHeejin Ahn auto TryPos = getLatestInsertPos( 881*ed41945fSHeejin Ahn BeginBB, SmallPtrSet<const MachineInstr *, 4>(), AfterSet); 882*ed41945fSHeejin Ahn MachineInstr *Try = BuildMI(*BeginBB, TryPos, RangeBegin->getDebugLoc(), 883*ed41945fSHeejin Ahn TII.get(WebAssembly::TRY)) 884*ed41945fSHeejin Ahn .addImm(int64_t(WebAssembly::BlockType::Void)); 885*ed41945fSHeejin Ahn 886*ed41945fSHeejin Ahn // Create a BB to insert the 'delegate' instruction. 
887*ed41945fSHeejin Ahn MachineBasicBlock *DelegateBB = MF.CreateMachineBasicBlock(); 888*ed41945fSHeejin Ahn // If the destination of 'delegate' is not the caller, adds the destination to 889*ed41945fSHeejin Ahn // the BB's successors. 890*ed41945fSHeejin Ahn if (DelegateDest != FakeCallerBB) 891*ed41945fSHeejin Ahn DelegateBB->addSuccessor(DelegateDest); 892*ed41945fSHeejin Ahn 893*ed41945fSHeejin Ahn auto SplitPos = std::next(RangeEnd->getIterator()); 894*ed41945fSHeejin Ahn if (SplitPos == EndBB->end()) { 895*ed41945fSHeejin Ahn // If the range's end instruction is at the end of the BB, insert the new 896*ed41945fSHeejin Ahn // delegate BB after the current BB. 897*ed41945fSHeejin Ahn MF.insert(std::next(EndBB->getIterator()), DelegateBB); 898*ed41945fSHeejin Ahn EndBB->addSuccessor(DelegateBB); 899*ed41945fSHeejin Ahn 900*ed41945fSHeejin Ahn } else { 901*ed41945fSHeejin Ahn // If the range's end instruction is in the middle of the BB, we split the 902*ed41945fSHeejin Ahn // BB into two and insert the delegate BB in between. 
903*ed41945fSHeejin Ahn // - Before: 904*ed41945fSHeejin Ahn // bb: 905*ed41945fSHeejin Ahn // range_end 906*ed41945fSHeejin Ahn // other_insts 907*ed41945fSHeejin Ahn // 908*ed41945fSHeejin Ahn // - After: 909*ed41945fSHeejin Ahn // pre_bb: (previous 'bb') 910*ed41945fSHeejin Ahn // range_end 911*ed41945fSHeejin Ahn // delegate_bb: (new) 912*ed41945fSHeejin Ahn // delegate 913*ed41945fSHeejin Ahn // post_bb: (new) 914*ed41945fSHeejin Ahn // other_insts 915*ed41945fSHeejin Ahn MachineBasicBlock *PreBB = EndBB; 916*ed41945fSHeejin Ahn MachineBasicBlock *PostBB = MF.CreateMachineBasicBlock(); 917*ed41945fSHeejin Ahn MF.insert(std::next(PreBB->getIterator()), PostBB); 918*ed41945fSHeejin Ahn MF.insert(std::next(PreBB->getIterator()), DelegateBB); 919*ed41945fSHeejin Ahn PostBB->splice(PostBB->end(), PreBB, SplitPos, PreBB->end()); 920*ed41945fSHeejin Ahn PostBB->transferSuccessors(PreBB); 921*ed41945fSHeejin Ahn unstackifyVRegsUsedInSplitBB(*PreBB, *PostBB); 922*ed41945fSHeejin Ahn PreBB->addSuccessor(DelegateBB); 923*ed41945fSHeejin Ahn PreBB->addSuccessor(PostBB); 924*ed41945fSHeejin Ahn } 925*ed41945fSHeejin Ahn 926*ed41945fSHeejin Ahn // Add 'delegate' instruction in the delegate BB created above. 927*ed41945fSHeejin Ahn MachineInstr *Delegate = BuildMI(DelegateBB, RangeEnd->getDebugLoc(), 928*ed41945fSHeejin Ahn TII.get(WebAssembly::DELEGATE)) 929*ed41945fSHeejin Ahn .addMBB(DelegateDest); 930*ed41945fSHeejin Ahn registerTryScope(Try, Delegate, nullptr); 931*ed41945fSHeejin Ahn } 932*ed41945fSHeejin Ahn 933*ed41945fSHeejin Ahn bool WebAssemblyCFGStackify::fixCallUnwindMismatches(MachineFunction &MF) { 934*ed41945fSHeejin Ahn // Linearizing the control flow by placing TRY / END_TRY markers can create 935*ed41945fSHeejin Ahn // mismatches in unwind destinations for throwing instructions, such as calls. 936*ed41945fSHeejin Ahn // 937*ed41945fSHeejin Ahn // We use the 'delegate' instruction to fix the unwind mismatches. 
'delegate' 938*ed41945fSHeejin Ahn // instruction delegates an exception to an outer 'catch'. It can target not 939*ed41945fSHeejin Ahn // only 'catch' but all block-like structures including another 'delegate', 940*ed41945fSHeejin Ahn // but with slightly different semantics than branches. When it targets a 941*ed41945fSHeejin Ahn // 'catch', it will delegate the exception to that catch. It is being 942*ed41945fSHeejin Ahn // discussed how to define the semantics when 'delegate''s target is a non-try 943*ed41945fSHeejin Ahn // block: it will either be a validation failure or it will target the next 944*ed41945fSHeejin Ahn // outer try-catch. But anyway our LLVM backend currently does not generate 945*ed41945fSHeejin Ahn // such code. The example below illustrates where the 'delegate' instruction 946*ed41945fSHeejin Ahn // in the middle will delegate the exception to, depending on the value of N. 947*ed41945fSHeejin Ahn // try 948*ed41945fSHeejin Ahn // try 949*ed41945fSHeejin Ahn // block 950*ed41945fSHeejin Ahn // try 951*ed41945fSHeejin Ahn // try 952*ed41945fSHeejin Ahn // call @foo 953*ed41945fSHeejin Ahn // delegate N ;; Where will this delegate to? 954*ed41945fSHeejin Ahn // catch ;; N == 0 955*ed41945fSHeejin Ahn // end 956*ed41945fSHeejin Ahn // end ;; N == 1 (invalid; will not be generated) 957*ed41945fSHeejin Ahn // delegate ;; N == 2 958*ed41945fSHeejin Ahn // catch ;; N == 3 959*ed41945fSHeejin Ahn // end 960*ed41945fSHeejin Ahn // ;; N == 4 (to caller) 961*ed41945fSHeejin Ahn 962*ed41945fSHeejin Ahn // 1. When an instruction may throw, but the EH pad it will unwind to can be 963*ed41945fSHeejin Ahn // different from the original CFG. 
964*ed41945fSHeejin Ahn // 965*ed41945fSHeejin Ahn // Example: we have the following CFG: 966*ed41945fSHeejin Ahn // bb0: 967*ed41945fSHeejin Ahn // call @foo ; if it throws, unwind to bb2 968*ed41945fSHeejin Ahn // bb1: 969*ed41945fSHeejin Ahn // call @bar ; if it throws, unwind to bb3 970*ed41945fSHeejin Ahn // bb2 (ehpad): 971*ed41945fSHeejin Ahn // catch 972*ed41945fSHeejin Ahn // ... 973*ed41945fSHeejin Ahn // bb3 (ehpad) 974*ed41945fSHeejin Ahn // catch 975*ed41945fSHeejin Ahn // ... 976*ed41945fSHeejin Ahn // 977*ed41945fSHeejin Ahn // And the CFG is sorted in this order. Then after placing TRY markers, it 978*ed41945fSHeejin Ahn // will look like: (BB markers are omitted) 979*ed41945fSHeejin Ahn // try 980*ed41945fSHeejin Ahn // try 981*ed41945fSHeejin Ahn // call @foo 982*ed41945fSHeejin Ahn // call @bar ;; if it throws, unwind to bb3 983*ed41945fSHeejin Ahn // catch ;; ehpad (bb2) 984*ed41945fSHeejin Ahn // ... 985*ed41945fSHeejin Ahn // end_try 986*ed41945fSHeejin Ahn // catch ;; ehpad (bb3) 987*ed41945fSHeejin Ahn // ... 988*ed41945fSHeejin Ahn // end_try 989*ed41945fSHeejin Ahn // 990*ed41945fSHeejin Ahn // Now if bar() throws, it is going to end up ip in bb2, not bb3, where it 991*ed41945fSHeejin Ahn // is supposed to end up. We solve this problem by wrapping the mismatching 992*ed41945fSHeejin Ahn // call with an inner try-delegate that rethrows the exception to the right 993*ed41945fSHeejin Ahn // 'catch'. 994*ed41945fSHeejin Ahn // 995*ed41945fSHeejin Ahn // 996*ed41945fSHeejin Ahn // try 997*ed41945fSHeejin Ahn // try 998*ed41945fSHeejin Ahn // call @foo 999*ed41945fSHeejin Ahn // try ;; (new) 1000*ed41945fSHeejin Ahn // call @bar 1001*ed41945fSHeejin Ahn // delegate 1 (bb3) ;; (new) 1002*ed41945fSHeejin Ahn // catch ;; ehpad (bb2) 1003*ed41945fSHeejin Ahn // ... 1004*ed41945fSHeejin Ahn // end_try 1005*ed41945fSHeejin Ahn // catch ;; ehpad (bb3) 1006*ed41945fSHeejin Ahn // ... 
1007*ed41945fSHeejin Ahn // end_try 1008*ed41945fSHeejin Ahn // 1009*ed41945fSHeejin Ahn // --- 1010*ed41945fSHeejin Ahn // 2. The same as 1, but in this case an instruction unwinds to a caller 1011*ed41945fSHeejin Ahn // function and not another EH pad. 1012*ed41945fSHeejin Ahn // 1013*ed41945fSHeejin Ahn // Example: we have the following CFG: 1014*ed41945fSHeejin Ahn // bb0: 1015*ed41945fSHeejin Ahn // call @foo ; if it throws, unwind to bb2 1016*ed41945fSHeejin Ahn // bb1: 1017*ed41945fSHeejin Ahn // call @bar ; if it throws, unwind to caller 1018*ed41945fSHeejin Ahn // bb2 (ehpad): 1019*ed41945fSHeejin Ahn // catch 1020*ed41945fSHeejin Ahn // ... 1021*ed41945fSHeejin Ahn // 1022*ed41945fSHeejin Ahn // And the CFG is sorted in this order. Then after placing TRY markers, it 1023*ed41945fSHeejin Ahn // will look like: 1024*ed41945fSHeejin Ahn // try 1025*ed41945fSHeejin Ahn // call @foo 1026*ed41945fSHeejin Ahn // call @bar ;; if it throws, unwind to caller 1027*ed41945fSHeejin Ahn // catch ;; ehpad (bb2) 1028*ed41945fSHeejin Ahn // ... 1029*ed41945fSHeejin Ahn // end_try 1030*ed41945fSHeejin Ahn // 1031*ed41945fSHeejin Ahn // Now if bar() throws, it is going to end up ip in bb2, when it is supposed 1032*ed41945fSHeejin Ahn // throw up to the caller. We solve this problem in the same way, but in this 1033*ed41945fSHeejin Ahn // case 'delegate's immediate argument is the number of block depths + 1, 1034*ed41945fSHeejin Ahn // which means it rethrows to the caller. 1035*ed41945fSHeejin Ahn // try 1036*ed41945fSHeejin Ahn // call @foo 1037*ed41945fSHeejin Ahn // try ;; (new) 1038*ed41945fSHeejin Ahn // call @bar 1039*ed41945fSHeejin Ahn // delegate 1 (caller) ;; (new) 1040*ed41945fSHeejin Ahn // catch ;; ehpad (bb2) 1041*ed41945fSHeejin Ahn // ... 1042*ed41945fSHeejin Ahn // end_try 1043*ed41945fSHeejin Ahn // 1044*ed41945fSHeejin Ahn // Before rewriteDepthImmediates, delegate's argument is a BB. 
In case of the 1045*ed41945fSHeejin Ahn // caller, it will take a fake BB generated by getFakeCallerBlock(), which 1046*ed41945fSHeejin Ahn // will be converted to a correct immediate argument later. 1047*ed41945fSHeejin Ahn // 1048*ed41945fSHeejin Ahn // In case there are multiple calls in a BB that may throw to the caller, they 1049*ed41945fSHeejin Ahn // can be wrapped together in one nested try-delegate scope. (In 1, this 1050*ed41945fSHeejin Ahn // couldn't happen, because may-throwing instruction there had an unwind 1051*ed41945fSHeejin Ahn // destination, i.e., it was an invoke before, and there could be only one 1052*ed41945fSHeejin Ahn // invoke within a BB.) 1053*ed41945fSHeejin Ahn 1054*ed41945fSHeejin Ahn SmallVector<const MachineBasicBlock *, 8> EHPadStack; 1055*ed41945fSHeejin Ahn // Range of intructions to be wrapped in a new nested try/catch. A range 1056*ed41945fSHeejin Ahn // exists in a single BB and does not span multiple BBs. 1057*ed41945fSHeejin Ahn using TryRange = std::pair<MachineInstr *, MachineInstr *>; 1058*ed41945fSHeejin Ahn // In original CFG, <unwind destination BB, a vector of try ranges> 1059*ed41945fSHeejin Ahn DenseMap<MachineBasicBlock *, SmallVector<TryRange, 4>> UnwindDestToTryRanges; 1060*ed41945fSHeejin Ahn 1061*ed41945fSHeejin Ahn // Gather possibly throwing calls (i.e., previously invokes) whose current 1062*ed41945fSHeejin Ahn // unwind destination is not the same as the original CFG. 
(Case 1) 1063*ed41945fSHeejin Ahn 1064*ed41945fSHeejin Ahn for (auto &MBB : reverse(MF)) { 1065*ed41945fSHeejin Ahn bool SeenThrowableInstInBB = false; 1066*ed41945fSHeejin Ahn for (auto &MI : reverse(MBB)) { 1067*ed41945fSHeejin Ahn if (MI.getOpcode() == WebAssembly::TRY) 1068*ed41945fSHeejin Ahn EHPadStack.pop_back(); 1069*ed41945fSHeejin Ahn else if (WebAssembly::isCatch(MI.getOpcode())) 1070*ed41945fSHeejin Ahn EHPadStack.push_back(MI.getParent()); 1071*ed41945fSHeejin Ahn 1072*ed41945fSHeejin Ahn // In this loop we only gather calls that have an EH pad to unwind. So 1073*ed41945fSHeejin Ahn // there will be at most 1 such call (= invoke) in a BB, so after we've 1074*ed41945fSHeejin Ahn // seen one, we can skip the rest of BB. Also if MBB has no EH pad 1075*ed41945fSHeejin Ahn // successor or MI does not throw, this is not an invoke. 1076*ed41945fSHeejin Ahn if (SeenThrowableInstInBB || !MBB.hasEHPadSuccessor() || 1077*ed41945fSHeejin Ahn !WebAssembly::mayThrow(MI)) 1078*ed41945fSHeejin Ahn continue; 1079*ed41945fSHeejin Ahn SeenThrowableInstInBB = true; 1080*ed41945fSHeejin Ahn 1081*ed41945fSHeejin Ahn // If the EH pad on the stack top is where this instruction should unwind 1082*ed41945fSHeejin Ahn // next, we're good. 1083*ed41945fSHeejin Ahn MachineBasicBlock *UnwindDest = getFakeCallerBlock(MF); 1084*ed41945fSHeejin Ahn for (auto *Succ : MBB.successors()) { 1085*ed41945fSHeejin Ahn // Even though semantically a BB can have multiple successors in case an 1086*ed41945fSHeejin Ahn // exception is not caught by a catchpad, in our backend implementation 1087*ed41945fSHeejin Ahn // it is guaranteed that a BB can have at most one EH pad successor. For 1088*ed41945fSHeejin Ahn // details, refer to comments in findWasmUnwindDestinations function in 1089*ed41945fSHeejin Ahn // SelectionDAGBuilder.cpp. 
1090*ed41945fSHeejin Ahn if (Succ->isEHPad()) { 1091*ed41945fSHeejin Ahn UnwindDest = Succ; 1092*ed41945fSHeejin Ahn break; 1093*ed41945fSHeejin Ahn } 1094*ed41945fSHeejin Ahn } 1095*ed41945fSHeejin Ahn if (EHPadStack.back() == UnwindDest) 1096*ed41945fSHeejin Ahn continue; 1097*ed41945fSHeejin Ahn 1098*ed41945fSHeejin Ahn // Include EH_LABELs in the range before and afer the invoke 1099*ed41945fSHeejin Ahn MachineInstr *RangeBegin = &MI, *RangeEnd = &MI; 1100*ed41945fSHeejin Ahn if (RangeBegin->getIterator() != MBB.begin() && 1101*ed41945fSHeejin Ahn std::prev(RangeBegin->getIterator())->isEHLabel()) 1102*ed41945fSHeejin Ahn RangeBegin = &*std::prev(RangeBegin->getIterator()); 1103*ed41945fSHeejin Ahn if (std::next(RangeEnd->getIterator()) != MBB.end() && 1104*ed41945fSHeejin Ahn std::next(RangeEnd->getIterator())->isEHLabel()) 1105*ed41945fSHeejin Ahn RangeEnd = &*std::next(RangeEnd->getIterator()); 1106*ed41945fSHeejin Ahn 1107*ed41945fSHeejin Ahn // If not, record the range. 1108*ed41945fSHeejin Ahn UnwindDestToTryRanges[UnwindDest].push_back( 1109*ed41945fSHeejin Ahn TryRange(RangeBegin, RangeEnd)); 1110*ed41945fSHeejin Ahn LLVM_DEBUG(dbgs() << "- Call unwind mismatch: MBB = " << MBB.getName() 1111*ed41945fSHeejin Ahn << "\nCall = " << MI 1112*ed41945fSHeejin Ahn << "\nOriginal dest = " << UnwindDest->getName() 1113*ed41945fSHeejin Ahn << " Current dest = " << EHPadStack.back()->getName() 1114*ed41945fSHeejin Ahn << "\n\n"); 1115*ed41945fSHeejin Ahn } 1116*ed41945fSHeejin Ahn } 1117*ed41945fSHeejin Ahn 1118*ed41945fSHeejin Ahn assert(EHPadStack.empty()); 1119*ed41945fSHeejin Ahn 1120*ed41945fSHeejin Ahn // Gather possibly throwing calls that are supposed to unwind up to the caller 1121*ed41945fSHeejin Ahn // if they throw, but currently unwind to an incorrect destination. Unlike the 1122*ed41945fSHeejin Ahn // loop above, there can be multiple calls within a BB that unwind to the 1123*ed41945fSHeejin Ahn // caller, which we should group together in a range. 
(Case 2) 1124*ed41945fSHeejin Ahn 1125*ed41945fSHeejin Ahn MachineInstr *RangeBegin = nullptr, *RangeEnd = nullptr; // inclusive 1126*ed41945fSHeejin Ahn 1127*ed41945fSHeejin Ahn // Record the range. 1128*ed41945fSHeejin Ahn auto RecordCallerMismatchRange = [&](const MachineBasicBlock *CurrentDest) { 1129*ed41945fSHeejin Ahn UnwindDestToTryRanges[getFakeCallerBlock(MF)].push_back( 1130*ed41945fSHeejin Ahn TryRange(RangeBegin, RangeEnd)); 1131*ed41945fSHeejin Ahn LLVM_DEBUG(dbgs() << "- Call unwind mismatch: MBB = " 1132*ed41945fSHeejin Ahn << RangeBegin->getParent()->getName() 1133*ed41945fSHeejin Ahn << "\nRange begin = " << *RangeBegin 1134*ed41945fSHeejin Ahn << "Range end = " << *RangeEnd 1135*ed41945fSHeejin Ahn << "\nOriginal dest = caller Current dest = " 1136*ed41945fSHeejin Ahn << CurrentDest->getName() << "\n\n"); 1137*ed41945fSHeejin Ahn RangeBegin = RangeEnd = nullptr; // Reset range pointers 1138*ed41945fSHeejin Ahn }; 1139*ed41945fSHeejin Ahn 1140*ed41945fSHeejin Ahn for (auto &MBB : reverse(MF)) { 1141*ed41945fSHeejin Ahn bool SeenThrowableInstInBB = false; 1142*ed41945fSHeejin Ahn for (auto &MI : reverse(MBB)) { 1143*ed41945fSHeejin Ahn if (MI.getOpcode() == WebAssembly::TRY) 1144*ed41945fSHeejin Ahn EHPadStack.pop_back(); 1145*ed41945fSHeejin Ahn else if (WebAssembly::isCatch(MI.getOpcode())) 1146*ed41945fSHeejin Ahn EHPadStack.push_back(MI.getParent()); 1147*ed41945fSHeejin Ahn bool MayThrow = WebAssembly::mayThrow(MI); 1148*ed41945fSHeejin Ahn 1149*ed41945fSHeejin Ahn // If MBB has an EH pad successor and this is the last instruction that 1150*ed41945fSHeejin Ahn // may throw, this instruction unwinds to the EH pad and not to the 1151*ed41945fSHeejin Ahn // caller. 
1152*ed41945fSHeejin Ahn if (MBB.hasEHPadSuccessor() && MayThrow && !SeenThrowableInstInBB) { 1153*ed41945fSHeejin Ahn SeenThrowableInstInBB = true; 1154*ed41945fSHeejin Ahn continue; 1155*ed41945fSHeejin Ahn } 1156*ed41945fSHeejin Ahn 1157*ed41945fSHeejin Ahn // We wrap up the current range when we see a marker even if we haven't 1158*ed41945fSHeejin Ahn // finished a BB. 1159*ed41945fSHeejin Ahn if (RangeEnd && WebAssembly::isMarker(MI.getOpcode())) { 1160*ed41945fSHeejin Ahn RecordCallerMismatchRange(EHPadStack.back()); 1161*ed41945fSHeejin Ahn continue; 1162*ed41945fSHeejin Ahn } 1163*ed41945fSHeejin Ahn 1164*ed41945fSHeejin Ahn // If EHPadStack is empty, that means it correctly unwinds to the caller 1165*ed41945fSHeejin Ahn // if it throws, so we're good. If MI does not throw, we're good too. 1166*ed41945fSHeejin Ahn if (EHPadStack.empty() || !MayThrow) 1167*ed41945fSHeejin Ahn continue; 1168*ed41945fSHeejin Ahn 1169*ed41945fSHeejin Ahn // We found an instruction that unwinds to the caller but currently has an 1170*ed41945fSHeejin Ahn // incorrect unwind destination. Create a new range or increment the 1171*ed41945fSHeejin Ahn // currently existing range. 1172*ed41945fSHeejin Ahn if (!RangeEnd) 1173*ed41945fSHeejin Ahn RangeBegin = RangeEnd = &MI; 1174*ed41945fSHeejin Ahn else 1175*ed41945fSHeejin Ahn RangeBegin = &MI; 1176*ed41945fSHeejin Ahn } 1177*ed41945fSHeejin Ahn 1178*ed41945fSHeejin Ahn if (RangeEnd) 1179*ed41945fSHeejin Ahn RecordCallerMismatchRange(EHPadStack.back()); 1180*ed41945fSHeejin Ahn } 1181*ed41945fSHeejin Ahn 1182*ed41945fSHeejin Ahn assert(EHPadStack.empty()); 1183*ed41945fSHeejin Ahn 1184*ed41945fSHeejin Ahn // We don't have any unwind destination mismatches to resolve. 1185*ed41945fSHeejin Ahn if (UnwindDestToTryRanges.empty()) 1186*ed41945fSHeejin Ahn return false; 1187*ed41945fSHeejin Ahn 1188*ed41945fSHeejin Ahn // Now we fix the mismatches by wrapping calls with inner try-delegates. 
1189*ed41945fSHeejin Ahn for (auto &P : UnwindDestToTryRanges) { 1190*ed41945fSHeejin Ahn NumCallUnwindMismatches += P.second.size(); 1191*ed41945fSHeejin Ahn MachineBasicBlock *UnwindDest = P.first; 1192*ed41945fSHeejin Ahn auto &TryRanges = P.second; 1193*ed41945fSHeejin Ahn 1194*ed41945fSHeejin Ahn for (auto Range : TryRanges) { 1195*ed41945fSHeejin Ahn MachineInstr *RangeBegin = nullptr, *RangeEnd = nullptr; 1196*ed41945fSHeejin Ahn std::tie(RangeBegin, RangeEnd) = Range; 1197*ed41945fSHeejin Ahn auto *MBB = RangeBegin->getParent(); 1198*ed41945fSHeejin Ahn 1199*ed41945fSHeejin Ahn // If this BB has an EH pad successor, i.e., ends with an 'invoke', now we 1200*ed41945fSHeejin Ahn // are going to wrap the invoke with try-delegate, making the 'delegate' 1201*ed41945fSHeejin Ahn // BB the new successor instead, so remove the EH pad succesor here. The 1202*ed41945fSHeejin Ahn // BB may not have an EH pad successor if calls in this BB throw to the 1203*ed41945fSHeejin Ahn // caller. 1204*ed41945fSHeejin Ahn MachineBasicBlock *EHPad = nullptr; 1205*ed41945fSHeejin Ahn for (auto *Succ : MBB->successors()) { 1206*ed41945fSHeejin Ahn if (Succ->isEHPad()) { 1207*ed41945fSHeejin Ahn EHPad = Succ; 1208*ed41945fSHeejin Ahn break; 1209*ed41945fSHeejin Ahn } 1210*ed41945fSHeejin Ahn } 1211*ed41945fSHeejin Ahn if (EHPad) 1212*ed41945fSHeejin Ahn MBB->removeSuccessor(EHPad); 1213*ed41945fSHeejin Ahn 1214*ed41945fSHeejin Ahn addTryDelegate(RangeBegin, RangeEnd, UnwindDest); 1215*ed41945fSHeejin Ahn } 1216*ed41945fSHeejin Ahn } 1217*ed41945fSHeejin Ahn 1218*ed41945fSHeejin Ahn return true; 1219*ed41945fSHeejin Ahn } 1220*ed41945fSHeejin Ahn 1221*ed41945fSHeejin Ahn bool WebAssemblyCFGStackify::fixCatchUnwindMismatches(MachineFunction &MF) { 1222*ed41945fSHeejin Ahn // TODO implement 1223c4ac74fbSHeejin Ahn return false; 1224c4ac74fbSHeejin Ahn } 1225c4ac74fbSHeejin Ahn 1226*ed41945fSHeejin Ahn void WebAssemblyCFGStackify::recalculateScopeTops(MachineFunction &MF) { 
1227*ed41945fSHeejin Ahn // Renumber BBs and recalculate ScopeTop info because new BBs might have been 1228*ed41945fSHeejin Ahn // created and inserted during fixing unwind mismatches. 1229*ed41945fSHeejin Ahn MF.RenumberBlocks(); 1230*ed41945fSHeejin Ahn ScopeTops.clear(); 1231*ed41945fSHeejin Ahn ScopeTops.resize(MF.getNumBlockIDs()); 1232*ed41945fSHeejin Ahn for (auto &MBB : reverse(MF)) { 1233*ed41945fSHeejin Ahn for (auto &MI : reverse(MBB)) { 1234*ed41945fSHeejin Ahn if (ScopeTops[MBB.getNumber()]) 1235*ed41945fSHeejin Ahn break; 1236*ed41945fSHeejin Ahn switch (MI.getOpcode()) { 1237*ed41945fSHeejin Ahn case WebAssembly::END_BLOCK: 1238*ed41945fSHeejin Ahn case WebAssembly::END_LOOP: 1239*ed41945fSHeejin Ahn case WebAssembly::END_TRY: 1240*ed41945fSHeejin Ahn case WebAssembly::DELEGATE: 1241*ed41945fSHeejin Ahn updateScopeTops(EndToBegin[&MI]->getParent(), &MBB); 1242*ed41945fSHeejin Ahn break; 1243*ed41945fSHeejin Ahn case WebAssembly::CATCH: 1244*ed41945fSHeejin Ahn case WebAssembly::CATCH_ALL: 1245*ed41945fSHeejin Ahn updateScopeTops(EHPadToTry[&MBB]->getParent(), &MBB); 1246*ed41945fSHeejin Ahn break; 1247*ed41945fSHeejin Ahn } 1248*ed41945fSHeejin Ahn } 1249*ed41945fSHeejin Ahn } 1250*ed41945fSHeejin Ahn } 1251*ed41945fSHeejin Ahn 1252*ed41945fSHeejin Ahn unsigned WebAssemblyCFGStackify::getDepth( 1253*ed41945fSHeejin Ahn const SmallVectorImpl<const MachineBasicBlock *> &Stack, 12541d68e80fSDan Gohman const MachineBasicBlock *MBB) { 1255*ed41945fSHeejin Ahn if (MBB == FakeCallerBB) 1256*ed41945fSHeejin Ahn return Stack.size(); 12571d68e80fSDan Gohman unsigned Depth = 0; 12581d68e80fSDan Gohman for (auto X : reverse(Stack)) { 12591d68e80fSDan Gohman if (X == MBB) 12601d68e80fSDan Gohman break; 12611d68e80fSDan Gohman ++Depth; 12621d68e80fSDan Gohman } 12631d68e80fSDan Gohman assert(Depth < Stack.size() && "Branch destination should be in scope"); 12641d68e80fSDan Gohman return Depth; 12651d68e80fSDan Gohman } 12661d68e80fSDan Gohman 12672726b88cSDan 
Gohman /// In normal assembly languages, when the end of a function is unreachable, 12682726b88cSDan Gohman /// because the function ends in an infinite loop or a noreturn call or similar, 12692726b88cSDan Gohman /// it isn't necessary to worry about the function return type at the end of 12702726b88cSDan Gohman /// the function, because it's never reached. However, in WebAssembly, blocks 12712726b88cSDan Gohman /// that end at the function end need to have a return type signature that 12722726b88cSDan Gohman /// matches the function signature, even though it's unreachable. This function 12732726b88cSDan Gohman /// checks for such cases and fixes up the signatures. 1274e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::fixEndsAtEndOfFunction(MachineFunction &MF) { 1275e76fa9ecSHeejin Ahn const auto &MFI = *MF.getInfo<WebAssemblyFunctionInfo>(); 12762726b88cSDan Gohman 12772726b88cSDan Gohman if (MFI.getResults().empty()) 12782726b88cSDan Gohman return; 12792726b88cSDan Gohman 12802cb27072SThomas Lively // MCInstLower will add the proper types to multivalue signatures based on the 12812cb27072SThomas Lively // function return type 12822cb27072SThomas Lively WebAssembly::BlockType RetType = 12832cb27072SThomas Lively MFI.getResults().size() > 1 12842cb27072SThomas Lively ? 
WebAssembly::BlockType::Multivalue 12852cb27072SThomas Lively : WebAssembly::BlockType( 12862cb27072SThomas Lively WebAssembly::toValType(MFI.getResults().front())); 12872726b88cSDan Gohman 1288d25c17f3SHeejin Ahn SmallVector<MachineBasicBlock::reverse_iterator, 4> Worklist; 1289d25c17f3SHeejin Ahn Worklist.push_back(MF.rbegin()->rbegin()); 1290d25c17f3SHeejin Ahn 1291d25c17f3SHeejin Ahn auto Process = [&](MachineBasicBlock::reverse_iterator It) { 1292d25c17f3SHeejin Ahn auto *MBB = It->getParent(); 1293d25c17f3SHeejin Ahn while (It != MBB->rend()) { 1294d25c17f3SHeejin Ahn MachineInstr &MI = *It++; 1295801bf7ebSShiva Chen if (MI.isPosition() || MI.isDebugInstr()) 12962726b88cSDan Gohman continue; 12972cb27072SThomas Lively switch (MI.getOpcode()) { 1298d25c17f3SHeejin Ahn case WebAssembly::END_TRY: { 1299d25c17f3SHeejin Ahn // If a 'try''s return type is fixed, both its try body and catch body 1300d25c17f3SHeejin Ahn // should satisfy the return type, so we need to search 'end' 1301d25c17f3SHeejin Ahn // instructions before its corresponding 'catch' too. 1302d25c17f3SHeejin Ahn auto *EHPad = TryToEHPad.lookup(EndToBegin[&MI]); 1303d25c17f3SHeejin Ahn assert(EHPad); 13049f8b2576SHeejin Ahn auto NextIt = 13059f8b2576SHeejin Ahn std::next(WebAssembly::findCatch(EHPad)->getReverseIterator()); 13069f8b2576SHeejin Ahn if (NextIt != EHPad->rend()) 13079f8b2576SHeejin Ahn Worklist.push_back(NextIt); 1308d25c17f3SHeejin Ahn LLVM_FALLTHROUGH; 1309d25c17f3SHeejin Ahn } 13102cb27072SThomas Lively case WebAssembly::END_BLOCK: 13112cb27072SThomas Lively case WebAssembly::END_LOOP: 131218c56a07SHeejin Ahn EndToBegin[&MI]->getOperand(0).setImm(int32_t(RetType)); 13132726b88cSDan Gohman continue; 13142cb27072SThomas Lively default: 1315d25c17f3SHeejin Ahn // Something other than an `end`. We're done for this BB. 13162726b88cSDan Gohman return; 13172726b88cSDan Gohman } 13182726b88cSDan Gohman } 1319d25c17f3SHeejin Ahn // We've reached the beginning of a BB. 
Continue the search in the previous 1320d25c17f3SHeejin Ahn // BB. 1321d25c17f3SHeejin Ahn Worklist.push_back(MBB->getPrevNode()->rbegin()); 1322d25c17f3SHeejin Ahn }; 1323d25c17f3SHeejin Ahn 1324d25c17f3SHeejin Ahn while (!Worklist.empty()) 1325d25c17f3SHeejin Ahn Process(Worklist.pop_back_val()); 13262cb27072SThomas Lively } 13272726b88cSDan Gohman 1328d934cb88SDan Gohman // WebAssembly functions end with an end instruction, as if the function body 1329d934cb88SDan Gohman // were a block. 133018c56a07SHeejin Ahn static void appendEndToFunction(MachineFunction &MF, 1331d934cb88SDan Gohman const WebAssemblyInstrInfo &TII) { 133210b31358SDerek Schuff BuildMI(MF.back(), MF.back().end(), 133310b31358SDerek Schuff MF.back().findPrevDebugLoc(MF.back().end()), 1334d934cb88SDan Gohman TII.get(WebAssembly::END_FUNCTION)); 1335d934cb88SDan Gohman } 1336d934cb88SDan Gohman 1337e76fa9ecSHeejin Ahn /// Insert LOOP/TRY/BLOCK markers at appropriate places. 1338e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::placeMarkers(MachineFunction &MF) { 1339e76fa9ecSHeejin Ahn // We allocate one more than the number of blocks in the function to 1340e76fa9ecSHeejin Ahn // accommodate for the possible fake block we may insert at the end. 1341e76fa9ecSHeejin Ahn ScopeTops.resize(MF.getNumBlockIDs() + 1); 13428fe7e86bSDan Gohman // Place the LOOP for MBB if MBB is the header of a loop. 1343e76fa9ecSHeejin Ahn for (auto &MBB : MF) 1344e76fa9ecSHeejin Ahn placeLoopMarker(MBB); 134544a5a4b1SHeejin Ahn 1346d6f48786SHeejin Ahn const MCAsmInfo *MCAI = MF.getTarget().getMCAsmInfo(); 134744a5a4b1SHeejin Ahn for (auto &MBB : MF) { 134844a5a4b1SHeejin Ahn if (MBB.isEHPad()) { 134944a5a4b1SHeejin Ahn // Place the TRY for MBB if MBB is the EH pad of an exception. 
1350e76fa9ecSHeejin Ahn if (MCAI->getExceptionHandlingType() == ExceptionHandling::Wasm && 1351e76fa9ecSHeejin Ahn MF.getFunction().hasPersonalityFn()) 1352e76fa9ecSHeejin Ahn placeTryMarker(MBB); 135344a5a4b1SHeejin Ahn } else { 135432807932SDan Gohman // Place the BLOCK for MBB if MBB is branched to from above. 1355e76fa9ecSHeejin Ahn placeBlockMarker(MBB); 1356950a13cfSDan Gohman } 135744a5a4b1SHeejin Ahn } 1358c4ac74fbSHeejin Ahn // Fix mismatches in unwind destinations induced by linearizing the code. 1359daeead4bSHeejin Ahn if (MCAI->getExceptionHandlingType() == ExceptionHandling::Wasm && 1360*ed41945fSHeejin Ahn MF.getFunction().hasPersonalityFn()) { 1361*ed41945fSHeejin Ahn bool Changed = fixCallUnwindMismatches(MF); 1362*ed41945fSHeejin Ahn Changed |= fixCatchUnwindMismatches(MF); 1363*ed41945fSHeejin Ahn if (Changed) 1364*ed41945fSHeejin Ahn recalculateScopeTops(MF); 1365*ed41945fSHeejin Ahn } 136644a5a4b1SHeejin Ahn } 1367950a13cfSDan Gohman 1368e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::rewriteDepthImmediates(MachineFunction &MF) { 13691d68e80fSDan Gohman // Now rewrite references to basic blocks to be depth immediates. 
13701d68e80fSDan Gohman SmallVector<const MachineBasicBlock *, 8> Stack; 1371*ed41945fSHeejin Ahn SmallVector<const MachineBasicBlock *, 8> DelegateStack; 13721d68e80fSDan Gohman for (auto &MBB : reverse(MF)) { 1373e76fa9ecSHeejin Ahn for (auto I = MBB.rbegin(), E = MBB.rend(); I != E; ++I) { 1374e76fa9ecSHeejin Ahn MachineInstr &MI = *I; 13751d68e80fSDan Gohman switch (MI.getOpcode()) { 13761d68e80fSDan Gohman case WebAssembly::BLOCK: 1377e76fa9ecSHeejin Ahn case WebAssembly::TRY: 1378e76fa9ecSHeejin Ahn assert(ScopeTops[Stack.back()->getNumber()]->getNumber() <= 1379e76fa9ecSHeejin Ahn MBB.getNumber() && 1380e76fa9ecSHeejin Ahn "Block/try marker should be balanced"); 1381e76fa9ecSHeejin Ahn Stack.pop_back(); 1382*ed41945fSHeejin Ahn DelegateStack.pop_back(); 1383e76fa9ecSHeejin Ahn break; 1384e76fa9ecSHeejin Ahn 13851d68e80fSDan Gohman case WebAssembly::LOOP: 13861d68e80fSDan Gohman assert(Stack.back() == &MBB && "Loop top should be balanced"); 13871d68e80fSDan Gohman Stack.pop_back(); 1388*ed41945fSHeejin Ahn DelegateStack.pop_back(); 13891d68e80fSDan Gohman break; 1390e76fa9ecSHeejin Ahn 13911d68e80fSDan Gohman case WebAssembly::END_BLOCK: 1392*ed41945fSHeejin Ahn Stack.push_back(&MBB); 1393*ed41945fSHeejin Ahn DelegateStack.push_back(&MBB); 1394*ed41945fSHeejin Ahn break; 1395*ed41945fSHeejin Ahn 1396e76fa9ecSHeejin Ahn case WebAssembly::END_TRY: 1397*ed41945fSHeejin Ahn // We handle DELEGATE in the default level, because DELEGATE has 1398*ed41945fSHeejin Ahn // immediate operands to rewirte. 
13991d68e80fSDan Gohman Stack.push_back(&MBB); 14001d68e80fSDan Gohman break; 1401e76fa9ecSHeejin Ahn 14021d68e80fSDan Gohman case WebAssembly::END_LOOP: 1403e76fa9ecSHeejin Ahn Stack.push_back(EndToBegin[&MI]->getParent()); 1404*ed41945fSHeejin Ahn DelegateStack.push_back(EndToBegin[&MI]->getParent()); 1405*ed41945fSHeejin Ahn break; 1406*ed41945fSHeejin Ahn 1407*ed41945fSHeejin Ahn case WebAssembly::CATCH: 1408*ed41945fSHeejin Ahn case WebAssembly::CATCH_ALL: 1409*ed41945fSHeejin Ahn DelegateStack.push_back(&MBB); 14101d68e80fSDan Gohman break; 1411e76fa9ecSHeejin Ahn 14121d68e80fSDan Gohman default: 14131d68e80fSDan Gohman if (MI.isTerminator()) { 14141d68e80fSDan Gohman // Rewrite MBB operands to be depth immediates. 14151d68e80fSDan Gohman SmallVector<MachineOperand, 4> Ops(MI.operands()); 14161d68e80fSDan Gohman while (MI.getNumOperands() > 0) 14171d68e80fSDan Gohman MI.RemoveOperand(MI.getNumOperands() - 1); 14181d68e80fSDan Gohman for (auto MO : Ops) { 1419*ed41945fSHeejin Ahn if (MO.isMBB()) { 1420*ed41945fSHeejin Ahn if (MI.getOpcode() == WebAssembly::DELEGATE) 1421*ed41945fSHeejin Ahn MO = MachineOperand::CreateImm( 1422*ed41945fSHeejin Ahn getDepth(DelegateStack, MO.getMBB())); 1423*ed41945fSHeejin Ahn else 142418c56a07SHeejin Ahn MO = MachineOperand::CreateImm(getDepth(Stack, MO.getMBB())); 1425*ed41945fSHeejin Ahn } 14261d68e80fSDan Gohman MI.addOperand(MF, MO); 142732807932SDan Gohman } 14281d68e80fSDan Gohman } 1429*ed41945fSHeejin Ahn 1430*ed41945fSHeejin Ahn if (MI.getOpcode() == WebAssembly::DELEGATE) { 1431*ed41945fSHeejin Ahn Stack.push_back(&MBB); 1432*ed41945fSHeejin Ahn DelegateStack.push_back(&MBB); 1433*ed41945fSHeejin Ahn } 14341d68e80fSDan Gohman break; 14351d68e80fSDan Gohman } 14361d68e80fSDan Gohman } 14371d68e80fSDan Gohman } 14381d68e80fSDan Gohman assert(Stack.empty() && "Control flow should be balanced"); 1439e76fa9ecSHeejin Ahn } 14402726b88cSDan Gohman 1441*ed41945fSHeejin Ahn void 
WebAssemblyCFGStackify::cleanupFunctionData(MachineFunction &MF) { 1442*ed41945fSHeejin Ahn if (FakeCallerBB) 1443*ed41945fSHeejin Ahn MF.DeleteMachineBasicBlock(FakeCallerBB); 1444*ed41945fSHeejin Ahn AppendixBB = FakeCallerBB = nullptr; 1445*ed41945fSHeejin Ahn } 1446*ed41945fSHeejin Ahn 1447e76fa9ecSHeejin Ahn void WebAssemblyCFGStackify::releaseMemory() { 1448e76fa9ecSHeejin Ahn ScopeTops.clear(); 1449e76fa9ecSHeejin Ahn BeginToEnd.clear(); 1450e76fa9ecSHeejin Ahn EndToBegin.clear(); 1451e76fa9ecSHeejin Ahn TryToEHPad.clear(); 1452e76fa9ecSHeejin Ahn EHPadToTry.clear(); 14531d68e80fSDan Gohman } 145432807932SDan Gohman 1455950a13cfSDan Gohman bool WebAssemblyCFGStackify::runOnMachineFunction(MachineFunction &MF) { 1456d34e60caSNicola Zaghen LLVM_DEBUG(dbgs() << "********** CFG Stackifying **********\n" 1457950a13cfSDan Gohman "********** Function: " 1458950a13cfSDan Gohman << MF.getName() << '\n'); 1459cf699b45SHeejin Ahn const MCAsmInfo *MCAI = MF.getTarget().getMCAsmInfo(); 1460950a13cfSDan Gohman 1461e76fa9ecSHeejin Ahn releaseMemory(); 1462e76fa9ecSHeejin Ahn 1463e040533eSDan Gohman // Liveness is not tracked for VALUE_STACK physreg. 14649c3bf318SDerek Schuff MF.getRegInfo().invalidateLiveness(); 1465950a13cfSDan Gohman 1466e76fa9ecSHeejin Ahn // Place the BLOCK/LOOP/TRY markers to indicate the beginnings of scopes. 1467e76fa9ecSHeejin Ahn placeMarkers(MF); 1468e76fa9ecSHeejin Ahn 1469c4ac74fbSHeejin Ahn // Remove unnecessary instructions possibly introduced by try/end_trys. 1470cf699b45SHeejin Ahn if (MCAI->getExceptionHandlingType() == ExceptionHandling::Wasm && 1471cf699b45SHeejin Ahn MF.getFunction().hasPersonalityFn()) 1472cf699b45SHeejin Ahn removeUnnecessaryInstrs(MF); 1473cf699b45SHeejin Ahn 1474e76fa9ecSHeejin Ahn // Convert MBB operands in terminators to relative depth immediates. 
1475e76fa9ecSHeejin Ahn rewriteDepthImmediates(MF); 1476e76fa9ecSHeejin Ahn 1477e76fa9ecSHeejin Ahn // Fix up block/loop/try signatures at the end of the function to conform to 1478e76fa9ecSHeejin Ahn // WebAssembly's rules. 1479e76fa9ecSHeejin Ahn fixEndsAtEndOfFunction(MF); 1480e76fa9ecSHeejin Ahn 1481e76fa9ecSHeejin Ahn // Add an end instruction at the end of the function body. 1482e76fa9ecSHeejin Ahn const auto &TII = *MF.getSubtarget<WebAssemblySubtarget>().getInstrInfo(); 1483e76fa9ecSHeejin Ahn if (!MF.getSubtarget<WebAssemblySubtarget>() 1484e76fa9ecSHeejin Ahn .getTargetTriple() 1485e76fa9ecSHeejin Ahn .isOSBinFormatELF()) 148618c56a07SHeejin Ahn appendEndToFunction(MF, TII); 148732807932SDan Gohman 1488*ed41945fSHeejin Ahn cleanupFunctionData(MF); 1489*ed41945fSHeejin Ahn 14901aaa481fSHeejin Ahn MF.getInfo<WebAssemblyFunctionInfo>()->setCFGStackified(); 1491950a13cfSDan Gohman return true; 1492950a13cfSDan Gohman } 1493