Index: lib/Target/WebAssembly/CMakeLists.txt =================================================================== --- lib/Target/WebAssembly/CMakeLists.txt +++ lib/Target/WebAssembly/CMakeLists.txt @@ -12,6 +12,7 @@ add_llvm_target(WebAssemblyCodeGen Relooper.cpp WebAssemblyAsmPrinter.cpp + WebAssemblyCFGStackify.cpp WebAssemblyFastISel.cpp WebAssemblyFrameLowering.cpp WebAssemblyISelDAGToDAG.cpp Index: lib/Target/WebAssembly/WebAssembly.h =================================================================== --- lib/Target/WebAssembly/WebAssembly.h +++ lib/Target/WebAssembly/WebAssembly.h @@ -26,6 +26,8 @@ FunctionPass *createWebAssemblyISelDag(WebAssemblyTargetMachine &TM, CodeGenOpt::Level OptLevel); +FunctionPass *createWebAssemblyCFGStackify(); + } // end namespace llvm #endif Index: lib/Target/WebAssembly/WebAssemblyCFGStackify.cpp =================================================================== --- lib/Target/WebAssembly/WebAssemblyCFGStackify.cpp +++ lib/Target/WebAssembly/WebAssemblyCFGStackify.cpp @@ -0,0 +1,190 @@ +//===-- WebAssemblyCFGStackify.cpp - CFG Stackification -------------------===// +// +// The LLVM Compiler Infrastructure +// +// This file is distributed under the University of Illinois Open Source +// License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// +/// +/// \file +/// \brief This file implements a CFG stacking pass. +/// +//===----------------------------------------------------------------------===// + +#include "WebAssembly.h" +#include "MCTargetDesc/WebAssemblyMCTargetDesc.h" +#include "WebAssemblySubtarget.h" +#include "llvm/CodeGen/MachineFunction.h" +#include "llvm/CodeGen/MachineInstrBuilder.h" +#include "llvm/CodeGen/MachineLoopInfo.h" +#include "llvm/CodeGen/Passes.h" +#include "llvm/Support/Debug.h" +#include "llvm/Support/raw_ostream.h" +using namespace llvm; + +#define DEBUG_TYPE "wasm-cfg-stackify" + +namespace { +class WebAssemblyCFGStackify final : public MachineFunctionPass { +public: + static char ID; // Pass identification, replacement for typeid + WebAssemblyCFGStackify() : MachineFunctionPass(ID) {} + +private: + const char *getPassName() const override { + return "WebAssembly CFG Stackify"; + } + + void getAnalysisUsage(AnalysisUsage &AU) const override { + AU.setPreservesCFG(); + AU.addRequired(); + AU.addPreserved(); + MachineFunctionPass::getAnalysisUsage(AU); + } + + bool runOnMachineFunction(MachineFunction &MF) override; +}; +} // end anonymous namespace + +char WebAssemblyCFGStackify::ID = 0; +FunctionPass *llvm::createWebAssemblyCFGStackify() { + return new WebAssemblyCFGStackify(); +} + +static bool IsNext(MachineBasicBlock *M, MachineBasicBlock *N) { + return next(MachineFunction::iterator(M)) == MachineFunction::iterator(N); +} + +namespace { +struct RPOStackEntry { + MachineBasicBlock *MBB; + SmallVector Succs; + + RPOStackEntry(MachineBasicBlock *MBB, const MachineLoopInfo &MLI) : MBB(MBB) { + // RPO is not a unique form, since at every basic block with multiple + // successors, the DFS has to pick which order to visit the successors in. + // This code attempts to order the successors strategically. + // + // FIXME: Right now this is some hackish code that attempts to sort the + // successors to make loops contiguous and to prefer to keep blocks in + // existing layout order when possible. + unsigned Depth = MLI.getLoopDepth(MBB); + for (auto Succ : MBB->successors()) + if (MLI.getLoopDepth(Succ) != Depth && IsNext(MBB, Succ)) + Succs.push_back(Succ); + for (auto Succ : MBB->successors()) + if (MLI.getLoopDepth(Succ) != Depth && !IsNext(MBB, Succ)) + Succs.push_back(Succ); + for (auto Succ : MBB->successors()) + if (MLI.getLoopDepth(Succ) == Depth && IsNext(MBB, Succ)) + Succs.push_back(Succ); + for (auto Succ : MBB->successors()) + if (MLI.getLoopDepth(Succ) == Depth && !IsNext(MBB, Succ)) + Succs.push_back(Succ); + } +}; +} + +// Sort the blocks in RPO, taking special care to make sure that loops are +// contiguous even in the case of split backedges. +static void SortBlocks(MachineFunction &MF, const MachineLoopInfo &MLI) { + SmallPtrSet Visited; + SmallVector Stack; + + MachineBasicBlock *Entry = MF.begin(); + Stack.push_back(RPOStackEntry(Entry, MLI)); + Visited.insert(Entry); + + do { + top: + RPOStackEntry &Entry = Stack.back(); + SmallVectorImpl &Succs = Entry.Succs; + if (!Succs.empty()) { + MachineBasicBlock *Succ = Succs.pop_back_val(); + if (Visited.insert(Succ).second) + Stack.push_back(RPOStackEntry(Succ, MLI)); + goto top; + } + MachineBasicBlock *MBB = Entry.MBB; + MBB->moveBefore(MF.begin()); + MBB->updateTerminator(); + Stack.pop_back(); + } while (!Stack.empty()); +} + +static void PlaceMarkers(MachineFunction &MF, const MachineLoopInfo &MLI, + const WebAssemblyInstrInfo *TII) { + for (auto &MBB : MF) { + // Place the LOOP for a loop. + if (MachineLoop *Loop = MLI.getLoopFor(&MBB)) { + MachineBasicBlock *Top = Loop->getTopBlock(); + assert(Loop->getHeader() == Top); + if (Top == &MBB) + BuildMI(*Top, Top->begin(), DebugLoc(), TII->get(WebAssembly::LOOP)) + .addMBB(Loop->getBottomBlock()); + } + + // Check for forward branches to handle. + for (auto &Term : MBB.terminators()) { + switch (Term.getOpcode()) { + case WebAssembly::BR: + case WebAssembly::BRIF: { + MachineBasicBlock *Succ = Term.getOperand(0).getMBB(); + if (Succ->getNumber() > MBB.getNumber()) { + // Place the BLOCK for a forward branch. + MachineLoop *Loop = MLI.getLoopFor(Succ); + MachineBasicBlock *Header = Loop ? Loop->getHeader() : &MF.front(); + MachineBasicBlock::iterator I = Header->begin(); + if (I->getOpcode() == WebAssembly::LOOP) + ++I; + int SuccNumber = Succ->getNumber(); + // Position the BLOCK in nesting order. + while (I->getOpcode() == WebAssembly::BLOCK) { + int N = I->getOperand(0).getMBB()->getNumber(); + if (N < SuccNumber) + break; + // If there's already a BLOCK for Succ, we don't need another. + if (N == SuccNumber) + goto skip_block; + ++I; + } + + BuildMI(*Header, I, DebugLoc(), TII->get(WebAssembly::BLOCK)) + .addMBB(Succ); + } + skip_block:; + break; + } + case WebAssembly::RETURN_VOID: + case WebAssembly::RETURN_Int32: + case WebAssembly::RETURN_Float32: + case WebAssembly::RETURN_Int64: + case WebAssembly::RETURN_Float64: + break; + default: + llvm_unreachable("unhandled terminator"); + } + } + } +} + +bool WebAssemblyCFGStackify::runOnMachineFunction(MachineFunction &MF) { + DEBUG(dbgs() << "********** CFG Stackifying **********\n" + "********** Function: " + << MF.getName() << '\n'); + + const MachineLoopInfo &MLI = getAnalysis(); + const auto *TII = MF.getSubtarget().getInstrInfo(); + + // Sort the blocks in RPO, with contiguous loops. + SortBlocks(MF, MLI); + + // Now that we've sorted the blocks in RPO, renumber them. + MF.RenumberBlocks(); + + // Place the BLOCK and LOOP markers to indicate the beginnings of scopes. + PlaceMarkers(MF, MLI, TII); + + return true; +} Index: lib/Target/WebAssembly/WebAssemblyISD.def =================================================================== --- lib/Target/WebAssembly/WebAssemblyISD.def +++ lib/Target/WebAssembly/WebAssemblyISD.def @@ -19,5 +19,6 @@ HANDLE_NODETYPE(RETURN) HANDLE_NODETYPE(ARGUMENT) HANDLE_NODETYPE(Wrapper) +HANDLE_NODETYPE(BRIF) // add memory opcodes starting at ISD::FIRST_TARGET_MEMORY_OPCODE here... Index: lib/Target/WebAssembly/WebAssemblyISelLowering.cpp =================================================================== --- lib/Target/WebAssembly/WebAssemblyISelLowering.cpp +++ lib/Target/WebAssembly/WebAssemblyISelLowering.cpp @@ -153,6 +153,12 @@ setOperationAction(ISD::STACKRESTORE, MVT::Other, Expand); setOperationAction(ISD::DYNAMIC_STACKALLOC, MVTPtr, Expand); + // Expand these forms; we pattern-match the forms that we can handle in isel. + setOperationAction(ISD::BR_JT, MVT::Other, Expand); + for (auto T : {MVT::i32, MVT::i64, MVT::f32, MVT::f64}) + for (auto Op : {ISD::BR_CC, ISD::SELECT_CC}) + setOperationAction(Op, T, Expand); + // WebAssembly doesn't have: // - Floating-point extending loads. // - Floating-point truncating stores. Index: lib/Target/WebAssembly/WebAssemblyInstrControl.td =================================================================== --- lib/Target/WebAssembly/WebAssemblyInstrControl.td +++ lib/Target/WebAssembly/WebAssemblyInstrControl.td @@ -25,6 +25,17 @@ * switch: switch statement with fallthrough */ +let isBranch = 1, isTerminator = 1, hasCtrlDep = 1 in { +def BRIF : I<(outs), (ins bb_op:$dst, Int32:$a), + [(brcond Int32:$a, bb:$dst)]>; +let isBarrier = 1 in +def BR : I<(outs), (ins bb_op:$dst), + [(br bb:$dst)]>; +} // isBranch = 1, isTerminator = 1, hasCtrlDep = 1 + +def BLOCK : I<(outs), (ins bb_op:$dst), []>; +def LOOP : I<(outs), (ins bb_op:$dst), []>; + multiclass RETURN { def RETURN_#vt : I<(outs), (ins vt:$val), [(WebAssemblyreturn vt:$val)]>; } @@ -35,3 +46,16 @@ defm : RETURN; def RETURN_VOID : I<(outs), (ins), [(WebAssemblyreturn)]>; } // isReturn = 1, isTerminator = 1, hasCtrlDep = 1, isBarrier = 1 + +def SELECT_I32 : I<(outs Int32:$dst), (ins Int32:$a, Int32:$t, Int32:$f), + [(set Int32:$dst, (select Int32:$a, Int32:$t, Int32:$f))]>; +def SELECT_I64 : I<(outs Int64:$dst), (ins Int64:$a, Int64:$t, Int64:$f), + [(set Int64:$dst, (select Int64:$a, Int64:$t, Int64:$f))]>; +def SELECT_F32 : I<(outs Float32:$dst), + (ins Int32:$a, Float32:$lhs, Float32:$rhs), + [(set Float32:$dst, + (select Int32:$a, Float32:$lhs, Float32:$rhs))]>; +def SELECT_F64 : I<(outs Float64:$dst), + (ins Int32:$a, Float64:$lhs, Float64:$rhs), + [(set Float64:$dst, + (select Int32:$a, Float64:$lhs, Float64:$rhs))]>; Index: lib/Target/WebAssembly/WebAssemblyInstrInfo.h =================================================================== --- lib/Target/WebAssembly/WebAssemblyInstrInfo.h +++ lib/Target/WebAssembly/WebAssemblyInstrInfo.h @@ -37,6 +37,18 @@ void copyPhysReg(MachineBasicBlock &MBB, MachineBasicBlock::iterator MI, DebugLoc DL, unsigned DestReg, unsigned SrcReg, bool KillSrc) const override; + + bool AnalyzeBranch(MachineBasicBlock &MBB, MachineBasicBlock *&TBB, + MachineBasicBlock *&FBB, + SmallVectorImpl &Cond, + bool AllowModify = false) const override; + unsigned RemoveBranch(MachineBasicBlock &MBB) const override; + unsigned InsertBranch(MachineBasicBlock &MBB, MachineBasicBlock *TBB, + MachineBasicBlock *FBB, + ArrayRef Cond, + DebugLoc DL) const override; + bool + ReverseBranchCondition(SmallVectorImpl &Cond) const override; }; } // end namespace llvm Index: lib/Target/WebAssembly/WebAssemblyInstrInfo.cpp =================================================================== --- lib/Target/WebAssembly/WebAssemblyInstrInfo.cpp +++ lib/Target/WebAssembly/WebAssemblyInstrInfo.cpp @@ -37,3 +37,89 @@ BuildMI(MBB, I, DL, get(WebAssembly::COPY), DestReg) .addReg(SrcReg, KillSrc ? RegState::Kill : 0); } + +// Branch analysis. +bool WebAssemblyInstrInfo::AnalyzeBranch(MachineBasicBlock &MBB, + MachineBasicBlock *&TBB, + MachineBasicBlock *&FBB, + SmallVectorImpl &Cond, + bool AllowModify) const { + bool HaveCond = false; + for (MachineInstr &MI : iterator_range( + MBB.getFirstInstrTerminator(), MBB.instr_end())) { + switch (MI.getOpcode()) { + default: + // Unhandled instruction; bail out. + return true; + case WebAssembly::BRIF: + if (HaveCond) + return true; + Cond.push_back(MI.getOperand(1)); + TBB = MI.getOperand(0).getMBB(); + HaveCond = true; + break; + case WebAssembly::BR: + if (!HaveCond) + TBB = MI.getOperand(0).getMBB(); + else + FBB = MI.getOperand(0).getMBB(); + break; + } + if (MI.isBarrier()) + break; + } + + return false; +} + +unsigned WebAssemblyInstrInfo::RemoveBranch(MachineBasicBlock &MBB) const { + MachineBasicBlock::instr_iterator I = MBB.instr_end(); + unsigned Count = 0; + + while (I != MBB.instr_begin()) { + --I; + if (I->isDebugValue()) + continue; + if (!I->isTerminator()) + break; + // Remove the branch. + I->eraseFromParent(); + I = MBB.instr_end(); + ++Count; + } + + return Count; +} + +unsigned WebAssemblyInstrInfo::InsertBranch( + MachineBasicBlock &MBB, MachineBasicBlock *TBB, MachineBasicBlock *FBB, + ArrayRef Cond, DebugLoc DL) const { + assert(Cond.size() <= 1); + + if (Cond.empty()) { + if (!TBB) + return 0; + + BuildMI(&MBB, DL, get(WebAssembly::BR)).addMBB(TBB); + return 1; + } + + BuildMI(&MBB, DL, get(WebAssembly::BRIF)) + .addMBB(TBB) + .addOperand(Cond[0]); + if (!FBB) + return 1; + + BuildMI(&MBB, DL, get(WebAssembly::BR)).addMBB(FBB); + return 2; +} + +bool WebAssemblyInstrInfo::ReverseBranchCondition( + SmallVectorImpl &Cond) const { + assert(Cond.size() == 1); + + // TODO: Add branch reversal here... And re-enable MachineBlockPlacementID + // when we do. + + return true; +} Index: lib/Target/WebAssembly/WebAssemblyInstrInfo.td =================================================================== --- lib/Target/WebAssembly/WebAssemblyInstrInfo.td +++ lib/Target/WebAssembly/WebAssemblyInstrInfo.td @@ -69,6 +69,7 @@ * set_local: set the current value of a local variable */ +def bb_op : Operand; def global : Operand; //===----------------------------------------------------------------------===// Index: lib/Target/WebAssembly/WebAssemblyTargetMachine.cpp =================================================================== --- lib/Target/WebAssembly/WebAssemblyTargetMachine.cpp +++ lib/Target/WebAssembly/WebAssemblyTargetMachine.cpp @@ -159,8 +159,14 @@ disablePass(&PrologEpilogCodeInserterID); // Fails with: should be run after register allocation. disablePass(&MachineCopyPropagationID); + + // FIXME: Until we get ReverseBranchCondition support, MachineBlockPlacement + // can create ugly-looking control flow. + disablePass(&MachineBlockPlacementID); } void WebAssemblyPassConfig::addPreSched2() {} -void WebAssemblyPassConfig::addPreEmitPass() {} +void WebAssemblyPassConfig::addPreEmitPass() { + addPass(createWebAssemblyCFGStackify()); +} Index: test/CodeGen/WebAssembly/phi.ll =================================================================== --- test/CodeGen/WebAssembly/phi.ll +++ test/CodeGen/WebAssembly/phi.ll @@ -1,8 +1,5 @@ ; RUN: llc < %s -asm-verbose=false | FileCheck %s -; This test depends on branching support, which is not yet checked in. -; XFAIL: * - ; Test that phis are lowered. target datalayout = "e-p:32:32-i64:64-v128:8:128-n32:64-S128"