1*0b57cec5SDimitry Andric //- WebAssemblyISelDAGToDAG.cpp - A dag to dag inst selector for WebAssembly -// 2*0b57cec5SDimitry Andric // 3*0b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4*0b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 5*0b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6*0b57cec5SDimitry Andric // 7*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 8*0b57cec5SDimitry Andric /// 9*0b57cec5SDimitry Andric /// \file 10*0b57cec5SDimitry Andric /// This file defines an instruction selector for the WebAssembly target. 11*0b57cec5SDimitry Andric /// 12*0b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 13*0b57cec5SDimitry Andric 14*0b57cec5SDimitry Andric #include "MCTargetDesc/WebAssemblyMCTargetDesc.h" 15*0b57cec5SDimitry Andric #include "WebAssembly.h" 16*0b57cec5SDimitry Andric #include "WebAssemblyTargetMachine.h" 17*0b57cec5SDimitry Andric #include "llvm/CodeGen/SelectionDAGISel.h" 18*0b57cec5SDimitry Andric #include "llvm/IR/DiagnosticInfo.h" 19*0b57cec5SDimitry Andric #include "llvm/IR/Function.h" // To access function attributes. 20*0b57cec5SDimitry Andric #include "llvm/Support/Debug.h" 21*0b57cec5SDimitry Andric #include "llvm/Support/KnownBits.h" 22*0b57cec5SDimitry Andric #include "llvm/Support/MathExtras.h" 23*0b57cec5SDimitry Andric #include "llvm/Support/raw_ostream.h" 24*0b57cec5SDimitry Andric using namespace llvm; 25*0b57cec5SDimitry Andric 26*0b57cec5SDimitry Andric #define DEBUG_TYPE "wasm-isel" 27*0b57cec5SDimitry Andric 28*0b57cec5SDimitry Andric //===--------------------------------------------------------------------===// 29*0b57cec5SDimitry Andric /// WebAssembly-specific code to select WebAssembly machine instructions for 30*0b57cec5SDimitry Andric /// SelectionDAG operations. 31*0b57cec5SDimitry Andric /// 32*0b57cec5SDimitry Andric namespace { 33*0b57cec5SDimitry Andric class WebAssemblyDAGToDAGISel final : public SelectionDAGISel { 34*0b57cec5SDimitry Andric /// Keep a pointer to the WebAssemblySubtarget around so that we can make the 35*0b57cec5SDimitry Andric /// right decision when generating code for different targets. 36*0b57cec5SDimitry Andric const WebAssemblySubtarget *Subtarget; 37*0b57cec5SDimitry Andric 38*0b57cec5SDimitry Andric bool ForCodeSize; 39*0b57cec5SDimitry Andric 40*0b57cec5SDimitry Andric public: 41*0b57cec5SDimitry Andric WebAssemblyDAGToDAGISel(WebAssemblyTargetMachine &TM, 42*0b57cec5SDimitry Andric CodeGenOpt::Level OptLevel) 43*0b57cec5SDimitry Andric : SelectionDAGISel(TM, OptLevel), Subtarget(nullptr), ForCodeSize(false) { 44*0b57cec5SDimitry Andric } 45*0b57cec5SDimitry Andric 46*0b57cec5SDimitry Andric StringRef getPassName() const override { 47*0b57cec5SDimitry Andric return "WebAssembly Instruction Selection"; 48*0b57cec5SDimitry Andric } 49*0b57cec5SDimitry Andric 50*0b57cec5SDimitry Andric bool runOnMachineFunction(MachineFunction &MF) override { 51*0b57cec5SDimitry Andric LLVM_DEBUG(dbgs() << "********** ISelDAGToDAG **********\n" 52*0b57cec5SDimitry Andric "********** Function: " 53*0b57cec5SDimitry Andric << MF.getName() << '\n'); 54*0b57cec5SDimitry Andric 55*0b57cec5SDimitry Andric ForCodeSize = MF.getFunction().hasOptSize(); 56*0b57cec5SDimitry Andric Subtarget = &MF.getSubtarget<WebAssemblySubtarget>(); 57*0b57cec5SDimitry Andric return SelectionDAGISel::runOnMachineFunction(MF); 58*0b57cec5SDimitry Andric } 59*0b57cec5SDimitry Andric 60*0b57cec5SDimitry Andric void Select(SDNode *Node) override; 61*0b57cec5SDimitry Andric 62*0b57cec5SDimitry Andric bool SelectInlineAsmMemoryOperand(const SDValue &Op, unsigned ConstraintID, 63*0b57cec5SDimitry Andric std::vector<SDValue> &OutOps) override; 64*0b57cec5SDimitry Andric 65*0b57cec5SDimitry Andric // Include the pieces autogenerated from the target description. 66*0b57cec5SDimitry Andric #include "WebAssemblyGenDAGISel.inc" 67*0b57cec5SDimitry Andric 68*0b57cec5SDimitry Andric private: 69*0b57cec5SDimitry Andric // add select functions here... 70*0b57cec5SDimitry Andric }; 71*0b57cec5SDimitry Andric } // end anonymous namespace 72*0b57cec5SDimitry Andric 73*0b57cec5SDimitry Andric void WebAssemblyDAGToDAGISel::Select(SDNode *Node) { 74*0b57cec5SDimitry Andric // If we have a custom node, we already have selected! 75*0b57cec5SDimitry Andric if (Node->isMachineOpcode()) { 76*0b57cec5SDimitry Andric LLVM_DEBUG(errs() << "== "; Node->dump(CurDAG); errs() << "\n"); 77*0b57cec5SDimitry Andric Node->setNodeId(-1); 78*0b57cec5SDimitry Andric return; 79*0b57cec5SDimitry Andric } 80*0b57cec5SDimitry Andric 81*0b57cec5SDimitry Andric // Few custom selection stuff. 82*0b57cec5SDimitry Andric SDLoc DL(Node); 83*0b57cec5SDimitry Andric MachineFunction &MF = CurDAG->getMachineFunction(); 84*0b57cec5SDimitry Andric switch (Node->getOpcode()) { 85*0b57cec5SDimitry Andric case ISD::ATOMIC_FENCE: { 86*0b57cec5SDimitry Andric if (!MF.getSubtarget<WebAssemblySubtarget>().hasAtomics()) 87*0b57cec5SDimitry Andric break; 88*0b57cec5SDimitry Andric 89*0b57cec5SDimitry Andric uint64_t SyncScopeID = 90*0b57cec5SDimitry Andric cast<ConstantSDNode>(Node->getOperand(2).getNode())->getZExtValue(); 91*0b57cec5SDimitry Andric switch (SyncScopeID) { 92*0b57cec5SDimitry Andric case SyncScope::SingleThread: { 93*0b57cec5SDimitry Andric // We lower a single-thread fence to a pseudo compiler barrier instruction 94*0b57cec5SDimitry Andric // preventing instruction reordering. This will not be emitted in final 95*0b57cec5SDimitry Andric // binary. 96*0b57cec5SDimitry Andric MachineSDNode *Fence = 97*0b57cec5SDimitry Andric CurDAG->getMachineNode(WebAssembly::COMPILER_FENCE, 98*0b57cec5SDimitry Andric DL, // debug loc 99*0b57cec5SDimitry Andric MVT::Other, // outchain type 100*0b57cec5SDimitry Andric Node->getOperand(0) // inchain 101*0b57cec5SDimitry Andric ); 102*0b57cec5SDimitry Andric ReplaceNode(Node, Fence); 103*0b57cec5SDimitry Andric CurDAG->RemoveDeadNode(Node); 104*0b57cec5SDimitry Andric return; 105*0b57cec5SDimitry Andric } 106*0b57cec5SDimitry Andric 107*0b57cec5SDimitry Andric case SyncScope::System: { 108*0b57cec5SDimitry Andric // For non-emscripten systems, we have not decided on what we should 109*0b57cec5SDimitry Andric // traslate fences to yet. 110*0b57cec5SDimitry Andric if (!Subtarget->getTargetTriple().isOSEmscripten()) 111*0b57cec5SDimitry Andric report_fatal_error( 112*0b57cec5SDimitry Andric "ATOMIC_FENCE is not yet supported in non-emscripten OSes"); 113*0b57cec5SDimitry Andric 114*0b57cec5SDimitry Andric // Wasm does not have a fence instruction, but because all atomic 115*0b57cec5SDimitry Andric // instructions in wasm are sequentially consistent, we translate a 116*0b57cec5SDimitry Andric // fence to an idempotent atomic RMW instruction to a linear memory 117*0b57cec5SDimitry Andric // address. All atomic instructions in wasm are sequentially consistent, 118*0b57cec5SDimitry Andric // but this is to ensure a fence also prevents reordering of non-atomic 119*0b57cec5SDimitry Andric // instructions in the VM. Even though LLVM IR's fence instruction does 120*0b57cec5SDimitry Andric // not say anything about its relationship with non-atomic instructions, 121*0b57cec5SDimitry Andric // we think this is more user-friendly. 122*0b57cec5SDimitry Andric // 123*0b57cec5SDimitry Andric // While any address can work, here we use a value stored in 124*0b57cec5SDimitry Andric // __stack_pointer wasm global because there's high chance that area is 125*0b57cec5SDimitry Andric // in cache. 126*0b57cec5SDimitry Andric // 127*0b57cec5SDimitry Andric // So the selected instructions will be in the form of: 128*0b57cec5SDimitry Andric // %addr = get_global $__stack_pointer 129*0b57cec5SDimitry Andric // %0 = i32.const 0 130*0b57cec5SDimitry Andric // i32.atomic.rmw.or %addr, %0 131*0b57cec5SDimitry Andric SDValue StackPtrSym = CurDAG->getTargetExternalSymbol( 132*0b57cec5SDimitry Andric "__stack_pointer", TLI->getPointerTy(CurDAG->getDataLayout())); 133*0b57cec5SDimitry Andric MachineSDNode *GetGlobal = 134*0b57cec5SDimitry Andric CurDAG->getMachineNode(WebAssembly::GLOBAL_GET_I32, // opcode 135*0b57cec5SDimitry Andric DL, // debug loc 136*0b57cec5SDimitry Andric MVT::i32, // result type 137*0b57cec5SDimitry Andric StackPtrSym // __stack_pointer symbol 138*0b57cec5SDimitry Andric ); 139*0b57cec5SDimitry Andric 140*0b57cec5SDimitry Andric SDValue Zero = CurDAG->getTargetConstant(0, DL, MVT::i32); 141*0b57cec5SDimitry Andric auto *MMO = MF.getMachineMemOperand( 142*0b57cec5SDimitry Andric MachinePointerInfo::getUnknownStack(MF), 143*0b57cec5SDimitry Andric // FIXME Volatile isn't really correct, but currently all LLVM 144*0b57cec5SDimitry Andric // atomic instructions are treated as volatiles in the backend, so 145*0b57cec5SDimitry Andric // we should be consistent. 146*0b57cec5SDimitry Andric MachineMemOperand::MOVolatile | MachineMemOperand::MOLoad | 147*0b57cec5SDimitry Andric MachineMemOperand::MOStore, 148*0b57cec5SDimitry Andric 4, 4, AAMDNodes(), nullptr, SyncScope::System, 149*0b57cec5SDimitry Andric AtomicOrdering::SequentiallyConsistent); 150*0b57cec5SDimitry Andric MachineSDNode *Const0 = 151*0b57cec5SDimitry Andric CurDAG->getMachineNode(WebAssembly::CONST_I32, DL, MVT::i32, Zero); 152*0b57cec5SDimitry Andric MachineSDNode *AtomicRMW = CurDAG->getMachineNode( 153*0b57cec5SDimitry Andric WebAssembly::ATOMIC_RMW_OR_I32, // opcode 154*0b57cec5SDimitry Andric DL, // debug loc 155*0b57cec5SDimitry Andric MVT::i32, // result type 156*0b57cec5SDimitry Andric MVT::Other, // outchain type 157*0b57cec5SDimitry Andric { 158*0b57cec5SDimitry Andric Zero, // alignment 159*0b57cec5SDimitry Andric Zero, // offset 160*0b57cec5SDimitry Andric SDValue(GetGlobal, 0), // __stack_pointer 161*0b57cec5SDimitry Andric SDValue(Const0, 0), // OR with 0 to make it idempotent 162*0b57cec5SDimitry Andric Node->getOperand(0) // inchain 163*0b57cec5SDimitry Andric }); 164*0b57cec5SDimitry Andric 165*0b57cec5SDimitry Andric CurDAG->setNodeMemRefs(AtomicRMW, {MMO}); 166*0b57cec5SDimitry Andric ReplaceUses(SDValue(Node, 0), SDValue(AtomicRMW, 1)); 167*0b57cec5SDimitry Andric CurDAG->RemoveDeadNode(Node); 168*0b57cec5SDimitry Andric return; 169*0b57cec5SDimitry Andric } 170*0b57cec5SDimitry Andric default: 171*0b57cec5SDimitry Andric llvm_unreachable("Unknown scope!"); 172*0b57cec5SDimitry Andric } 173*0b57cec5SDimitry Andric } 174*0b57cec5SDimitry Andric 175*0b57cec5SDimitry Andric case ISD::GlobalTLSAddress: { 176*0b57cec5SDimitry Andric const auto *GA = cast<GlobalAddressSDNode>(Node); 177*0b57cec5SDimitry Andric 178*0b57cec5SDimitry Andric if (!MF.getSubtarget<WebAssemblySubtarget>().hasBulkMemory()) 179*0b57cec5SDimitry Andric report_fatal_error("cannot use thread-local storage without bulk memory", 180*0b57cec5SDimitry Andric false); 181*0b57cec5SDimitry Andric 182*0b57cec5SDimitry Andric // Currently Emscripten does not support dynamic linking with threads. 183*0b57cec5SDimitry Andric // Therefore, if we have thread-local storage, only the local-exec model 184*0b57cec5SDimitry Andric // is possible. 185*0b57cec5SDimitry Andric // TODO: remove this and implement proper TLS models once Emscripten 186*0b57cec5SDimitry Andric // supports dynamic linking with threads. 187*0b57cec5SDimitry Andric if (GA->getGlobal()->getThreadLocalMode() != 188*0b57cec5SDimitry Andric GlobalValue::LocalExecTLSModel && 189*0b57cec5SDimitry Andric !Subtarget->getTargetTriple().isOSEmscripten()) { 190*0b57cec5SDimitry Andric report_fatal_error("only -ftls-model=local-exec is supported for now on " 191*0b57cec5SDimitry Andric "non-Emscripten OSes: variable " + 192*0b57cec5SDimitry Andric GA->getGlobal()->getName(), 193*0b57cec5SDimitry Andric false); 194*0b57cec5SDimitry Andric } 195*0b57cec5SDimitry Andric 196*0b57cec5SDimitry Andric MVT PtrVT = TLI->getPointerTy(CurDAG->getDataLayout()); 197*0b57cec5SDimitry Andric assert(PtrVT == MVT::i32 && "only wasm32 is supported for now"); 198*0b57cec5SDimitry Andric 199*0b57cec5SDimitry Andric SDValue TLSBaseSym = CurDAG->getTargetExternalSymbol("__tls_base", PtrVT); 200*0b57cec5SDimitry Andric SDValue TLSOffsetSym = CurDAG->getTargetGlobalAddress( 201*0b57cec5SDimitry Andric GA->getGlobal(), DL, PtrVT, GA->getOffset(), 0); 202*0b57cec5SDimitry Andric 203*0b57cec5SDimitry Andric MachineSDNode *TLSBase = CurDAG->getMachineNode(WebAssembly::GLOBAL_GET_I32, 204*0b57cec5SDimitry Andric DL, MVT::i32, TLSBaseSym); 205*0b57cec5SDimitry Andric MachineSDNode *TLSOffset = CurDAG->getMachineNode( 206*0b57cec5SDimitry Andric WebAssembly::CONST_I32, DL, MVT::i32, TLSOffsetSym); 207*0b57cec5SDimitry Andric MachineSDNode *TLSAddress = 208*0b57cec5SDimitry Andric CurDAG->getMachineNode(WebAssembly::ADD_I32, DL, MVT::i32, 209*0b57cec5SDimitry Andric SDValue(TLSBase, 0), SDValue(TLSOffset, 0)); 210*0b57cec5SDimitry Andric ReplaceNode(Node, TLSAddress); 211*0b57cec5SDimitry Andric return; 212*0b57cec5SDimitry Andric } 213*0b57cec5SDimitry Andric 214*0b57cec5SDimitry Andric case ISD::INTRINSIC_WO_CHAIN: { 215*0b57cec5SDimitry Andric unsigned IntNo = cast<ConstantSDNode>(Node->getOperand(0))->getZExtValue(); 216*0b57cec5SDimitry Andric switch (IntNo) { 217*0b57cec5SDimitry Andric case Intrinsic::wasm_tls_size: { 218*0b57cec5SDimitry Andric MVT PtrVT = TLI->getPointerTy(CurDAG->getDataLayout()); 219*0b57cec5SDimitry Andric assert(PtrVT == MVT::i32 && "only wasm32 is supported for now"); 220*0b57cec5SDimitry Andric 221*0b57cec5SDimitry Andric MachineSDNode *TLSSize = CurDAG->getMachineNode( 222*0b57cec5SDimitry Andric WebAssembly::GLOBAL_GET_I32, DL, PtrVT, 223*0b57cec5SDimitry Andric CurDAG->getTargetExternalSymbol("__tls_size", MVT::i32)); 224*0b57cec5SDimitry Andric ReplaceNode(Node, TLSSize); 225*0b57cec5SDimitry Andric return; 226*0b57cec5SDimitry Andric } 227*0b57cec5SDimitry Andric } 228*0b57cec5SDimitry Andric break; 229*0b57cec5SDimitry Andric } 230*0b57cec5SDimitry Andric 231*0b57cec5SDimitry Andric default: 232*0b57cec5SDimitry Andric break; 233*0b57cec5SDimitry Andric } 234*0b57cec5SDimitry Andric 235*0b57cec5SDimitry Andric // Select the default instruction. 236*0b57cec5SDimitry Andric SelectCode(Node); 237*0b57cec5SDimitry Andric } 238*0b57cec5SDimitry Andric 239*0b57cec5SDimitry Andric bool WebAssemblyDAGToDAGISel::SelectInlineAsmMemoryOperand( 240*0b57cec5SDimitry Andric const SDValue &Op, unsigned ConstraintID, std::vector<SDValue> &OutOps) { 241*0b57cec5SDimitry Andric switch (ConstraintID) { 242*0b57cec5SDimitry Andric case InlineAsm::Constraint_i: 243*0b57cec5SDimitry Andric case InlineAsm::Constraint_m: 244*0b57cec5SDimitry Andric // We just support simple memory operands that just have a single address 245*0b57cec5SDimitry Andric // operand and need no special handling. 246*0b57cec5SDimitry Andric OutOps.push_back(Op); 247*0b57cec5SDimitry Andric return false; 248*0b57cec5SDimitry Andric default: 249*0b57cec5SDimitry Andric break; 250*0b57cec5SDimitry Andric } 251*0b57cec5SDimitry Andric 252*0b57cec5SDimitry Andric return true; 253*0b57cec5SDimitry Andric } 254*0b57cec5SDimitry Andric 255*0b57cec5SDimitry Andric /// This pass converts a legalized DAG into a WebAssembly-specific DAG, ready 256*0b57cec5SDimitry Andric /// for instruction scheduling. 257*0b57cec5SDimitry Andric FunctionPass *llvm::createWebAssemblyISelDag(WebAssemblyTargetMachine &TM, 258*0b57cec5SDimitry Andric CodeGenOpt::Level OptLevel) { 259*0b57cec5SDimitry Andric return new WebAssemblyDAGToDAGISel(TM, OptLevel); 260*0b57cec5SDimitry Andric } 261