xref: /freebsd/contrib/llvm-project/llvm/lib/Target/AMDGPU/AMDGPUMCInstLower.cpp (revision e8d8bef961a50d4dc22501cde4fb9fb0be1b2532)
10b57cec5SDimitry Andric //===- AMDGPUMCInstLower.cpp - Lower AMDGPU MachineInstr to an MCInst -----===//
20b57cec5SDimitry Andric //
30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information.
50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
60b57cec5SDimitry Andric //
70b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
80b57cec5SDimitry Andric //
90b57cec5SDimitry Andric /// \file
100b57cec5SDimitry Andric /// Code to lower AMDGPU MachineInstrs to their corresponding MCInst.
110b57cec5SDimitry Andric //
120b57cec5SDimitry Andric //===----------------------------------------------------------------------===//
130b57cec5SDimitry Andric //
140b57cec5SDimitry Andric 
150b57cec5SDimitry Andric #include "AMDGPUAsmPrinter.h"
160b57cec5SDimitry Andric #include "AMDGPUTargetMachine.h"
170b57cec5SDimitry Andric #include "MCTargetDesc/AMDGPUInstPrinter.h"
180b57cec5SDimitry Andric #include "MCTargetDesc/AMDGPUMCTargetDesc.h"
190b57cec5SDimitry Andric #include "R600AsmPrinter.h"
200b57cec5SDimitry Andric #include "llvm/CodeGen/MachineBasicBlock.h"
210b57cec5SDimitry Andric #include "llvm/CodeGen/MachineInstr.h"
220b57cec5SDimitry Andric #include "llvm/IR/Constants.h"
230b57cec5SDimitry Andric #include "llvm/IR/Function.h"
240b57cec5SDimitry Andric #include "llvm/IR/GlobalVariable.h"
250b57cec5SDimitry Andric #include "llvm/MC/MCCodeEmitter.h"
260b57cec5SDimitry Andric #include "llvm/MC/MCContext.h"
270b57cec5SDimitry Andric #include "llvm/MC/MCExpr.h"
280b57cec5SDimitry Andric #include "llvm/MC/MCInst.h"
290b57cec5SDimitry Andric #include "llvm/MC/MCObjectStreamer.h"
300b57cec5SDimitry Andric #include "llvm/MC/MCStreamer.h"
310b57cec5SDimitry Andric #include "llvm/Support/ErrorHandling.h"
320b57cec5SDimitry Andric #include "llvm/Support/Format.h"
330b57cec5SDimitry Andric #include <algorithm>
340b57cec5SDimitry Andric 
350b57cec5SDimitry Andric using namespace llvm;
360b57cec5SDimitry Andric 
370b57cec5SDimitry Andric namespace {
380b57cec5SDimitry Andric 
390b57cec5SDimitry Andric class AMDGPUMCInstLower {
400b57cec5SDimitry Andric   MCContext &Ctx;
410b57cec5SDimitry Andric   const TargetSubtargetInfo &ST;
420b57cec5SDimitry Andric   const AsmPrinter &AP;
430b57cec5SDimitry Andric 
440b57cec5SDimitry Andric   const MCExpr *getLongBranchBlockExpr(const MachineBasicBlock &SrcBB,
450b57cec5SDimitry Andric                                        const MachineOperand &MO) const;
460b57cec5SDimitry Andric 
470b57cec5SDimitry Andric public:
480b57cec5SDimitry Andric   AMDGPUMCInstLower(MCContext &ctx, const TargetSubtargetInfo &ST,
490b57cec5SDimitry Andric                     const AsmPrinter &AP);
500b57cec5SDimitry Andric 
510b57cec5SDimitry Andric   bool lowerOperand(const MachineOperand &MO, MCOperand &MCOp) const;
520b57cec5SDimitry Andric 
530b57cec5SDimitry Andric   /// Lower a MachineInstr to an MCInst
540b57cec5SDimitry Andric   void lower(const MachineInstr *MI, MCInst &OutMI) const;
550b57cec5SDimitry Andric 
560b57cec5SDimitry Andric };
570b57cec5SDimitry Andric 
580b57cec5SDimitry Andric class R600MCInstLower : public AMDGPUMCInstLower {
590b57cec5SDimitry Andric public:
600b57cec5SDimitry Andric   R600MCInstLower(MCContext &ctx, const R600Subtarget &ST,
610b57cec5SDimitry Andric                   const AsmPrinter &AP);
620b57cec5SDimitry Andric 
630b57cec5SDimitry Andric   /// Lower a MachineInstr to an MCInst
640b57cec5SDimitry Andric   void lower(const MachineInstr *MI, MCInst &OutMI) const;
650b57cec5SDimitry Andric };
660b57cec5SDimitry Andric 
670b57cec5SDimitry Andric 
680b57cec5SDimitry Andric } // End anonymous namespace
690b57cec5SDimitry Andric 
700b57cec5SDimitry Andric #include "AMDGPUGenMCPseudoLowering.inc"
710b57cec5SDimitry Andric 
720b57cec5SDimitry Andric AMDGPUMCInstLower::AMDGPUMCInstLower(MCContext &ctx,
730b57cec5SDimitry Andric                                      const TargetSubtargetInfo &st,
740b57cec5SDimitry Andric                                      const AsmPrinter &ap):
750b57cec5SDimitry Andric   Ctx(ctx), ST(st), AP(ap) { }
760b57cec5SDimitry Andric 
770b57cec5SDimitry Andric static MCSymbolRefExpr::VariantKind getVariantKind(unsigned MOFlags) {
780b57cec5SDimitry Andric   switch (MOFlags) {
790b57cec5SDimitry Andric   default:
800b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_None;
810b57cec5SDimitry Andric   case SIInstrInfo::MO_GOTPCREL:
820b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_GOTPCREL;
830b57cec5SDimitry Andric   case SIInstrInfo::MO_GOTPCREL32_LO:
840b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_AMDGPU_GOTPCREL32_LO;
850b57cec5SDimitry Andric   case SIInstrInfo::MO_GOTPCREL32_HI:
860b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_AMDGPU_GOTPCREL32_HI;
870b57cec5SDimitry Andric   case SIInstrInfo::MO_REL32_LO:
880b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_AMDGPU_REL32_LO;
890b57cec5SDimitry Andric   case SIInstrInfo::MO_REL32_HI:
900b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_AMDGPU_REL32_HI;
910b57cec5SDimitry Andric   case SIInstrInfo::MO_ABS32_LO:
920b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_AMDGPU_ABS32_LO;
930b57cec5SDimitry Andric   case SIInstrInfo::MO_ABS32_HI:
940b57cec5SDimitry Andric     return MCSymbolRefExpr::VK_AMDGPU_ABS32_HI;
950b57cec5SDimitry Andric   }
960b57cec5SDimitry Andric }
970b57cec5SDimitry Andric 
980b57cec5SDimitry Andric const MCExpr *AMDGPUMCInstLower::getLongBranchBlockExpr(
990b57cec5SDimitry Andric   const MachineBasicBlock &SrcBB,
1000b57cec5SDimitry Andric   const MachineOperand &MO) const {
1010b57cec5SDimitry Andric   const MCExpr *DestBBSym
1020b57cec5SDimitry Andric     = MCSymbolRefExpr::create(MO.getMBB()->getSymbol(), Ctx);
1030b57cec5SDimitry Andric   const MCExpr *SrcBBSym = MCSymbolRefExpr::create(SrcBB.getSymbol(), Ctx);
1040b57cec5SDimitry Andric 
1050b57cec5SDimitry Andric   // FIXME: The first half of this assert should be removed. This should
1060b57cec5SDimitry Andric   // probably be PC relative instead of using the source block symbol, and
1070b57cec5SDimitry Andric   // therefore the indirect branch expansion should use a bundle.
1080b57cec5SDimitry Andric   assert(
1090b57cec5SDimitry Andric       skipDebugInstructionsForward(SrcBB.begin(), SrcBB.end())->getOpcode() ==
1100b57cec5SDimitry Andric           AMDGPU::S_GETPC_B64 &&
1110b57cec5SDimitry Andric       ST.getInstrInfo()->get(AMDGPU::S_GETPC_B64).Size == 4);
1120b57cec5SDimitry Andric 
1130b57cec5SDimitry Andric   // s_getpc_b64 returns the address of next instruction.
1140b57cec5SDimitry Andric   const MCConstantExpr *One = MCConstantExpr::create(4, Ctx);
1150b57cec5SDimitry Andric   SrcBBSym = MCBinaryExpr::createAdd(SrcBBSym, One, Ctx);
1160b57cec5SDimitry Andric 
1170b57cec5SDimitry Andric   if (MO.getTargetFlags() == SIInstrInfo::MO_LONG_BRANCH_FORWARD)
1180b57cec5SDimitry Andric     return MCBinaryExpr::createSub(DestBBSym, SrcBBSym, Ctx);
1190b57cec5SDimitry Andric 
1200b57cec5SDimitry Andric   assert(MO.getTargetFlags() == SIInstrInfo::MO_LONG_BRANCH_BACKWARD);
1210b57cec5SDimitry Andric   return MCBinaryExpr::createSub(SrcBBSym, DestBBSym, Ctx);
1220b57cec5SDimitry Andric }
1230b57cec5SDimitry Andric 
1240b57cec5SDimitry Andric bool AMDGPUMCInstLower::lowerOperand(const MachineOperand &MO,
1250b57cec5SDimitry Andric                                      MCOperand &MCOp) const {
1260b57cec5SDimitry Andric   switch (MO.getType()) {
1270b57cec5SDimitry Andric   default:
1280b57cec5SDimitry Andric     llvm_unreachable("unknown operand type");
1290b57cec5SDimitry Andric   case MachineOperand::MO_Immediate:
1300b57cec5SDimitry Andric     MCOp = MCOperand::createImm(MO.getImm());
1310b57cec5SDimitry Andric     return true;
1320b57cec5SDimitry Andric   case MachineOperand::MO_Register:
1330b57cec5SDimitry Andric     MCOp = MCOperand::createReg(AMDGPU::getMCReg(MO.getReg(), ST));
1340b57cec5SDimitry Andric     return true;
1350b57cec5SDimitry Andric   case MachineOperand::MO_MachineBasicBlock: {
1360b57cec5SDimitry Andric     if (MO.getTargetFlags() != 0) {
1370b57cec5SDimitry Andric       MCOp = MCOperand::createExpr(
1380b57cec5SDimitry Andric         getLongBranchBlockExpr(*MO.getParent()->getParent(), MO));
1390b57cec5SDimitry Andric     } else {
1400b57cec5SDimitry Andric       MCOp = MCOperand::createExpr(
1410b57cec5SDimitry Andric         MCSymbolRefExpr::create(MO.getMBB()->getSymbol(), Ctx));
1420b57cec5SDimitry Andric     }
1430b57cec5SDimitry Andric 
1440b57cec5SDimitry Andric     return true;
1450b57cec5SDimitry Andric   }
1460b57cec5SDimitry Andric   case MachineOperand::MO_GlobalAddress: {
1470b57cec5SDimitry Andric     const GlobalValue *GV = MO.getGlobal();
1480b57cec5SDimitry Andric     SmallString<128> SymbolName;
1490b57cec5SDimitry Andric     AP.getNameWithPrefix(SymbolName, GV);
1500b57cec5SDimitry Andric     MCSymbol *Sym = Ctx.getOrCreateSymbol(SymbolName);
1510b57cec5SDimitry Andric     const MCExpr *Expr =
1520b57cec5SDimitry Andric       MCSymbolRefExpr::create(Sym, getVariantKind(MO.getTargetFlags()),Ctx);
1530b57cec5SDimitry Andric     int64_t Offset = MO.getOffset();
1540b57cec5SDimitry Andric     if (Offset != 0) {
1550b57cec5SDimitry Andric       Expr = MCBinaryExpr::createAdd(Expr,
1560b57cec5SDimitry Andric                                      MCConstantExpr::create(Offset, Ctx), Ctx);
1570b57cec5SDimitry Andric     }
1580b57cec5SDimitry Andric     MCOp = MCOperand::createExpr(Expr);
1590b57cec5SDimitry Andric     return true;
1600b57cec5SDimitry Andric   }
1610b57cec5SDimitry Andric   case MachineOperand::MO_ExternalSymbol: {
1620b57cec5SDimitry Andric     MCSymbol *Sym = Ctx.getOrCreateSymbol(StringRef(MO.getSymbolName()));
1630b57cec5SDimitry Andric     Sym->setExternal(true);
1640b57cec5SDimitry Andric     const MCSymbolRefExpr *Expr = MCSymbolRefExpr::create(Sym, Ctx);
1650b57cec5SDimitry Andric     MCOp = MCOperand::createExpr(Expr);
1660b57cec5SDimitry Andric     return true;
1670b57cec5SDimitry Andric   }
1680b57cec5SDimitry Andric   case MachineOperand::MO_RegisterMask:
1690b57cec5SDimitry Andric     // Regmasks are like implicit defs.
1700b57cec5SDimitry Andric     return false;
1710b57cec5SDimitry Andric   }
1720b57cec5SDimitry Andric }
1730b57cec5SDimitry Andric 
1740b57cec5SDimitry Andric void AMDGPUMCInstLower::lower(const MachineInstr *MI, MCInst &OutMI) const {
1750b57cec5SDimitry Andric   unsigned Opcode = MI->getOpcode();
1760b57cec5SDimitry Andric   const auto *TII = static_cast<const SIInstrInfo*>(ST.getInstrInfo());
1770b57cec5SDimitry Andric 
1780b57cec5SDimitry Andric   // FIXME: Should be able to handle this with emitPseudoExpansionLowering. We
1790b57cec5SDimitry Andric   // need to select it to the subtarget specific version, and there's no way to
1800b57cec5SDimitry Andric   // do that with a single pseudo source operation.
1810b57cec5SDimitry Andric   if (Opcode == AMDGPU::S_SETPC_B64_return)
1820b57cec5SDimitry Andric     Opcode = AMDGPU::S_SETPC_B64;
1830b57cec5SDimitry Andric   else if (Opcode == AMDGPU::SI_CALL) {
1840b57cec5SDimitry Andric     // SI_CALL is just S_SWAPPC_B64 with an additional operand to track the
1850b57cec5SDimitry Andric     // called function (which we need to remove here).
1860b57cec5SDimitry Andric     OutMI.setOpcode(TII->pseudoToMCOpcode(AMDGPU::S_SWAPPC_B64));
1870b57cec5SDimitry Andric     MCOperand Dest, Src;
1880b57cec5SDimitry Andric     lowerOperand(MI->getOperand(0), Dest);
1890b57cec5SDimitry Andric     lowerOperand(MI->getOperand(1), Src);
1900b57cec5SDimitry Andric     OutMI.addOperand(Dest);
1910b57cec5SDimitry Andric     OutMI.addOperand(Src);
1920b57cec5SDimitry Andric     return;
1930b57cec5SDimitry Andric   } else if (Opcode == AMDGPU::SI_TCRETURN) {
1940b57cec5SDimitry Andric     // TODO: How to use branch immediate and avoid register+add?
1950b57cec5SDimitry Andric     Opcode = AMDGPU::S_SETPC_B64;
1960b57cec5SDimitry Andric   }
1970b57cec5SDimitry Andric 
1980b57cec5SDimitry Andric   int MCOpcode = TII->pseudoToMCOpcode(Opcode);
1990b57cec5SDimitry Andric   if (MCOpcode == -1) {
2000b57cec5SDimitry Andric     LLVMContext &C = MI->getParent()->getParent()->getFunction().getContext();
2010b57cec5SDimitry Andric     C.emitError("AMDGPUMCInstLower::lower - Pseudo instruction doesn't have "
2020b57cec5SDimitry Andric                 "a target-specific version: " + Twine(MI->getOpcode()));
2030b57cec5SDimitry Andric   }
2040b57cec5SDimitry Andric 
2050b57cec5SDimitry Andric   OutMI.setOpcode(MCOpcode);
2060b57cec5SDimitry Andric 
2070b57cec5SDimitry Andric   for (const MachineOperand &MO : MI->explicit_operands()) {
2080b57cec5SDimitry Andric     MCOperand MCOp;
2090b57cec5SDimitry Andric     lowerOperand(MO, MCOp);
2100b57cec5SDimitry Andric     OutMI.addOperand(MCOp);
2110b57cec5SDimitry Andric   }
2128bcb0991SDimitry Andric 
2138bcb0991SDimitry Andric   int FIIdx = AMDGPU::getNamedOperandIdx(MCOpcode, AMDGPU::OpName::fi);
2148bcb0991SDimitry Andric   if (FIIdx >= (int)OutMI.getNumOperands())
2158bcb0991SDimitry Andric     OutMI.addOperand(MCOperand::createImm(0));
2160b57cec5SDimitry Andric }
2170b57cec5SDimitry Andric 
2180b57cec5SDimitry Andric bool AMDGPUAsmPrinter::lowerOperand(const MachineOperand &MO,
2190b57cec5SDimitry Andric                                     MCOperand &MCOp) const {
2200b57cec5SDimitry Andric   const GCNSubtarget &STI = MF->getSubtarget<GCNSubtarget>();
2210b57cec5SDimitry Andric   AMDGPUMCInstLower MCInstLowering(OutContext, STI, *this);
2220b57cec5SDimitry Andric   return MCInstLowering.lowerOperand(MO, MCOp);
2230b57cec5SDimitry Andric }
2240b57cec5SDimitry Andric 
2250b57cec5SDimitry Andric static const MCExpr *lowerAddrSpaceCast(const TargetMachine &TM,
2260b57cec5SDimitry Andric                                         const Constant *CV,
2270b57cec5SDimitry Andric                                         MCContext &OutContext) {
2280b57cec5SDimitry Andric   // TargetMachine does not support llvm-style cast. Use C++-style cast.
2290b57cec5SDimitry Andric   // This is safe since TM is always of type AMDGPUTargetMachine or its
2300b57cec5SDimitry Andric   // derived class.
2310b57cec5SDimitry Andric   auto &AT = static_cast<const AMDGPUTargetMachine&>(TM);
2320b57cec5SDimitry Andric   auto *CE = dyn_cast<ConstantExpr>(CV);
2330b57cec5SDimitry Andric 
2340b57cec5SDimitry Andric   // Lower null pointers in private and local address space.
2350b57cec5SDimitry Andric   // Clang generates addrspacecast for null pointers in private and local
2360b57cec5SDimitry Andric   // address space, which needs to be lowered.
2370b57cec5SDimitry Andric   if (CE && CE->getOpcode() == Instruction::AddrSpaceCast) {
2380b57cec5SDimitry Andric     auto Op = CE->getOperand(0);
2390b57cec5SDimitry Andric     auto SrcAddr = Op->getType()->getPointerAddressSpace();
2400b57cec5SDimitry Andric     if (Op->isNullValue() && AT.getNullPointerValue(SrcAddr) == 0) {
2410b57cec5SDimitry Andric       auto DstAddr = CE->getType()->getPointerAddressSpace();
2420b57cec5SDimitry Andric       return MCConstantExpr::create(AT.getNullPointerValue(DstAddr),
2430b57cec5SDimitry Andric         OutContext);
2440b57cec5SDimitry Andric     }
2450b57cec5SDimitry Andric   }
2460b57cec5SDimitry Andric   return nullptr;
2470b57cec5SDimitry Andric }
2480b57cec5SDimitry Andric 
2490b57cec5SDimitry Andric const MCExpr *AMDGPUAsmPrinter::lowerConstant(const Constant *CV) {
2500b57cec5SDimitry Andric   if (const MCExpr *E = lowerAddrSpaceCast(TM, CV, OutContext))
2510b57cec5SDimitry Andric     return E;
2520b57cec5SDimitry Andric   return AsmPrinter::lowerConstant(CV);
2530b57cec5SDimitry Andric }
2540b57cec5SDimitry Andric 
2555ffd83dbSDimitry Andric void AMDGPUAsmPrinter::emitInstruction(const MachineInstr *MI) {
2560b57cec5SDimitry Andric   if (emitPseudoExpansionLowering(*OutStreamer, MI))
2570b57cec5SDimitry Andric     return;
2580b57cec5SDimitry Andric 
2590b57cec5SDimitry Andric   const GCNSubtarget &STI = MF->getSubtarget<GCNSubtarget>();
2600b57cec5SDimitry Andric   AMDGPUMCInstLower MCInstLowering(OutContext, STI, *this);
2610b57cec5SDimitry Andric 
2620b57cec5SDimitry Andric   StringRef Err;
2630b57cec5SDimitry Andric   if (!STI.getInstrInfo()->verifyInstruction(*MI, Err)) {
2640b57cec5SDimitry Andric     LLVMContext &C = MI->getParent()->getParent()->getFunction().getContext();
2650b57cec5SDimitry Andric     C.emitError("Illegal instruction detected: " + Err);
2660b57cec5SDimitry Andric     MI->print(errs());
2670b57cec5SDimitry Andric   }
2680b57cec5SDimitry Andric 
2690b57cec5SDimitry Andric   if (MI->isBundle()) {
2700b57cec5SDimitry Andric     const MachineBasicBlock *MBB = MI->getParent();
2710b57cec5SDimitry Andric     MachineBasicBlock::const_instr_iterator I = ++MI->getIterator();
2720b57cec5SDimitry Andric     while (I != MBB->instr_end() && I->isInsideBundle()) {
2735ffd83dbSDimitry Andric       emitInstruction(&*I);
2740b57cec5SDimitry Andric       ++I;
2750b57cec5SDimitry Andric     }
2760b57cec5SDimitry Andric   } else {
2770b57cec5SDimitry Andric     // We don't want SI_MASK_BRANCH/SI_RETURN_TO_EPILOG encoded. They are
2780b57cec5SDimitry Andric     // placeholder terminator instructions and should only be printed as
2790b57cec5SDimitry Andric     // comments.
2800b57cec5SDimitry Andric     if (MI->getOpcode() == AMDGPU::SI_MASK_BRANCH) {
2810b57cec5SDimitry Andric       if (isVerbose()) {
2820b57cec5SDimitry Andric         SmallVector<char, 16> BBStr;
2830b57cec5SDimitry Andric         raw_svector_ostream Str(BBStr);
2840b57cec5SDimitry Andric 
2850b57cec5SDimitry Andric         const MachineBasicBlock *MBB = MI->getOperand(0).getMBB();
2860b57cec5SDimitry Andric         const MCSymbolRefExpr *Expr
2870b57cec5SDimitry Andric           = MCSymbolRefExpr::create(MBB->getSymbol(), OutContext);
2880b57cec5SDimitry Andric         Expr->print(Str, MAI);
2890b57cec5SDimitry Andric         OutStreamer->emitRawComment(Twine(" mask branch ") + BBStr);
2900b57cec5SDimitry Andric       }
2910b57cec5SDimitry Andric 
2920b57cec5SDimitry Andric       return;
2930b57cec5SDimitry Andric     }
2940b57cec5SDimitry Andric 
2950b57cec5SDimitry Andric     if (MI->getOpcode() == AMDGPU::SI_RETURN_TO_EPILOG) {
2960b57cec5SDimitry Andric       if (isVerbose())
2970b57cec5SDimitry Andric         OutStreamer->emitRawComment(" return to shader part epilog");
2980b57cec5SDimitry Andric       return;
2990b57cec5SDimitry Andric     }
3000b57cec5SDimitry Andric 
3010b57cec5SDimitry Andric     if (MI->getOpcode() == AMDGPU::WAVE_BARRIER) {
3020b57cec5SDimitry Andric       if (isVerbose())
3030b57cec5SDimitry Andric         OutStreamer->emitRawComment(" wave barrier");
3040b57cec5SDimitry Andric       return;
3050b57cec5SDimitry Andric     }
3060b57cec5SDimitry Andric 
3070b57cec5SDimitry Andric     if (MI->getOpcode() == AMDGPU::SI_MASKED_UNREACHABLE) {
3080b57cec5SDimitry Andric       if (isVerbose())
3090b57cec5SDimitry Andric         OutStreamer->emitRawComment(" divergent unreachable");
3100b57cec5SDimitry Andric       return;
3110b57cec5SDimitry Andric     }
3120b57cec5SDimitry Andric 
3130b57cec5SDimitry Andric     MCInst TmpInst;
3140b57cec5SDimitry Andric     MCInstLowering.lower(MI, TmpInst);
3150b57cec5SDimitry Andric     EmitToStreamer(*OutStreamer, TmpInst);
3160b57cec5SDimitry Andric 
3170b57cec5SDimitry Andric #ifdef EXPENSIVE_CHECKS
3180b57cec5SDimitry Andric     // Sanity-check getInstSizeInBytes on explicitly specified CPUs (it cannot
3190b57cec5SDimitry Andric     // work correctly for the generic CPU).
3200b57cec5SDimitry Andric     //
3210b57cec5SDimitry Andric     // The isPseudo check really shouldn't be here, but unfortunately there are
3220b57cec5SDimitry Andric     // some negative lit tests that depend on being able to continue through
3230b57cec5SDimitry Andric     // here even when pseudo instructions haven't been lowered.
324*e8d8bef9SDimitry Andric     //
325*e8d8bef9SDimitry Andric     // We also overestimate branch sizes with the offset bug.
326*e8d8bef9SDimitry Andric     if (!MI->isPseudo() && STI.isCPUStringValid(STI.getCPU()) &&
327*e8d8bef9SDimitry Andric         (!STI.hasOffset3fBug() || !MI->isBranch())) {
3280b57cec5SDimitry Andric       SmallVector<MCFixup, 4> Fixups;
3290b57cec5SDimitry Andric       SmallVector<char, 16> CodeBytes;
3300b57cec5SDimitry Andric       raw_svector_ostream CodeStream(CodeBytes);
3310b57cec5SDimitry Andric 
3320b57cec5SDimitry Andric       std::unique_ptr<MCCodeEmitter> InstEmitter(createSIMCCodeEmitter(
3330b57cec5SDimitry Andric           *STI.getInstrInfo(), *OutContext.getRegisterInfo(), OutContext));
3340b57cec5SDimitry Andric       InstEmitter->encodeInstruction(TmpInst, CodeStream, Fixups, STI);
3350b57cec5SDimitry Andric 
3360b57cec5SDimitry Andric       assert(CodeBytes.size() == STI.getInstrInfo()->getInstSizeInBytes(*MI));
3370b57cec5SDimitry Andric     }
3380b57cec5SDimitry Andric #endif
3390b57cec5SDimitry Andric 
3400b57cec5SDimitry Andric     if (DumpCodeInstEmitter) {
3410b57cec5SDimitry Andric       // Disassemble instruction/operands to text
3420b57cec5SDimitry Andric       DisasmLines.resize(DisasmLines.size() + 1);
3430b57cec5SDimitry Andric       std::string &DisasmLine = DisasmLines.back();
3440b57cec5SDimitry Andric       raw_string_ostream DisasmStream(DisasmLine);
3450b57cec5SDimitry Andric 
3460b57cec5SDimitry Andric       AMDGPUInstPrinter InstPrinter(*TM.getMCAsmInfo(), *STI.getInstrInfo(),
3470b57cec5SDimitry Andric                                     *STI.getRegisterInfo());
348480093f4SDimitry Andric       InstPrinter.printInst(&TmpInst, 0, StringRef(), STI, DisasmStream);
3490b57cec5SDimitry Andric 
3500b57cec5SDimitry Andric       // Disassemble instruction/operands to hex representation.
3510b57cec5SDimitry Andric       SmallVector<MCFixup, 4> Fixups;
3520b57cec5SDimitry Andric       SmallVector<char, 16> CodeBytes;
3530b57cec5SDimitry Andric       raw_svector_ostream CodeStream(CodeBytes);
3540b57cec5SDimitry Andric 
3550b57cec5SDimitry Andric       DumpCodeInstEmitter->encodeInstruction(
3560b57cec5SDimitry Andric           TmpInst, CodeStream, Fixups, MF->getSubtarget<MCSubtargetInfo>());
3570b57cec5SDimitry Andric       HexLines.resize(HexLines.size() + 1);
3580b57cec5SDimitry Andric       std::string &HexLine = HexLines.back();
3590b57cec5SDimitry Andric       raw_string_ostream HexStream(HexLine);
3600b57cec5SDimitry Andric 
3610b57cec5SDimitry Andric       for (size_t i = 0; i < CodeBytes.size(); i += 4) {
3620b57cec5SDimitry Andric         unsigned int CodeDWord = *(unsigned int *)&CodeBytes[i];
3630b57cec5SDimitry Andric         HexStream << format("%s%08X", (i > 0 ? " " : ""), CodeDWord);
3640b57cec5SDimitry Andric       }
3650b57cec5SDimitry Andric 
3660b57cec5SDimitry Andric       DisasmStream.flush();
3670b57cec5SDimitry Andric       DisasmLineMaxLen = std::max(DisasmLineMaxLen, DisasmLine.size());
3680b57cec5SDimitry Andric     }
3690b57cec5SDimitry Andric   }
3700b57cec5SDimitry Andric }
3710b57cec5SDimitry Andric 
3720b57cec5SDimitry Andric R600MCInstLower::R600MCInstLower(MCContext &Ctx, const R600Subtarget &ST,
3730b57cec5SDimitry Andric                                  const AsmPrinter &AP) :
3740b57cec5SDimitry Andric         AMDGPUMCInstLower(Ctx, ST, AP) { }
3750b57cec5SDimitry Andric 
3760b57cec5SDimitry Andric void R600MCInstLower::lower(const MachineInstr *MI, MCInst &OutMI) const {
3770b57cec5SDimitry Andric   OutMI.setOpcode(MI->getOpcode());
3780b57cec5SDimitry Andric   for (const MachineOperand &MO : MI->explicit_operands()) {
3790b57cec5SDimitry Andric     MCOperand MCOp;
3800b57cec5SDimitry Andric     lowerOperand(MO, MCOp);
3810b57cec5SDimitry Andric     OutMI.addOperand(MCOp);
3820b57cec5SDimitry Andric   }
3830b57cec5SDimitry Andric }
3840b57cec5SDimitry Andric 
3855ffd83dbSDimitry Andric void R600AsmPrinter::emitInstruction(const MachineInstr *MI) {
3860b57cec5SDimitry Andric   const R600Subtarget &STI = MF->getSubtarget<R600Subtarget>();
3870b57cec5SDimitry Andric   R600MCInstLower MCInstLowering(OutContext, STI, *this);
3880b57cec5SDimitry Andric 
3890b57cec5SDimitry Andric   StringRef Err;
3900b57cec5SDimitry Andric   if (!STI.getInstrInfo()->verifyInstruction(*MI, Err)) {
3910b57cec5SDimitry Andric     LLVMContext &C = MI->getParent()->getParent()->getFunction().getContext();
3920b57cec5SDimitry Andric     C.emitError("Illegal instruction detected: " + Err);
3930b57cec5SDimitry Andric     MI->print(errs());
3940b57cec5SDimitry Andric   }
3950b57cec5SDimitry Andric 
3960b57cec5SDimitry Andric   if (MI->isBundle()) {
3970b57cec5SDimitry Andric     const MachineBasicBlock *MBB = MI->getParent();
3980b57cec5SDimitry Andric     MachineBasicBlock::const_instr_iterator I = ++MI->getIterator();
3990b57cec5SDimitry Andric     while (I != MBB->instr_end() && I->isInsideBundle()) {
4005ffd83dbSDimitry Andric       emitInstruction(&*I);
4010b57cec5SDimitry Andric       ++I;
4020b57cec5SDimitry Andric     }
4030b57cec5SDimitry Andric   } else {
4040b57cec5SDimitry Andric     MCInst TmpInst;
4050b57cec5SDimitry Andric     MCInstLowering.lower(MI, TmpInst);
4060b57cec5SDimitry Andric     EmitToStreamer(*OutStreamer, TmpInst);
4070b57cec5SDimitry Andric  }
4080b57cec5SDimitry Andric }
4090b57cec5SDimitry Andric 
4100b57cec5SDimitry Andric const MCExpr *R600AsmPrinter::lowerConstant(const Constant *CV) {
4110b57cec5SDimitry Andric   if (const MCExpr *E = lowerAddrSpaceCast(TM, CV, OutContext))
4120b57cec5SDimitry Andric     return E;
4130b57cec5SDimitry Andric   return AsmPrinter::lowerConstant(CV);
4140b57cec5SDimitry Andric }
415