1 //===-- RISCVMCCodeEmitter.cpp - Convert RISCV code to machine code -------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements the RISCVMCCodeEmitter class. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "MCTargetDesc/RISCVFixupKinds.h" 14 #include "MCTargetDesc/RISCVMCExpr.h" 15 #include "MCTargetDesc/RISCVMCTargetDesc.h" 16 #include "Utils/RISCVBaseInfo.h" 17 #include "llvm/ADT/Statistic.h" 18 #include "llvm/CodeGen/Register.h" 19 #include "llvm/MC/MCAsmInfo.h" 20 #include "llvm/MC/MCCodeEmitter.h" 21 #include "llvm/MC/MCContext.h" 22 #include "llvm/MC/MCExpr.h" 23 #include "llvm/MC/MCInst.h" 24 #include "llvm/MC/MCInstBuilder.h" 25 #include "llvm/MC/MCInstrInfo.h" 26 #include "llvm/MC/MCRegisterInfo.h" 27 #include "llvm/MC/MCSymbol.h" 28 #include "llvm/Support/Casting.h" 29 #include "llvm/Support/EndianStream.h" 30 #include "llvm/Support/raw_ostream.h" 31 32 using namespace llvm; 33 34 #define DEBUG_TYPE "mccodeemitter" 35 36 STATISTIC(MCNumEmitted, "Number of MC instructions emitted"); 37 STATISTIC(MCNumFixups, "Number of MC fixups created"); 38 39 namespace { 40 class RISCVMCCodeEmitter : public MCCodeEmitter { 41 RISCVMCCodeEmitter(const RISCVMCCodeEmitter &) = delete; 42 void operator=(const RISCVMCCodeEmitter &) = delete; 43 MCContext &Ctx; 44 MCInstrInfo const &MCII; 45 46 public: 47 RISCVMCCodeEmitter(MCContext &ctx, MCInstrInfo const &MCII) 48 : Ctx(ctx), MCII(MCII) {} 49 50 ~RISCVMCCodeEmitter() override {} 51 52 void encodeInstruction(const MCInst &MI, raw_ostream &OS, 53 SmallVectorImpl<MCFixup> &Fixups, 54 const MCSubtargetInfo &STI) const override; 55 56 void expandFunctionCall(const MCInst &MI, raw_ostream &OS, 57 SmallVectorImpl<MCFixup> &Fixups, 58 const MCSubtargetInfo &STI) const; 59 60 void expandAddTPRel(const MCInst &MI, raw_ostream &OS, 61 SmallVectorImpl<MCFixup> &Fixups, 62 const MCSubtargetInfo &STI) const; 63 64 /// TableGen'erated function for getting the binary encoding for an 65 /// instruction. 66 uint64_t getBinaryCodeForInstr(const MCInst &MI, 67 SmallVectorImpl<MCFixup> &Fixups, 68 const MCSubtargetInfo &STI) const; 69 70 /// Return binary encoding of operand. If the machine operand requires 71 /// relocation, record the relocation and return zero. 72 unsigned getMachineOpValue(const MCInst &MI, const MCOperand &MO, 73 SmallVectorImpl<MCFixup> &Fixups, 74 const MCSubtargetInfo &STI) const; 75 76 unsigned getImmOpValueAsr1(const MCInst &MI, unsigned OpNo, 77 SmallVectorImpl<MCFixup> &Fixups, 78 const MCSubtargetInfo &STI) const; 79 80 unsigned getImmOpValue(const MCInst &MI, unsigned OpNo, 81 SmallVectorImpl<MCFixup> &Fixups, 82 const MCSubtargetInfo &STI) const; 83 84 unsigned getVMaskReg(const MCInst &MI, unsigned OpNo, 85 SmallVectorImpl<MCFixup> &Fixups, 86 const MCSubtargetInfo &STI) const; 87 }; 88 } // end anonymous namespace 89 90 MCCodeEmitter *llvm::createRISCVMCCodeEmitter(const MCInstrInfo &MCII, 91 const MCRegisterInfo &MRI, 92 MCContext &Ctx) { 93 return new RISCVMCCodeEmitter(Ctx, MCII); 94 } 95 96 // Expand PseudoCALL(Reg), PseudoTAIL and PseudoJump to AUIPC and JALR with 97 // relocation types. We expand those pseudo-instructions while encoding them, 98 // meaning AUIPC and JALR won't go through RISCV MC to MC compressed 99 // instruction transformation. This is acceptable because AUIPC has no 16-bit 100 // form and C_JALR has no immediate operand field. We let linker relaxation 101 // deal with it. When linker relaxation is enabled, AUIPC and JALR have a 102 // chance to relax to JAL. 103 // If the C extension is enabled, JAL has a chance relax to C_JAL. 104 void RISCVMCCodeEmitter::expandFunctionCall(const MCInst &MI, raw_ostream &OS, 105 SmallVectorImpl<MCFixup> &Fixups, 106 const MCSubtargetInfo &STI) const { 107 MCInst TmpInst; 108 MCOperand Func; 109 Register Ra; 110 if (MI.getOpcode() == RISCV::PseudoTAIL) { 111 Func = MI.getOperand(0); 112 Ra = RISCV::X6; 113 } else if (MI.getOpcode() == RISCV::PseudoCALLReg) { 114 Func = MI.getOperand(1); 115 Ra = MI.getOperand(0).getReg(); 116 } else if (MI.getOpcode() == RISCV::PseudoCALL) { 117 Func = MI.getOperand(0); 118 Ra = RISCV::X1; 119 } else if (MI.getOpcode() == RISCV::PseudoJump) { 120 Func = MI.getOperand(1); 121 Ra = MI.getOperand(0).getReg(); 122 } 123 uint32_t Binary; 124 125 assert(Func.isExpr() && "Expected expression"); 126 127 const MCExpr *CallExpr = Func.getExpr(); 128 129 // Emit AUIPC Ra, Func with R_RISCV_CALL relocation type. 130 TmpInst = MCInstBuilder(RISCV::AUIPC) 131 .addReg(Ra) 132 .addOperand(MCOperand::createExpr(CallExpr)); 133 Binary = getBinaryCodeForInstr(TmpInst, Fixups, STI); 134 support::endian::write(OS, Binary, support::little); 135 136 if (MI.getOpcode() == RISCV::PseudoTAIL || 137 MI.getOpcode() == RISCV::PseudoJump) 138 // Emit JALR X0, Ra, 0 139 TmpInst = MCInstBuilder(RISCV::JALR).addReg(RISCV::X0).addReg(Ra).addImm(0); 140 else 141 // Emit JALR Ra, Ra, 0 142 TmpInst = MCInstBuilder(RISCV::JALR).addReg(Ra).addReg(Ra).addImm(0); 143 Binary = getBinaryCodeForInstr(TmpInst, Fixups, STI); 144 support::endian::write(OS, Binary, support::little); 145 } 146 147 // Expand PseudoAddTPRel to a simple ADD with the correct relocation. 148 void RISCVMCCodeEmitter::expandAddTPRel(const MCInst &MI, raw_ostream &OS, 149 SmallVectorImpl<MCFixup> &Fixups, 150 const MCSubtargetInfo &STI) const { 151 MCOperand DestReg = MI.getOperand(0); 152 MCOperand SrcReg = MI.getOperand(1); 153 MCOperand TPReg = MI.getOperand(2); 154 assert(TPReg.isReg() && TPReg.getReg() == RISCV::X4 && 155 "Expected thread pointer as second input to TP-relative add"); 156 157 MCOperand SrcSymbol = MI.getOperand(3); 158 assert(SrcSymbol.isExpr() && 159 "Expected expression as third input to TP-relative add"); 160 161 const RISCVMCExpr *Expr = dyn_cast<RISCVMCExpr>(SrcSymbol.getExpr()); 162 assert(Expr && Expr->getKind() == RISCVMCExpr::VK_RISCV_TPREL_ADD && 163 "Expected tprel_add relocation on TP-relative symbol"); 164 165 // Emit the correct tprel_add relocation for the symbol. 166 Fixups.push_back(MCFixup::create( 167 0, Expr, MCFixupKind(RISCV::fixup_riscv_tprel_add), MI.getLoc())); 168 169 // Emit fixup_riscv_relax for tprel_add where the relax feature is enabled. 170 if (STI.getFeatureBits()[RISCV::FeatureRelax]) { 171 const MCConstantExpr *Dummy = MCConstantExpr::create(0, Ctx); 172 Fixups.push_back(MCFixup::create( 173 0, Dummy, MCFixupKind(RISCV::fixup_riscv_relax), MI.getLoc())); 174 } 175 176 // Emit a normal ADD instruction with the given operands. 177 MCInst TmpInst = MCInstBuilder(RISCV::ADD) 178 .addOperand(DestReg) 179 .addOperand(SrcReg) 180 .addOperand(TPReg); 181 uint32_t Binary = getBinaryCodeForInstr(TmpInst, Fixups, STI); 182 support::endian::write(OS, Binary, support::little); 183 } 184 185 void RISCVMCCodeEmitter::encodeInstruction(const MCInst &MI, raw_ostream &OS, 186 SmallVectorImpl<MCFixup> &Fixups, 187 const MCSubtargetInfo &STI) const { 188 const MCInstrDesc &Desc = MCII.get(MI.getOpcode()); 189 // Get byte count of instruction. 190 unsigned Size = Desc.getSize(); 191 192 // RISCVInstrInfo::getInstSizeInBytes hard-codes the number of expanded 193 // instructions for each pseudo, and must be updated when adding new pseudos 194 // or changing existing ones. 195 if (MI.getOpcode() == RISCV::PseudoCALLReg || 196 MI.getOpcode() == RISCV::PseudoCALL || 197 MI.getOpcode() == RISCV::PseudoTAIL || 198 MI.getOpcode() == RISCV::PseudoJump) { 199 expandFunctionCall(MI, OS, Fixups, STI); 200 MCNumEmitted += 2; 201 return; 202 } 203 204 if (MI.getOpcode() == RISCV::PseudoAddTPRel) { 205 expandAddTPRel(MI, OS, Fixups, STI); 206 MCNumEmitted += 1; 207 return; 208 } 209 210 switch (Size) { 211 default: 212 llvm_unreachable("Unhandled encodeInstruction length!"); 213 case 2: { 214 uint16_t Bits = getBinaryCodeForInstr(MI, Fixups, STI); 215 support::endian::write<uint16_t>(OS, Bits, support::little); 216 break; 217 } 218 case 4: { 219 uint32_t Bits = getBinaryCodeForInstr(MI, Fixups, STI); 220 support::endian::write(OS, Bits, support::little); 221 break; 222 } 223 } 224 225 ++MCNumEmitted; // Keep track of the # of mi's emitted. 226 } 227 228 unsigned 229 RISCVMCCodeEmitter::getMachineOpValue(const MCInst &MI, const MCOperand &MO, 230 SmallVectorImpl<MCFixup> &Fixups, 231 const MCSubtargetInfo &STI) const { 232 233 if (MO.isReg()) 234 return Ctx.getRegisterInfo()->getEncodingValue(MO.getReg()); 235 236 if (MO.isImm()) 237 return static_cast<unsigned>(MO.getImm()); 238 239 llvm_unreachable("Unhandled expression!"); 240 return 0; 241 } 242 243 unsigned 244 RISCVMCCodeEmitter::getImmOpValueAsr1(const MCInst &MI, unsigned OpNo, 245 SmallVectorImpl<MCFixup> &Fixups, 246 const MCSubtargetInfo &STI) const { 247 const MCOperand &MO = MI.getOperand(OpNo); 248 249 if (MO.isImm()) { 250 unsigned Res = MO.getImm(); 251 assert((Res & 1) == 0 && "LSB is non-zero"); 252 return Res >> 1; 253 } 254 255 return getImmOpValue(MI, OpNo, Fixups, STI); 256 } 257 258 unsigned RISCVMCCodeEmitter::getImmOpValue(const MCInst &MI, unsigned OpNo, 259 SmallVectorImpl<MCFixup> &Fixups, 260 const MCSubtargetInfo &STI) const { 261 bool EnableRelax = STI.getFeatureBits()[RISCV::FeatureRelax]; 262 const MCOperand &MO = MI.getOperand(OpNo); 263 264 MCInstrDesc const &Desc = MCII.get(MI.getOpcode()); 265 unsigned MIFrm = Desc.TSFlags & RISCVII::InstFormatMask; 266 267 // If the destination is an immediate, there is nothing to do. 268 if (MO.isImm()) 269 return MO.getImm(); 270 271 assert(MO.isExpr() && 272 "getImmOpValue expects only expressions or immediates"); 273 const MCExpr *Expr = MO.getExpr(); 274 MCExpr::ExprKind Kind = Expr->getKind(); 275 RISCV::Fixups FixupKind = RISCV::fixup_riscv_invalid; 276 bool RelaxCandidate = false; 277 if (Kind == MCExpr::Target) { 278 const RISCVMCExpr *RVExpr = cast<RISCVMCExpr>(Expr); 279 280 switch (RVExpr->getKind()) { 281 case RISCVMCExpr::VK_RISCV_None: 282 case RISCVMCExpr::VK_RISCV_Invalid: 283 case RISCVMCExpr::VK_RISCV_32_PCREL: 284 llvm_unreachable("Unhandled fixup kind!"); 285 case RISCVMCExpr::VK_RISCV_TPREL_ADD: 286 // tprel_add is only used to indicate that a relocation should be emitted 287 // for an add instruction used in TP-relative addressing. It should not be 288 // expanded as if representing an actual instruction operand and so to 289 // encounter it here is an error. 290 llvm_unreachable( 291 "VK_RISCV_TPREL_ADD should not represent an instruction operand"); 292 case RISCVMCExpr::VK_RISCV_LO: 293 if (MIFrm == RISCVII::InstFormatI) 294 FixupKind = RISCV::fixup_riscv_lo12_i; 295 else if (MIFrm == RISCVII::InstFormatS) 296 FixupKind = RISCV::fixup_riscv_lo12_s; 297 else 298 llvm_unreachable("VK_RISCV_LO used with unexpected instruction format"); 299 RelaxCandidate = true; 300 break; 301 case RISCVMCExpr::VK_RISCV_HI: 302 FixupKind = RISCV::fixup_riscv_hi20; 303 RelaxCandidate = true; 304 break; 305 case RISCVMCExpr::VK_RISCV_PCREL_LO: 306 if (MIFrm == RISCVII::InstFormatI) 307 FixupKind = RISCV::fixup_riscv_pcrel_lo12_i; 308 else if (MIFrm == RISCVII::InstFormatS) 309 FixupKind = RISCV::fixup_riscv_pcrel_lo12_s; 310 else 311 llvm_unreachable( 312 "VK_RISCV_PCREL_LO used with unexpected instruction format"); 313 RelaxCandidate = true; 314 break; 315 case RISCVMCExpr::VK_RISCV_PCREL_HI: 316 FixupKind = RISCV::fixup_riscv_pcrel_hi20; 317 RelaxCandidate = true; 318 break; 319 case RISCVMCExpr::VK_RISCV_GOT_HI: 320 FixupKind = RISCV::fixup_riscv_got_hi20; 321 break; 322 case RISCVMCExpr::VK_RISCV_TPREL_LO: 323 if (MIFrm == RISCVII::InstFormatI) 324 FixupKind = RISCV::fixup_riscv_tprel_lo12_i; 325 else if (MIFrm == RISCVII::InstFormatS) 326 FixupKind = RISCV::fixup_riscv_tprel_lo12_s; 327 else 328 llvm_unreachable( 329 "VK_RISCV_TPREL_LO used with unexpected instruction format"); 330 RelaxCandidate = true; 331 break; 332 case RISCVMCExpr::VK_RISCV_TPREL_HI: 333 FixupKind = RISCV::fixup_riscv_tprel_hi20; 334 RelaxCandidate = true; 335 break; 336 case RISCVMCExpr::VK_RISCV_TLS_GOT_HI: 337 FixupKind = RISCV::fixup_riscv_tls_got_hi20; 338 break; 339 case RISCVMCExpr::VK_RISCV_TLS_GD_HI: 340 FixupKind = RISCV::fixup_riscv_tls_gd_hi20; 341 break; 342 case RISCVMCExpr::VK_RISCV_CALL: 343 FixupKind = RISCV::fixup_riscv_call; 344 RelaxCandidate = true; 345 break; 346 case RISCVMCExpr::VK_RISCV_CALL_PLT: 347 FixupKind = RISCV::fixup_riscv_call_plt; 348 RelaxCandidate = true; 349 break; 350 } 351 } else if (Kind == MCExpr::SymbolRef && 352 cast<MCSymbolRefExpr>(Expr)->getKind() == MCSymbolRefExpr::VK_None) { 353 if (Desc.getOpcode() == RISCV::JAL) { 354 FixupKind = RISCV::fixup_riscv_jal; 355 } else if (MIFrm == RISCVII::InstFormatB) { 356 FixupKind = RISCV::fixup_riscv_branch; 357 } else if (MIFrm == RISCVII::InstFormatCJ) { 358 FixupKind = RISCV::fixup_riscv_rvc_jump; 359 } else if (MIFrm == RISCVII::InstFormatCB) { 360 FixupKind = RISCV::fixup_riscv_rvc_branch; 361 } 362 } 363 364 assert(FixupKind != RISCV::fixup_riscv_invalid && "Unhandled expression!"); 365 366 Fixups.push_back( 367 MCFixup::create(0, Expr, MCFixupKind(FixupKind), MI.getLoc())); 368 ++MCNumFixups; 369 370 // Ensure an R_RISCV_RELAX relocation will be emitted if linker relaxation is 371 // enabled and the current fixup will result in a relocation that may be 372 // relaxed. 373 if (EnableRelax && RelaxCandidate) { 374 const MCConstantExpr *Dummy = MCConstantExpr::create(0, Ctx); 375 Fixups.push_back( 376 MCFixup::create(0, Dummy, MCFixupKind(RISCV::fixup_riscv_relax), 377 MI.getLoc())); 378 ++MCNumFixups; 379 } 380 381 return 0; 382 } 383 384 unsigned RISCVMCCodeEmitter::getVMaskReg(const MCInst &MI, unsigned OpNo, 385 SmallVectorImpl<MCFixup> &Fixups, 386 const MCSubtargetInfo &STI) const { 387 MCOperand MO = MI.getOperand(OpNo); 388 assert(MO.isReg() && "Expected a register."); 389 390 switch (MO.getReg()) { 391 default: 392 llvm_unreachable("Invalid mask register."); 393 case RISCV::V0: 394 return 0; 395 case RISCV::NoRegister: 396 return 1; 397 } 398 } 399 400 #include "RISCVGenMCCodeEmitter.inc" 401