xref: /freebsd/contrib/llvm-project/llvm/lib/Target/RISCV/MCTargetDesc/RISCVMCCodeEmitter.cpp (revision d5e3895ea4fe4ef9db8823774e07b4368180a23e)
1 //===-- RISCVMCCodeEmitter.cpp - Convert RISCV code to machine code -------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements the RISCVMCCodeEmitter class.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "MCTargetDesc/RISCVFixupKinds.h"
14 #include "MCTargetDesc/RISCVMCExpr.h"
15 #include "MCTargetDesc/RISCVMCTargetDesc.h"
16 #include "Utils/RISCVBaseInfo.h"
17 #include "llvm/ADT/Statistic.h"
18 #include "llvm/CodeGen/Register.h"
19 #include "llvm/MC/MCAsmInfo.h"
20 #include "llvm/MC/MCCodeEmitter.h"
21 #include "llvm/MC/MCContext.h"
22 #include "llvm/MC/MCExpr.h"
23 #include "llvm/MC/MCInst.h"
24 #include "llvm/MC/MCInstBuilder.h"
25 #include "llvm/MC/MCInstrInfo.h"
26 #include "llvm/MC/MCRegisterInfo.h"
27 #include "llvm/MC/MCSymbol.h"
28 #include "llvm/Support/Casting.h"
29 #include "llvm/Support/EndianStream.h"
30 #include "llvm/Support/raw_ostream.h"
31 
32 using namespace llvm;
33 
34 #define DEBUG_TYPE "mccodeemitter"
35 
36 STATISTIC(MCNumEmitted, "Number of MC instructions emitted");
37 STATISTIC(MCNumFixups, "Number of MC fixups created");
38 
39 namespace {
40 class RISCVMCCodeEmitter : public MCCodeEmitter {
41   RISCVMCCodeEmitter(const RISCVMCCodeEmitter &) = delete;
42   void operator=(const RISCVMCCodeEmitter &) = delete;
43   MCContext &Ctx;
44   MCInstrInfo const &MCII;
45 
46 public:
47   RISCVMCCodeEmitter(MCContext &ctx, MCInstrInfo const &MCII)
48       : Ctx(ctx), MCII(MCII) {}
49 
50   ~RISCVMCCodeEmitter() override {}
51 
52   void encodeInstruction(const MCInst &MI, raw_ostream &OS,
53                          SmallVectorImpl<MCFixup> &Fixups,
54                          const MCSubtargetInfo &STI) const override;
55 
56   void expandFunctionCall(const MCInst &MI, raw_ostream &OS,
57                           SmallVectorImpl<MCFixup> &Fixups,
58                           const MCSubtargetInfo &STI) const;
59 
60   void expandAddTPRel(const MCInst &MI, raw_ostream &OS,
61                       SmallVectorImpl<MCFixup> &Fixups,
62                       const MCSubtargetInfo &STI) const;
63 
64   /// TableGen'erated function for getting the binary encoding for an
65   /// instruction.
66   uint64_t getBinaryCodeForInstr(const MCInst &MI,
67                                  SmallVectorImpl<MCFixup> &Fixups,
68                                  const MCSubtargetInfo &STI) const;
69 
70   /// Return binary encoding of operand. If the machine operand requires
71   /// relocation, record the relocation and return zero.
72   unsigned getMachineOpValue(const MCInst &MI, const MCOperand &MO,
73                              SmallVectorImpl<MCFixup> &Fixups,
74                              const MCSubtargetInfo &STI) const;
75 
76   unsigned getImmOpValueAsr1(const MCInst &MI, unsigned OpNo,
77                              SmallVectorImpl<MCFixup> &Fixups,
78                              const MCSubtargetInfo &STI) const;
79 
80   unsigned getImmOpValue(const MCInst &MI, unsigned OpNo,
81                          SmallVectorImpl<MCFixup> &Fixups,
82                          const MCSubtargetInfo &STI) const;
83 
84   unsigned getVMaskReg(const MCInst &MI, unsigned OpNo,
85                        SmallVectorImpl<MCFixup> &Fixups,
86                        const MCSubtargetInfo &STI) const;
87 };
88 } // end anonymous namespace
89 
90 MCCodeEmitter *llvm::createRISCVMCCodeEmitter(const MCInstrInfo &MCII,
91                                               const MCRegisterInfo &MRI,
92                                               MCContext &Ctx) {
93   return new RISCVMCCodeEmitter(Ctx, MCII);
94 }
95 
96 // Expand PseudoCALL(Reg), PseudoTAIL and PseudoJump to AUIPC and JALR with
97 // relocation types. We expand those pseudo-instructions while encoding them,
98 // meaning AUIPC and JALR won't go through RISCV MC to MC compressed
99 // instruction transformation. This is acceptable because AUIPC has no 16-bit
100 // form and C_JALR has no immediate operand field.  We let linker relaxation
101 // deal with it. When linker relaxation is enabled, AUIPC and JALR have a
102 // chance to relax to JAL.
103 // If the C extension is enabled, JAL has a chance relax to C_JAL.
104 void RISCVMCCodeEmitter::expandFunctionCall(const MCInst &MI, raw_ostream &OS,
105                                             SmallVectorImpl<MCFixup> &Fixups,
106                                             const MCSubtargetInfo &STI) const {
107   MCInst TmpInst;
108   MCOperand Func;
109   Register Ra;
110   if (MI.getOpcode() == RISCV::PseudoTAIL) {
111     Func = MI.getOperand(0);
112     Ra = RISCV::X6;
113   } else if (MI.getOpcode() == RISCV::PseudoCALLReg) {
114     Func = MI.getOperand(1);
115     Ra = MI.getOperand(0).getReg();
116   } else if (MI.getOpcode() == RISCV::PseudoCALL) {
117     Func = MI.getOperand(0);
118     Ra = RISCV::X1;
119   } else if (MI.getOpcode() == RISCV::PseudoJump) {
120     Func = MI.getOperand(1);
121     Ra = MI.getOperand(0).getReg();
122   }
123   uint32_t Binary;
124 
125   assert(Func.isExpr() && "Expected expression");
126 
127   const MCExpr *CallExpr = Func.getExpr();
128 
129   // Emit AUIPC Ra, Func with R_RISCV_CALL relocation type.
130   TmpInst = MCInstBuilder(RISCV::AUIPC)
131                 .addReg(Ra)
132                 .addOperand(MCOperand::createExpr(CallExpr));
133   Binary = getBinaryCodeForInstr(TmpInst, Fixups, STI);
134   support::endian::write(OS, Binary, support::little);
135 
136   if (MI.getOpcode() == RISCV::PseudoTAIL ||
137       MI.getOpcode() == RISCV::PseudoJump)
138     // Emit JALR X0, Ra, 0
139     TmpInst = MCInstBuilder(RISCV::JALR).addReg(RISCV::X0).addReg(Ra).addImm(0);
140   else
141     // Emit JALR Ra, Ra, 0
142     TmpInst = MCInstBuilder(RISCV::JALR).addReg(Ra).addReg(Ra).addImm(0);
143   Binary = getBinaryCodeForInstr(TmpInst, Fixups, STI);
144   support::endian::write(OS, Binary, support::little);
145 }
146 
147 // Expand PseudoAddTPRel to a simple ADD with the correct relocation.
148 void RISCVMCCodeEmitter::expandAddTPRel(const MCInst &MI, raw_ostream &OS,
149                                         SmallVectorImpl<MCFixup> &Fixups,
150                                         const MCSubtargetInfo &STI) const {
151   MCOperand DestReg = MI.getOperand(0);
152   MCOperand SrcReg = MI.getOperand(1);
153   MCOperand TPReg = MI.getOperand(2);
154   assert(TPReg.isReg() && TPReg.getReg() == RISCV::X4 &&
155          "Expected thread pointer as second input to TP-relative add");
156 
157   MCOperand SrcSymbol = MI.getOperand(3);
158   assert(SrcSymbol.isExpr() &&
159          "Expected expression as third input to TP-relative add");
160 
161   const RISCVMCExpr *Expr = dyn_cast<RISCVMCExpr>(SrcSymbol.getExpr());
162   assert(Expr && Expr->getKind() == RISCVMCExpr::VK_RISCV_TPREL_ADD &&
163          "Expected tprel_add relocation on TP-relative symbol");
164 
165   // Emit the correct tprel_add relocation for the symbol.
166   Fixups.push_back(MCFixup::create(
167       0, Expr, MCFixupKind(RISCV::fixup_riscv_tprel_add), MI.getLoc()));
168 
169   // Emit fixup_riscv_relax for tprel_add where the relax feature is enabled.
170   if (STI.getFeatureBits()[RISCV::FeatureRelax]) {
171     const MCConstantExpr *Dummy = MCConstantExpr::create(0, Ctx);
172     Fixups.push_back(MCFixup::create(
173         0, Dummy, MCFixupKind(RISCV::fixup_riscv_relax), MI.getLoc()));
174   }
175 
176   // Emit a normal ADD instruction with the given operands.
177   MCInst TmpInst = MCInstBuilder(RISCV::ADD)
178                        .addOperand(DestReg)
179                        .addOperand(SrcReg)
180                        .addOperand(TPReg);
181   uint32_t Binary = getBinaryCodeForInstr(TmpInst, Fixups, STI);
182   support::endian::write(OS, Binary, support::little);
183 }
184 
185 void RISCVMCCodeEmitter::encodeInstruction(const MCInst &MI, raw_ostream &OS,
186                                            SmallVectorImpl<MCFixup> &Fixups,
187                                            const MCSubtargetInfo &STI) const {
188   const MCInstrDesc &Desc = MCII.get(MI.getOpcode());
189   // Get byte count of instruction.
190   unsigned Size = Desc.getSize();
191 
192   // RISCVInstrInfo::getInstSizeInBytes hard-codes the number of expanded
193   // instructions for each pseudo, and must be updated when adding new pseudos
194   // or changing existing ones.
195   if (MI.getOpcode() == RISCV::PseudoCALLReg ||
196       MI.getOpcode() == RISCV::PseudoCALL ||
197       MI.getOpcode() == RISCV::PseudoTAIL ||
198       MI.getOpcode() == RISCV::PseudoJump) {
199     expandFunctionCall(MI, OS, Fixups, STI);
200     MCNumEmitted += 2;
201     return;
202   }
203 
204   if (MI.getOpcode() == RISCV::PseudoAddTPRel) {
205     expandAddTPRel(MI, OS, Fixups, STI);
206     MCNumEmitted += 1;
207     return;
208   }
209 
210   switch (Size) {
211   default:
212     llvm_unreachable("Unhandled encodeInstruction length!");
213   case 2: {
214     uint16_t Bits = getBinaryCodeForInstr(MI, Fixups, STI);
215     support::endian::write<uint16_t>(OS, Bits, support::little);
216     break;
217   }
218   case 4: {
219     uint32_t Bits = getBinaryCodeForInstr(MI, Fixups, STI);
220     support::endian::write(OS, Bits, support::little);
221     break;
222   }
223   }
224 
225   ++MCNumEmitted; // Keep track of the # of mi's emitted.
226 }
227 
228 unsigned
229 RISCVMCCodeEmitter::getMachineOpValue(const MCInst &MI, const MCOperand &MO,
230                                       SmallVectorImpl<MCFixup> &Fixups,
231                                       const MCSubtargetInfo &STI) const {
232 
233   if (MO.isReg())
234     return Ctx.getRegisterInfo()->getEncodingValue(MO.getReg());
235 
236   if (MO.isImm())
237     return static_cast<unsigned>(MO.getImm());
238 
239   llvm_unreachable("Unhandled expression!");
240   return 0;
241 }
242 
243 unsigned
244 RISCVMCCodeEmitter::getImmOpValueAsr1(const MCInst &MI, unsigned OpNo,
245                                       SmallVectorImpl<MCFixup> &Fixups,
246                                       const MCSubtargetInfo &STI) const {
247   const MCOperand &MO = MI.getOperand(OpNo);
248 
249   if (MO.isImm()) {
250     unsigned Res = MO.getImm();
251     assert((Res & 1) == 0 && "LSB is non-zero");
252     return Res >> 1;
253   }
254 
255   return getImmOpValue(MI, OpNo, Fixups, STI);
256 }
257 
258 unsigned RISCVMCCodeEmitter::getImmOpValue(const MCInst &MI, unsigned OpNo,
259                                            SmallVectorImpl<MCFixup> &Fixups,
260                                            const MCSubtargetInfo &STI) const {
261   bool EnableRelax = STI.getFeatureBits()[RISCV::FeatureRelax];
262   const MCOperand &MO = MI.getOperand(OpNo);
263 
264   MCInstrDesc const &Desc = MCII.get(MI.getOpcode());
265   unsigned MIFrm = Desc.TSFlags & RISCVII::InstFormatMask;
266 
267   // If the destination is an immediate, there is nothing to do.
268   if (MO.isImm())
269     return MO.getImm();
270 
271   assert(MO.isExpr() &&
272          "getImmOpValue expects only expressions or immediates");
273   const MCExpr *Expr = MO.getExpr();
274   MCExpr::ExprKind Kind = Expr->getKind();
275   RISCV::Fixups FixupKind = RISCV::fixup_riscv_invalid;
276   bool RelaxCandidate = false;
277   if (Kind == MCExpr::Target) {
278     const RISCVMCExpr *RVExpr = cast<RISCVMCExpr>(Expr);
279 
280     switch (RVExpr->getKind()) {
281     case RISCVMCExpr::VK_RISCV_None:
282     case RISCVMCExpr::VK_RISCV_Invalid:
283     case RISCVMCExpr::VK_RISCV_32_PCREL:
284       llvm_unreachable("Unhandled fixup kind!");
285     case RISCVMCExpr::VK_RISCV_TPREL_ADD:
286       // tprel_add is only used to indicate that a relocation should be emitted
287       // for an add instruction used in TP-relative addressing. It should not be
288       // expanded as if representing an actual instruction operand and so to
289       // encounter it here is an error.
290       llvm_unreachable(
291           "VK_RISCV_TPREL_ADD should not represent an instruction operand");
292     case RISCVMCExpr::VK_RISCV_LO:
293       if (MIFrm == RISCVII::InstFormatI)
294         FixupKind = RISCV::fixup_riscv_lo12_i;
295       else if (MIFrm == RISCVII::InstFormatS)
296         FixupKind = RISCV::fixup_riscv_lo12_s;
297       else
298         llvm_unreachable("VK_RISCV_LO used with unexpected instruction format");
299       RelaxCandidate = true;
300       break;
301     case RISCVMCExpr::VK_RISCV_HI:
302       FixupKind = RISCV::fixup_riscv_hi20;
303       RelaxCandidate = true;
304       break;
305     case RISCVMCExpr::VK_RISCV_PCREL_LO:
306       if (MIFrm == RISCVII::InstFormatI)
307         FixupKind = RISCV::fixup_riscv_pcrel_lo12_i;
308       else if (MIFrm == RISCVII::InstFormatS)
309         FixupKind = RISCV::fixup_riscv_pcrel_lo12_s;
310       else
311         llvm_unreachable(
312             "VK_RISCV_PCREL_LO used with unexpected instruction format");
313       RelaxCandidate = true;
314       break;
315     case RISCVMCExpr::VK_RISCV_PCREL_HI:
316       FixupKind = RISCV::fixup_riscv_pcrel_hi20;
317       RelaxCandidate = true;
318       break;
319     case RISCVMCExpr::VK_RISCV_GOT_HI:
320       FixupKind = RISCV::fixup_riscv_got_hi20;
321       break;
322     case RISCVMCExpr::VK_RISCV_TPREL_LO:
323       if (MIFrm == RISCVII::InstFormatI)
324         FixupKind = RISCV::fixup_riscv_tprel_lo12_i;
325       else if (MIFrm == RISCVII::InstFormatS)
326         FixupKind = RISCV::fixup_riscv_tprel_lo12_s;
327       else
328         llvm_unreachable(
329             "VK_RISCV_TPREL_LO used with unexpected instruction format");
330       RelaxCandidate = true;
331       break;
332     case RISCVMCExpr::VK_RISCV_TPREL_HI:
333       FixupKind = RISCV::fixup_riscv_tprel_hi20;
334       RelaxCandidate = true;
335       break;
336     case RISCVMCExpr::VK_RISCV_TLS_GOT_HI:
337       FixupKind = RISCV::fixup_riscv_tls_got_hi20;
338       break;
339     case RISCVMCExpr::VK_RISCV_TLS_GD_HI:
340       FixupKind = RISCV::fixup_riscv_tls_gd_hi20;
341       break;
342     case RISCVMCExpr::VK_RISCV_CALL:
343       FixupKind = RISCV::fixup_riscv_call;
344       RelaxCandidate = true;
345       break;
346     case RISCVMCExpr::VK_RISCV_CALL_PLT:
347       FixupKind = RISCV::fixup_riscv_call_plt;
348       RelaxCandidate = true;
349       break;
350     }
351   } else if (Kind == MCExpr::SymbolRef &&
352              cast<MCSymbolRefExpr>(Expr)->getKind() == MCSymbolRefExpr::VK_None) {
353     if (Desc.getOpcode() == RISCV::JAL) {
354       FixupKind = RISCV::fixup_riscv_jal;
355     } else if (MIFrm == RISCVII::InstFormatB) {
356       FixupKind = RISCV::fixup_riscv_branch;
357     } else if (MIFrm == RISCVII::InstFormatCJ) {
358       FixupKind = RISCV::fixup_riscv_rvc_jump;
359     } else if (MIFrm == RISCVII::InstFormatCB) {
360       FixupKind = RISCV::fixup_riscv_rvc_branch;
361     }
362   }
363 
364   assert(FixupKind != RISCV::fixup_riscv_invalid && "Unhandled expression!");
365 
366   Fixups.push_back(
367       MCFixup::create(0, Expr, MCFixupKind(FixupKind), MI.getLoc()));
368   ++MCNumFixups;
369 
370   // Ensure an R_RISCV_RELAX relocation will be emitted if linker relaxation is
371   // enabled and the current fixup will result in a relocation that may be
372   // relaxed.
373   if (EnableRelax && RelaxCandidate) {
374     const MCConstantExpr *Dummy = MCConstantExpr::create(0, Ctx);
375     Fixups.push_back(
376     MCFixup::create(0, Dummy, MCFixupKind(RISCV::fixup_riscv_relax),
377                     MI.getLoc()));
378     ++MCNumFixups;
379   }
380 
381   return 0;
382 }
383 
384 unsigned RISCVMCCodeEmitter::getVMaskReg(const MCInst &MI, unsigned OpNo,
385                                          SmallVectorImpl<MCFixup> &Fixups,
386                                          const MCSubtargetInfo &STI) const {
387   MCOperand MO = MI.getOperand(OpNo);
388   assert(MO.isReg() && "Expected a register.");
389 
390   switch (MO.getReg()) {
391   default:
392     llvm_unreachable("Invalid mask register.");
393   case RISCV::V0:
394     return 0;
395   case RISCV::NoRegister:
396     return 1;
397   }
398 }
399 
400 #include "RISCVGenMCCodeEmitter.inc"
401