xref: /freebsd/contrib/llvm-project/llvm/lib/Target/MSP430/AsmParser/MSP430AsmParser.cpp (revision 85868e8a1daeaae7a0e48effb2ea2310ae3b02c6)
1 //===- MSP430AsmParser.cpp - Parse MSP430 assembly to MCInst instructions -===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "MSP430.h"
10 #include "MSP430RegisterInfo.h"
11 #include "MCTargetDesc/MSP430MCTargetDesc.h"
12 #include "TargetInfo/MSP430TargetInfo.h"
13 
14 #include "llvm/ADT/APInt.h"
15 #include "llvm/ADT/StringSwitch.h"
16 #include "llvm/MC/MCContext.h"
17 #include "llvm/MC/MCExpr.h"
18 #include "llvm/MC/MCInst.h"
19 #include "llvm/MC/MCInstBuilder.h"
20 #include "llvm/MC/MCParser/MCAsmLexer.h"
21 #include "llvm/MC/MCParser/MCParsedAsmOperand.h"
22 #include "llvm/MC/MCParser/MCTargetAsmParser.h"
23 #include "llvm/MC/MCStreamer.h"
24 #include "llvm/MC/MCSubtargetInfo.h"
25 #include "llvm/MC/MCSymbol.h"
26 #include "llvm/MC/MCValue.h"
27 #include "llvm/Support/Debug.h"
28 #include "llvm/Support/MathExtras.h"
29 #include "llvm/Support/TargetRegistry.h"
30 
31 #define DEBUG_TYPE "msp430-asm-parser"
32 
33 using namespace llvm;
34 
35 namespace {
36 
37 /// Parses MSP430 assembly from a stream.
38 class MSP430AsmParser : public MCTargetAsmParser {
39   const MCSubtargetInfo &STI;
40   MCAsmParser &Parser;
41   const MCRegisterInfo *MRI;
42 
43   bool MatchAndEmitInstruction(SMLoc IDLoc, unsigned &Opcode,
44                                OperandVector &Operands, MCStreamer &Out,
45                                uint64_t &ErrorInfo,
46                                bool MatchingInlineAsm) override;
47 
48   bool ParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc) override;
49 
50   bool ParseInstruction(ParseInstructionInfo &Info, StringRef Name,
51                         SMLoc NameLoc, OperandVector &Operands) override;
52 
53   bool ParseDirective(AsmToken DirectiveID) override;
54   bool ParseDirectiveRefSym(AsmToken DirectiveID);
55 
56   unsigned validateTargetOperandClass(MCParsedAsmOperand &Op,
57                                       unsigned Kind) override;
58 
59   bool parseJccInstruction(ParseInstructionInfo &Info, StringRef Name,
60                            SMLoc NameLoc, OperandVector &Operands);
61 
62   bool ParseOperand(OperandVector &Operands);
63 
64   bool ParseLiteralValues(unsigned Size, SMLoc L);
65 
66   MCAsmParser &getParser() const { return Parser; }
67   MCAsmLexer &getLexer() const { return Parser.getLexer(); }
68 
69   /// @name Auto-generated Matcher Functions
70   /// {
71 
72 #define GET_ASSEMBLER_HEADER
73 #include "MSP430GenAsmMatcher.inc"
74 
75   /// }
76 
77 public:
78   MSP430AsmParser(const MCSubtargetInfo &STI, MCAsmParser &Parser,
79                   const MCInstrInfo &MII, const MCTargetOptions &Options)
80       : MCTargetAsmParser(Options, STI, MII), STI(STI), Parser(Parser) {
81     MCAsmParserExtension::Initialize(Parser);
82     MRI = getContext().getRegisterInfo();
83 
84     setAvailableFeatures(ComputeAvailableFeatures(STI.getFeatureBits()));
85   }
86 };
87 
88 /// A parsed MSP430 assembly operand.
89 class MSP430Operand : public MCParsedAsmOperand {
90   typedef MCParsedAsmOperand Base;
91 
92   enum KindTy {
93     k_Imm,
94     k_Reg,
95     k_Tok,
96     k_Mem,
97     k_IndReg,
98     k_PostIndReg
99   } Kind;
100 
101   struct Memory {
102     unsigned Reg;
103     const MCExpr *Offset;
104   };
105   union {
106     const MCExpr *Imm;
107     unsigned      Reg;
108     StringRef     Tok;
109     Memory        Mem;
110   };
111 
112   SMLoc Start, End;
113 
114 public:
115   MSP430Operand(StringRef Tok, SMLoc const &S)
116       : Base(), Kind(k_Tok), Tok(Tok), Start(S), End(S) {}
117   MSP430Operand(KindTy Kind, unsigned Reg, SMLoc const &S, SMLoc const &E)
118       : Base(), Kind(Kind), Reg(Reg), Start(S), End(E) {}
119   MSP430Operand(MCExpr const *Imm, SMLoc const &S, SMLoc const &E)
120       : Base(), Kind(k_Imm), Imm(Imm), Start(S), End(E) {}
121   MSP430Operand(unsigned Reg, MCExpr const *Expr, SMLoc const &S, SMLoc const &E)
122       : Base(), Kind(k_Mem), Mem({Reg, Expr}), Start(S), End(E) {}
123 
124   void addRegOperands(MCInst &Inst, unsigned N) const {
125     assert((Kind == k_Reg || Kind == k_IndReg || Kind == k_PostIndReg) &&
126         "Unexpected operand kind");
127     assert(N == 1 && "Invalid number of operands!");
128 
129     Inst.addOperand(MCOperand::createReg(Reg));
130   }
131 
132   void addExprOperand(MCInst &Inst, const MCExpr *Expr) const {
133     // Add as immediate when possible
134     if (!Expr)
135       Inst.addOperand(MCOperand::createImm(0));
136     else if (const MCConstantExpr *CE = dyn_cast<MCConstantExpr>(Expr))
137       Inst.addOperand(MCOperand::createImm(CE->getValue()));
138     else
139       Inst.addOperand(MCOperand::createExpr(Expr));
140   }
141 
142   void addImmOperands(MCInst &Inst, unsigned N) const {
143     assert(Kind == k_Imm && "Unexpected operand kind");
144     assert(N == 1 && "Invalid number of operands!");
145 
146     addExprOperand(Inst, Imm);
147   }
148 
149   void addMemOperands(MCInst &Inst, unsigned N) const {
150     assert(Kind == k_Mem && "Unexpected operand kind");
151     assert(N == 2 && "Invalid number of operands");
152 
153     Inst.addOperand(MCOperand::createReg(Mem.Reg));
154     addExprOperand(Inst, Mem.Offset);
155   }
156 
157   bool isReg() const        { return Kind == k_Reg; }
158   bool isImm() const        { return Kind == k_Imm; }
159   bool isToken() const      { return Kind == k_Tok; }
160   bool isMem() const        { return Kind == k_Mem; }
161   bool isIndReg() const     { return Kind == k_IndReg; }
162   bool isPostIndReg() const { return Kind == k_PostIndReg; }
163 
164   bool isCGImm() const {
165     if (Kind != k_Imm)
166       return false;
167 
168     int64_t Val;
169     if (!Imm->evaluateAsAbsolute(Val))
170       return false;
171 
172     if (Val == 0 || Val == 1 || Val == 2 || Val == 4 || Val == 8 || Val == -1)
173       return true;
174 
175     return false;
176   }
177 
178   StringRef getToken() const {
179     assert(Kind == k_Tok && "Invalid access!");
180     return Tok;
181   }
182 
183   unsigned getReg() const {
184     assert(Kind == k_Reg && "Invalid access!");
185     return Reg;
186   }
187 
188   void setReg(unsigned RegNo) {
189     assert(Kind == k_Reg && "Invalid access!");
190     Reg = RegNo;
191   }
192 
193   static std::unique_ptr<MSP430Operand> CreateToken(StringRef Str, SMLoc S) {
194     return std::make_unique<MSP430Operand>(Str, S);
195   }
196 
197   static std::unique_ptr<MSP430Operand> CreateReg(unsigned RegNum, SMLoc S,
198                                                   SMLoc E) {
199     return std::make_unique<MSP430Operand>(k_Reg, RegNum, S, E);
200   }
201 
202   static std::unique_ptr<MSP430Operand> CreateImm(const MCExpr *Val, SMLoc S,
203                                                   SMLoc E) {
204     return std::make_unique<MSP430Operand>(Val, S, E);
205   }
206 
207   static std::unique_ptr<MSP430Operand> CreateMem(unsigned RegNum,
208                                                   const MCExpr *Val,
209                                                   SMLoc S, SMLoc E) {
210     return std::make_unique<MSP430Operand>(RegNum, Val, S, E);
211   }
212 
213   static std::unique_ptr<MSP430Operand> CreateIndReg(unsigned RegNum, SMLoc S,
214                                                   SMLoc E) {
215     return std::make_unique<MSP430Operand>(k_IndReg, RegNum, S, E);
216   }
217 
218   static std::unique_ptr<MSP430Operand> CreatePostIndReg(unsigned RegNum, SMLoc S,
219                                                   SMLoc E) {
220     return std::make_unique<MSP430Operand>(k_PostIndReg, RegNum, S, E);
221   }
222 
223   SMLoc getStartLoc() const { return Start; }
224   SMLoc getEndLoc() const { return End; }
225 
226   virtual void print(raw_ostream &O) const {
227     switch (Kind) {
228     case k_Tok:
229       O << "Token " << Tok;
230       break;
231     case k_Reg:
232       O << "Register " << Reg;
233       break;
234     case k_Imm:
235       O << "Immediate " << *Imm;
236       break;
237     case k_Mem:
238       O << "Memory ";
239       O << *Mem.Offset << "(" << Reg << ")";
240       break;
241     case k_IndReg:
242       O << "RegInd " << Reg;
243       break;
244     case k_PostIndReg:
245       O << "PostInc " << Reg;
246       break;
247     }
248   }
249 };
250 } // end anonymous namespace
251 
252 bool MSP430AsmParser::MatchAndEmitInstruction(SMLoc Loc, unsigned &Opcode,
253                                               OperandVector &Operands,
254                                               MCStreamer &Out,
255                                               uint64_t &ErrorInfo,
256                                               bool MatchingInlineAsm) {
257   MCInst Inst;
258   unsigned MatchResult =
259       MatchInstructionImpl(Operands, Inst, ErrorInfo, MatchingInlineAsm);
260 
261   switch (MatchResult) {
262   case Match_Success:
263     Inst.setLoc(Loc);
264     Out.EmitInstruction(Inst, STI);
265     return false;
266   case Match_MnemonicFail:
267     return Error(Loc, "invalid instruction mnemonic");
268   case Match_InvalidOperand: {
269     SMLoc ErrorLoc = Loc;
270     if (ErrorInfo != ~0U) {
271       if (ErrorInfo >= Operands.size())
272         return Error(ErrorLoc, "too few operands for instruction");
273 
274       ErrorLoc = ((MSP430Operand &)*Operands[ErrorInfo]).getStartLoc();
275       if (ErrorLoc == SMLoc())
276         ErrorLoc = Loc;
277     }
278     return Error(ErrorLoc, "invalid operand for instruction");
279   }
280   default:
281     return true;
282   }
283 }
284 
285 // Auto-generated by TableGen
286 static unsigned MatchRegisterName(StringRef Name);
287 static unsigned MatchRegisterAltName(StringRef Name);
288 
289 bool MSP430AsmParser::ParseRegister(unsigned &RegNo, SMLoc &StartLoc,
290                                     SMLoc &EndLoc) {
291   if (getLexer().getKind() == AsmToken::Identifier) {
292     auto Name = getLexer().getTok().getIdentifier().lower();
293     RegNo = MatchRegisterName(Name);
294     if (RegNo == MSP430::NoRegister) {
295       RegNo = MatchRegisterAltName(Name);
296       if (RegNo == MSP430::NoRegister)
297         return true;
298     }
299 
300     AsmToken const &T = getParser().getTok();
301     StartLoc = T.getLoc();
302     EndLoc = T.getEndLoc();
303     getLexer().Lex(); // eat register token
304 
305     return false;
306   }
307 
308   return Error(StartLoc, "invalid register name");
309 }
310 
311 bool MSP430AsmParser::parseJccInstruction(ParseInstructionInfo &Info,
312                                           StringRef Name, SMLoc NameLoc,
313                                           OperandVector &Operands) {
314   if (!Name.startswith_lower("j"))
315     return true;
316 
317   auto CC = Name.drop_front().lower();
318   unsigned CondCode;
319   if (CC == "ne" || CC == "nz")
320     CondCode = MSP430CC::COND_NE;
321   else if (CC == "eq" || CC == "z")
322     CondCode = MSP430CC::COND_E;
323   else if (CC == "lo" || CC == "nc")
324     CondCode = MSP430CC::COND_LO;
325   else if (CC == "hs" || CC == "c")
326     CondCode = MSP430CC::COND_HS;
327   else if (CC == "n")
328     CondCode = MSP430CC::COND_N;
329   else if (CC == "ge")
330     CondCode = MSP430CC::COND_GE;
331   else if (CC == "l")
332     CondCode = MSP430CC::COND_L;
333   else if (CC == "mp")
334     CondCode = MSP430CC::COND_NONE;
335   else
336     return Error(NameLoc, "unknown instruction");
337 
338   if (CondCode == (unsigned)MSP430CC::COND_NONE)
339     Operands.push_back(MSP430Operand::CreateToken("jmp", NameLoc));
340   else {
341     Operands.push_back(MSP430Operand::CreateToken("j", NameLoc));
342     const MCExpr *CCode = MCConstantExpr::create(CondCode, getContext());
343     Operands.push_back(MSP430Operand::CreateImm(CCode, SMLoc(), SMLoc()));
344   }
345 
346   // Skip optional '$' sign.
347   if (getLexer().getKind() == AsmToken::Dollar)
348     getLexer().Lex(); // Eat '$'
349 
350   const MCExpr *Val;
351   SMLoc ExprLoc = getLexer().getLoc();
352   if (getParser().parseExpression(Val))
353     return Error(ExprLoc, "expected expression operand");
354 
355   int64_t Res;
356   if (Val->evaluateAsAbsolute(Res))
357     if (Res < -512 || Res > 511)
358       return Error(ExprLoc, "invalid jump offset");
359 
360   Operands.push_back(MSP430Operand::CreateImm(Val, ExprLoc,
361     getLexer().getLoc()));
362 
363   if (getLexer().isNot(AsmToken::EndOfStatement)) {
364     SMLoc Loc = getLexer().getLoc();
365     getParser().eatToEndOfStatement();
366     return Error(Loc, "unexpected token");
367   }
368 
369   getParser().Lex(); // Consume the EndOfStatement.
370   return false;
371 }
372 
373 bool MSP430AsmParser::ParseInstruction(ParseInstructionInfo &Info,
374                                        StringRef Name, SMLoc NameLoc,
375                                        OperandVector &Operands) {
376   // Drop .w suffix
377   if (Name.endswith_lower(".w"))
378     Name = Name.drop_back(2);
379 
380   if (!parseJccInstruction(Info, Name, NameLoc, Operands))
381     return false;
382 
383   // First operand is instruction mnemonic
384   Operands.push_back(MSP430Operand::CreateToken(Name, NameLoc));
385 
386   // If there are no more operands, then finish
387   if (getLexer().is(AsmToken::EndOfStatement))
388     return false;
389 
390   // Parse first operand
391   if (ParseOperand(Operands))
392     return true;
393 
394   // Parse second operand if any
395   if (getLexer().is(AsmToken::Comma)) {
396     getLexer().Lex(); // Eat ','
397     if (ParseOperand(Operands))
398       return true;
399   }
400 
401   if (getLexer().isNot(AsmToken::EndOfStatement)) {
402     SMLoc Loc = getLexer().getLoc();
403     getParser().eatToEndOfStatement();
404     return Error(Loc, "unexpected token");
405   }
406 
407   getParser().Lex(); // Consume the EndOfStatement.
408   return false;
409 }
410 
411 bool MSP430AsmParser::ParseDirectiveRefSym(AsmToken DirectiveID) {
412     StringRef Name;
413     if (getParser().parseIdentifier(Name))
414       return TokError("expected identifier in directive");
415 
416     MCSymbol *Sym = getContext().getOrCreateSymbol(Name);
417     getStreamer().EmitSymbolAttribute(Sym, MCSA_Global);
418     return false;
419 }
420 
421 bool MSP430AsmParser::ParseDirective(AsmToken DirectiveID) {
422   StringRef IDVal = DirectiveID.getIdentifier();
423   if (IDVal.lower() == ".long") {
424     ParseLiteralValues(4, DirectiveID.getLoc());
425   } else if (IDVal.lower() == ".word" || IDVal.lower() == ".short") {
426     ParseLiteralValues(2, DirectiveID.getLoc());
427   } else if (IDVal.lower() == ".byte") {
428     ParseLiteralValues(1, DirectiveID.getLoc());
429   } else if (IDVal.lower() == ".refsym") {
430     return ParseDirectiveRefSym(DirectiveID);
431   }
432   return true;
433 }
434 
435 bool MSP430AsmParser::ParseOperand(OperandVector &Operands) {
436   switch (getLexer().getKind()) {
437     default: return true;
438     case AsmToken::Identifier: {
439       // try rN
440       unsigned RegNo;
441       SMLoc StartLoc, EndLoc;
442       if (!ParseRegister(RegNo, StartLoc, EndLoc)) {
443         Operands.push_back(MSP430Operand::CreateReg(RegNo, StartLoc, EndLoc));
444         return false;
445       }
446       LLVM_FALLTHROUGH;
447     }
448     case AsmToken::Integer:
449     case AsmToken::Plus:
450     case AsmToken::Minus: {
451       SMLoc StartLoc = getParser().getTok().getLoc();
452       const MCExpr *Val;
453       // Try constexpr[(rN)]
454       if (!getParser().parseExpression(Val)) {
455         unsigned RegNo = MSP430::PC;
456         SMLoc EndLoc = getParser().getTok().getLoc();
457         // Try (rN)
458         if (getLexer().getKind() == AsmToken::LParen) {
459           getLexer().Lex(); // Eat '('
460           SMLoc RegStartLoc;
461           if (ParseRegister(RegNo, RegStartLoc, EndLoc))
462             return true;
463           if (getLexer().getKind() != AsmToken::RParen)
464             return true;
465           EndLoc = getParser().getTok().getEndLoc();
466           getLexer().Lex(); // Eat ')'
467         }
468         Operands.push_back(MSP430Operand::CreateMem(RegNo, Val, StartLoc,
469           EndLoc));
470         return false;
471       }
472       return true;
473     }
474     case AsmToken::Amp: {
475       // Try &constexpr
476       SMLoc StartLoc = getParser().getTok().getLoc();
477       getLexer().Lex(); // Eat '&'
478       const MCExpr *Val;
479       if (!getParser().parseExpression(Val)) {
480         SMLoc EndLoc = getParser().getTok().getLoc();
481         Operands.push_back(MSP430Operand::CreateMem(MSP430::SR, Val, StartLoc,
482           EndLoc));
483         return false;
484       }
485       return true;
486     }
487     case AsmToken::At: {
488       // Try @rN[+]
489       SMLoc StartLoc = getParser().getTok().getLoc();
490       getLexer().Lex(); // Eat '@'
491       unsigned RegNo;
492       SMLoc RegStartLoc, EndLoc;
493       if (ParseRegister(RegNo, RegStartLoc, EndLoc))
494         return true;
495       if (getLexer().getKind() == AsmToken::Plus) {
496         Operands.push_back(MSP430Operand::CreatePostIndReg(RegNo, StartLoc, EndLoc));
497         getLexer().Lex(); // Eat '+'
498         return false;
499       }
500       if (Operands.size() > 1) // Emulate @rd in destination position as 0(rd)
501         Operands.push_back(MSP430Operand::CreateMem(RegNo,
502             MCConstantExpr::create(0, getContext()), StartLoc, EndLoc));
503       else
504         Operands.push_back(MSP430Operand::CreateIndReg(RegNo, StartLoc, EndLoc));
505       return false;
506     }
507     case AsmToken::Hash:
508       // Try #constexpr
509       SMLoc StartLoc = getParser().getTok().getLoc();
510       getLexer().Lex(); // Eat '#'
511       const MCExpr *Val;
512       if (!getParser().parseExpression(Val)) {
513         SMLoc EndLoc = getParser().getTok().getLoc();
514         Operands.push_back(MSP430Operand::CreateImm(Val, StartLoc, EndLoc));
515         return false;
516       }
517       return true;
518   }
519 }
520 
521 bool MSP430AsmParser::ParseLiteralValues(unsigned Size, SMLoc L) {
522   auto parseOne = [&]() -> bool {
523     const MCExpr *Value;
524     if (getParser().parseExpression(Value))
525       return true;
526     getParser().getStreamer().EmitValue(Value, Size, L);
527     return false;
528   };
529   return (parseMany(parseOne));
530 }
531 
532 extern "C" void LLVMInitializeMSP430AsmParser() {
533   RegisterMCAsmParser<MSP430AsmParser> X(getTheMSP430Target());
534 }
535 
536 #define GET_REGISTER_MATCHER
537 #define GET_MATCHER_IMPLEMENTATION
538 #include "MSP430GenAsmMatcher.inc"
539 
540 static unsigned convertGR16ToGR8(unsigned Reg) {
541   switch (Reg) {
542   default:
543     llvm_unreachable("Unknown GR16 register");
544   case MSP430::PC:  return MSP430::PCB;
545   case MSP430::SP:  return MSP430::SPB;
546   case MSP430::SR:  return MSP430::SRB;
547   case MSP430::CG:  return MSP430::CGB;
548   case MSP430::FP:  return MSP430::FPB;
549   case MSP430::R5:  return MSP430::R5B;
550   case MSP430::R6:  return MSP430::R6B;
551   case MSP430::R7:  return MSP430::R7B;
552   case MSP430::R8:  return MSP430::R8B;
553   case MSP430::R9:  return MSP430::R9B;
554   case MSP430::R10: return MSP430::R10B;
555   case MSP430::R11: return MSP430::R11B;
556   case MSP430::R12: return MSP430::R12B;
557   case MSP430::R13: return MSP430::R13B;
558   case MSP430::R14: return MSP430::R14B;
559   case MSP430::R15: return MSP430::R15B;
560   }
561 }
562 
563 unsigned MSP430AsmParser::validateTargetOperandClass(MCParsedAsmOperand &AsmOp,
564                                                      unsigned Kind) {
565   MSP430Operand &Op = static_cast<MSP430Operand &>(AsmOp);
566 
567   if (!Op.isReg())
568     return Match_InvalidOperand;
569 
570   unsigned Reg = Op.getReg();
571   bool isGR16 =
572       MSP430MCRegisterClasses[MSP430::GR16RegClassID].contains(Reg);
573 
574   if (isGR16 && (Kind == MCK_GR8)) {
575     Op.setReg(convertGR16ToGR8(Reg));
576     return Match_Success;
577   }
578 
579   return Match_InvalidOperand;
580 }
581