// LoongArchAsmParser.cpp - Parse LoongArch assembly to MCInst instructions -=// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "MCTargetDesc/LoongArchInstPrinter.h" #include "MCTargetDesc/LoongArchMCTargetDesc.h" #include "TargetInfo/LoongArchTargetInfo.h" #include "llvm/MC/MCContext.h" #include "llvm/MC/MCInstrInfo.h" #include "llvm/MC/MCParser/MCAsmLexer.h" #include "llvm/MC/MCParser/MCParsedAsmOperand.h" #include "llvm/MC/MCParser/MCTargetAsmParser.h" #include "llvm/MC/MCRegisterInfo.h" #include "llvm/MC/MCStreamer.h" #include "llvm/MC/MCSubtargetInfo.h" #include "llvm/MC/TargetRegistry.h" #include "llvm/Support/Casting.h" using namespace llvm; #define DEBUG_TYPE "loongarch-asm-parser" namespace { class LoongArchAsmParser : public MCTargetAsmParser { SMLoc getLoc() const { return getParser().getTok().getLoc(); } /// Parse a register as used in CFI directives. bool ParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc) override; OperandMatchResultTy tryParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc) override; bool ParseInstruction(ParseInstructionInfo &Info, StringRef Name, SMLoc NameLoc, OperandVector &Operands) override; bool ParseDirective(AsmToken DirectiveID) override { return true; } bool MatchAndEmitInstruction(SMLoc IDLoc, unsigned &Opcode, OperandVector &Operands, MCStreamer &Out, uint64_t &ErrorInfo, bool MatchingInlineAsm) override; unsigned checkTargetMatchPredicate(MCInst &Inst) override; unsigned validateTargetOperandClass(MCParsedAsmOperand &Op, unsigned Kind) override; bool generateImmOutOfRangeError(OperandVector &Operands, uint64_t ErrorInfo, int64_t Lower, int64_t Upper, Twine Msg); /// Helper for processing MC instructions that have been successfully matched /// by MatchAndEmitInstruction. bool processInstruction(MCInst &Inst, SMLoc IDLoc, OperandVector &Operands, MCStreamer &Out); // Auto-generated instruction matching functions. #define GET_ASSEMBLER_HEADER #include "LoongArchGenAsmMatcher.inc" OperandMatchResultTy parseRegister(OperandVector &Operands); OperandMatchResultTy parseImmediate(OperandVector &Operands); bool parseOperand(OperandVector &Operands, StringRef Mnemonic); public: enum LoongArchMatchResultTy { Match_Dummy = FIRST_TARGET_MATCH_RESULT_TY, Match_RequiresMsbNotLessThanLsb, Match_RequiresOpnd2NotR0R1, #define GET_OPERAND_DIAGNOSTIC_TYPES #include "LoongArchGenAsmMatcher.inc" #undef GET_OPERAND_DIAGNOSTIC_TYPES }; LoongArchAsmParser(const MCSubtargetInfo &STI, MCAsmParser &Parser, const MCInstrInfo &MII, const MCTargetOptions &Options) : MCTargetAsmParser(Options, STI, MII) { Parser.addAliasForDirective(".half", ".2byte"); Parser.addAliasForDirective(".hword", ".2byte"); Parser.addAliasForDirective(".word", ".4byte"); Parser.addAliasForDirective(".dword", ".8byte"); // Initialize the set of available features. setAvailableFeatures(ComputeAvailableFeatures(STI.getFeatureBits())); } }; // Instances of this class represent a parsed LoongArch machine instruction. class LoongArchOperand : public MCParsedAsmOperand { enum class KindTy { Token, Register, Immediate, } Kind; struct RegOp { MCRegister RegNum; }; struct ImmOp { const MCExpr *Val; }; SMLoc StartLoc, EndLoc; union { StringRef Tok; struct RegOp Reg; struct ImmOp Imm; }; public: LoongArchOperand(KindTy K) : MCParsedAsmOperand(), Kind(K) {} bool isToken() const override { return Kind == KindTy::Token; } bool isReg() const override { return Kind == KindTy::Register; } bool isImm() const override { return Kind == KindTy::Immediate; } bool isMem() const override { return false; } void setReg(MCRegister PhysReg) { Reg.RegNum = PhysReg; } static bool evaluateConstantImm(const MCExpr *Expr, int64_t &Imm) { if (auto CE = dyn_cast(Expr)) { Imm = CE->getValue(); return true; } return false; } template bool isUImm() const { if (!isImm()) return false; int64_t Imm; bool IsConstantImm = evaluateConstantImm(getImm(), Imm); return IsConstantImm && isUInt(Imm - P); } template bool isSImm() const { if (!isImm()) return false; int64_t Imm; bool IsConstantImm = evaluateConstantImm(getImm(), Imm); return IsConstantImm && isShiftedInt(Imm); } bool isUImm2() const { return isUImm<2>(); } bool isUImm2plus1() const { return isUImm<2, 1>(); } bool isUImm3() const { return isUImm<3>(); } bool isUImm5() const { return isUImm<5>(); } bool isUImm6() const { return isUImm<6>(); } bool isUImm8() const { return isUImm<8>(); } bool isUImm12() const { return isUImm<12>(); } bool isUImm14() const { return isUImm<14>(); } bool isUImm15() const { return isUImm<15>(); } bool isSImm12() const { return isSImm<12>(); } bool isSImm14lsl2() const { return isSImm<14, 2>(); } bool isSImm16() const { return isSImm<16>(); } bool isSImm16lsl2() const { return isSImm<16, 2>(); } bool isSImm20() const { return isSImm<20>(); } bool isSImm21lsl2() const { return isSImm<21, 2>(); } bool isSImm26lsl2() const { return isSImm<26, 2>(); } /// Gets location of the first token of this operand. SMLoc getStartLoc() const override { return StartLoc; } /// Gets location of the last token of this operand. SMLoc getEndLoc() const override { return EndLoc; } unsigned getReg() const override { assert(Kind == KindTy::Register && "Invalid type access!"); return Reg.RegNum.id(); } const MCExpr *getImm() const { assert(Kind == KindTy::Immediate && "Invalid type access!"); return Imm.Val; } StringRef getToken() const { assert(Kind == KindTy::Token && "Invalid type access!"); return Tok; } void print(raw_ostream &OS) const override { auto RegName = [](unsigned Reg) { if (Reg) return LoongArchInstPrinter::getRegisterName(Reg); else return "noreg"; }; switch (Kind) { case KindTy::Immediate: OS << *getImm(); break; case KindTy::Register: OS << ""; break; case KindTy::Token: OS << "'" << getToken() << "'"; break; } } static std::unique_ptr createToken(StringRef Str, SMLoc S) { auto Op = std::make_unique(KindTy::Token); Op->Tok = Str; Op->StartLoc = S; Op->EndLoc = S; return Op; } static std::unique_ptr createReg(unsigned RegNo, SMLoc S, SMLoc E) { auto Op = std::make_unique(KindTy::Register); Op->Reg.RegNum = RegNo; Op->StartLoc = S; Op->EndLoc = E; return Op; } static std::unique_ptr createImm(const MCExpr *Val, SMLoc S, SMLoc E) { auto Op = std::make_unique(KindTy::Immediate); Op->Imm.Val = Val; Op->StartLoc = S; Op->EndLoc = E; return Op; } void addExpr(MCInst &Inst, const MCExpr *Expr) const { if (auto CE = dyn_cast(Expr)) Inst.addOperand(MCOperand::createImm(CE->getValue())); else Inst.addOperand(MCOperand::createExpr(Expr)); } // Used by the TableGen Code. void addRegOperands(MCInst &Inst, unsigned N) const { assert(N == 1 && "Invalid number of operands!"); Inst.addOperand(MCOperand::createReg(getReg())); } void addImmOperands(MCInst &Inst, unsigned N) const { assert(N == 1 && "Invalid number of operands!"); addExpr(Inst, getImm()); } }; } // end namespace #define GET_REGISTER_MATCHER #define GET_SUBTARGET_FEATURE_NAME #define GET_MATCHER_IMPLEMENTATION #define GET_MNEMONIC_SPELL_CHECKER #include "LoongArchGenAsmMatcher.inc" static MCRegister convertFPR32ToFPR64(MCRegister Reg) { assert(Reg >= LoongArch::F0 && Reg <= LoongArch::F31 && "Invalid register"); return Reg - LoongArch::F0 + LoongArch::F0_64; } // Attempts to match Name as a register (either using the default name or // alternative ABI names), setting RegNo to the matching register. Upon // failure, returns true and sets RegNo to 0. static bool matchRegisterNameHelper(MCRegister &RegNo, StringRef Name) { RegNo = MatchRegisterName(Name); // The 32-bit and 64-bit FPRs have the same asm name. Check that the initial // match always matches the 32-bit variant, and not the 64-bit one. assert(!(RegNo >= LoongArch::F0_64 && RegNo <= LoongArch::F31_64)); // The default FPR register class is based on the tablegen enum ordering. static_assert(LoongArch::F0 < LoongArch::F0_64, "FPR matching must be updated"); if (RegNo == LoongArch::NoRegister) RegNo = MatchRegisterAltName(Name); return RegNo == LoongArch::NoRegister; } bool LoongArchAsmParser::ParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc) { return Error(getLoc(), "invalid register number"); } OperandMatchResultTy LoongArchAsmParser::tryParseRegister(unsigned &RegNo, SMLoc &StartLoc, SMLoc &EndLoc) { llvm_unreachable("Unimplemented function."); } OperandMatchResultTy LoongArchAsmParser::parseRegister(OperandVector &Operands) { if (getLexer().getTok().isNot(AsmToken::Dollar)) return MatchOperand_NoMatch; // Eat the $ prefix. getLexer().Lex(); if (getLexer().getKind() != AsmToken::Identifier) return MatchOperand_NoMatch; StringRef Name = getLexer().getTok().getIdentifier(); MCRegister RegNo; matchRegisterNameHelper(RegNo, Name); if (RegNo == LoongArch::NoRegister) return MatchOperand_NoMatch; SMLoc S = getLoc(); SMLoc E = SMLoc::getFromPointer(S.getPointer() + Name.size()); getLexer().Lex(); Operands.push_back(LoongArchOperand::createReg(RegNo, S, E)); return MatchOperand_Success; } OperandMatchResultTy LoongArchAsmParser::parseImmediate(OperandVector &Operands) { SMLoc S = getLoc(); SMLoc E; const MCExpr *Res; if (getParser().parseExpression(Res, E)) return MatchOperand_ParseFail; Operands.push_back(LoongArchOperand::createImm(Res, S, E)); return MatchOperand_Success; } /// Looks at a token type and creates the relevant operand from this /// information, adding to Operands. Return true upon an error. bool LoongArchAsmParser::parseOperand(OperandVector &Operands, StringRef Mnemonic) { if (parseRegister(Operands) == MatchOperand_Success || parseImmediate(Operands) == MatchOperand_Success) return false; // Finally we have exhausted all options and must declare defeat. Error(getLoc(), "unknown operand"); return true; } bool LoongArchAsmParser::ParseInstruction(ParseInstructionInfo &Info, StringRef Name, SMLoc NameLoc, OperandVector &Operands) { // First operand in MCInst is instruction mnemonic. Operands.push_back(LoongArchOperand::createToken(Name, NameLoc)); // If there are no more operands, then finish. if (parseOptionalToken(AsmToken::EndOfStatement)) return false; // Parse first operand. if (parseOperand(Operands, Name)) return true; // Parse until end of statement, consuming commas between operands. while (parseOptionalToken(AsmToken::Comma)) if (parseOperand(Operands, Name)) return true; // Parse end of statement and return successfully. if (parseOptionalToken(AsmToken::EndOfStatement)) return false; SMLoc Loc = getLexer().getLoc(); getParser().eatToEndOfStatement(); return Error(Loc, "unexpected token"); } bool LoongArchAsmParser::processInstruction(MCInst &Inst, SMLoc IDLoc, OperandVector &Operands, MCStreamer &Out) { Inst.setLoc(IDLoc); Out.emitInstruction(Inst, getSTI()); return false; } unsigned LoongArchAsmParser::checkTargetMatchPredicate(MCInst &Inst) { switch (Inst.getOpcode()) { default: break; case LoongArch::CSRXCHG: { unsigned Rj = Inst.getOperand(2).getReg(); if (Rj == LoongArch::R0 || Rj == LoongArch::R1) return Match_RequiresOpnd2NotR0R1; return Match_Success; } case LoongArch::BSTRINS_W: case LoongArch::BSTRINS_D: case LoongArch::BSTRPICK_W: case LoongArch::BSTRPICK_D: { unsigned Opc = Inst.getOpcode(); const signed Msb = (Opc == LoongArch::BSTRINS_W || Opc == LoongArch::BSTRINS_D) ? Inst.getOperand(3).getImm() : Inst.getOperand(2).getImm(); const signed Lsb = (Opc == LoongArch::BSTRINS_W || Opc == LoongArch::BSTRINS_D) ? Inst.getOperand(4).getImm() : Inst.getOperand(3).getImm(); if (Msb < Lsb) return Match_RequiresMsbNotLessThanLsb; return Match_Success; } } return Match_Success; } unsigned LoongArchAsmParser::validateTargetOperandClass(MCParsedAsmOperand &AsmOp, unsigned Kind) { LoongArchOperand &Op = static_cast(AsmOp); if (!Op.isReg()) return Match_InvalidOperand; MCRegister Reg = Op.getReg(); // As the parser couldn't differentiate an FPR32 from an FPR64, coerce the // register from FPR32 to FPR64 if necessary. if (LoongArchMCRegisterClasses[LoongArch::FPR32RegClassID].contains(Reg) && Kind == MCK_FPR64) { Op.setReg(convertFPR32ToFPR64(Reg)); return Match_Success; } return Match_InvalidOperand; } bool LoongArchAsmParser::generateImmOutOfRangeError( OperandVector &Operands, uint64_t ErrorInfo, int64_t Lower, int64_t Upper, Twine Msg = "immediate must be an integer in the range") { SMLoc ErrorLoc = ((LoongArchOperand &)*Operands[ErrorInfo]).getStartLoc(); return Error(ErrorLoc, Msg + " [" + Twine(Lower) + ", " + Twine(Upper) + "]"); } bool LoongArchAsmParser::MatchAndEmitInstruction(SMLoc IDLoc, unsigned &Opcode, OperandVector &Operands, MCStreamer &Out, uint64_t &ErrorInfo, bool MatchingInlineAsm) { MCInst Inst; FeatureBitset MissingFeatures; auto Result = MatchInstructionImpl(Operands, Inst, ErrorInfo, MissingFeatures, MatchingInlineAsm); switch (Result) { default: break; case Match_Success: return processInstruction(Inst, IDLoc, Operands, Out); case Match_MissingFeature: { assert(MissingFeatures.any() && "Unknown missing features!"); bool FirstFeature = true; std::string Msg = "instruction requires the following:"; for (unsigned i = 0, e = MissingFeatures.size(); i != e; ++i) { if (MissingFeatures[i]) { Msg += FirstFeature ? " " : ", "; Msg += getSubtargetFeatureName(i); FirstFeature = false; } } return Error(IDLoc, Msg); } case Match_MnemonicFail: { FeatureBitset FBS = ComputeAvailableFeatures(getSTI().getFeatureBits()); std::string Suggestion = LoongArchMnemonicSpellCheck( ((LoongArchOperand &)*Operands[0]).getToken(), FBS, 0); return Error(IDLoc, "unrecognized instruction mnemonic" + Suggestion); } case Match_InvalidOperand: { SMLoc ErrorLoc = IDLoc; if (ErrorInfo != ~0ULL) { if (ErrorInfo >= Operands.size()) return Error(ErrorLoc, "too few operands for instruction"); ErrorLoc = ((LoongArchOperand &)*Operands[ErrorInfo]).getStartLoc(); if (ErrorLoc == SMLoc()) ErrorLoc = IDLoc; } return Error(ErrorLoc, "invalid operand for instruction"); } } // Handle the case when the error message is of specific type // other than the generic Match_InvalidOperand, and the // corresponding operand is missing. if (Result > FIRST_TARGET_MATCH_RESULT_TY) { SMLoc ErrorLoc = IDLoc; if (ErrorInfo != ~0ULL && ErrorInfo >= Operands.size()) return Error(ErrorLoc, "too few operands for instruction"); } switch (Result) { default: break; case Match_RequiresMsbNotLessThanLsb: { SMLoc ErrorStart = Operands[3]->getStartLoc(); return Error(ErrorStart, "msb is less than lsb", SMRange(ErrorStart, Operands[4]->getEndLoc())); } case Match_RequiresOpnd2NotR0R1: return Error(Operands[2]->getStartLoc(), "must not be $r0 or $r1"); case Match_InvalidUImm2: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/0, /*Upper=*/(1 << 2) - 1); case Match_InvalidUImm2plus1: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/1, /*Upper=*/(1 << 2)); case Match_InvalidUImm3: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/0, /*Upper=*/(1 << 3) - 1); case Match_InvalidUImm5: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/0, /*Upper=*/(1 << 5) - 1); case Match_InvalidUImm6: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/0, /*Upper=*/(1 << 6) - 1); case Match_InvalidUImm12: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/0, /*Upper=*/(1 << 12) - 1); case Match_InvalidUImm15: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/0, /*Upper=*/(1 << 15) - 1); case Match_InvalidSImm12: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/-(1 << 11), /*Upper=*/(1 << 11) - 1); case Match_InvalidSImm14lsl2: return generateImmOutOfRangeError( Operands, ErrorInfo, /*Lower=*/-(1 << 15), /*Upper=*/(1 << 15) - 4, "immediate must be a multiple of 4 in the range"); case Match_InvalidSImm16: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/-(1 << 15), /*Upper=*/(1 << 15) - 1); case Match_InvalidSImm16lsl2: return generateImmOutOfRangeError( Operands, ErrorInfo, /*Lower=*/-(1 << 17), /*Upper=*/(1 << 17) - 4, "immediate must be a multiple of 4 in the range"); case Match_InvalidSImm20: return generateImmOutOfRangeError(Operands, ErrorInfo, /*Lower=*/-(1 << 19), /*Upper=*/(1 << 19) - 1); case Match_InvalidSImm21lsl2: return generateImmOutOfRangeError( Operands, ErrorInfo, /*Lower=*/-(1 << 22), /*Upper=*/(1 << 22) - 4, "immediate must be a multiple of 4 in the range"); case Match_InvalidSImm26lsl2: return generateImmOutOfRangeError( Operands, ErrorInfo, /*Lower=*/-(1 << 27), /*Upper=*/(1 << 27) - 4, "immediate must be a multiple of 4 in the range"); } llvm_unreachable("Unknown match type detected!"); } extern "C" LLVM_EXTERNAL_VISIBILITY void LLVMInitializeLoongArchAsmParser() { RegisterMCAsmParser X(getTheLoongArch32Target()); RegisterMCAsmParser Y(getTheLoongArch64Target()); }