1 //===- MIParser.cpp - Machine instructions parser implementation ----------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements the parsing of machine instructions. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "llvm/CodeGen/MIRParser/MIParser.h" 14 #include "MILexer.h" 15 #include "llvm/ADT/APInt.h" 16 #include "llvm/ADT/APSInt.h" 17 #include "llvm/ADT/ArrayRef.h" 18 #include "llvm/ADT/DenseMap.h" 19 #include "llvm/ADT/SmallVector.h" 20 #include "llvm/ADT/StringMap.h" 21 #include "llvm/ADT/StringRef.h" 22 #include "llvm/ADT/StringSwitch.h" 23 #include "llvm/ADT/Twine.h" 24 #include "llvm/AsmParser/Parser.h" 25 #include "llvm/AsmParser/SlotMapping.h" 26 #include "llvm/CodeGen/MIRFormatter.h" 27 #include "llvm/CodeGen/MIRPrinter.h" 28 #include "llvm/CodeGen/MachineBasicBlock.h" 29 #include "llvm/CodeGen/MachineFrameInfo.h" 30 #include "llvm/CodeGen/MachineFunction.h" 31 #include "llvm/CodeGen/MachineInstr.h" 32 #include "llvm/CodeGen/MachineInstrBuilder.h" 33 #include "llvm/CodeGen/MachineMemOperand.h" 34 #include "llvm/CodeGen/MachineOperand.h" 35 #include "llvm/CodeGen/MachineRegisterInfo.h" 36 #include "llvm/CodeGen/PseudoSourceValueManager.h" 37 #include "llvm/CodeGen/RegisterBank.h" 38 #include "llvm/CodeGen/RegisterBankInfo.h" 39 #include "llvm/CodeGen/TargetInstrInfo.h" 40 #include "llvm/CodeGen/TargetRegisterInfo.h" 41 #include "llvm/CodeGen/TargetSubtargetInfo.h" 42 #include "llvm/CodeGenTypes/LowLevelType.h" 43 #include "llvm/IR/BasicBlock.h" 44 #include "llvm/IR/Constants.h" 45 #include "llvm/IR/DataLayout.h" 46 #include "llvm/IR/DebugInfoMetadata.h" 47 #include "llvm/IR/DebugLoc.h" 48 #include "llvm/IR/Function.h" 49 #include "llvm/IR/InstrTypes.h" 50 #include "llvm/IR/Instructions.h" 51 #include "llvm/IR/Intrinsics.h" 52 #include "llvm/IR/Metadata.h" 53 #include "llvm/IR/Module.h" 54 #include "llvm/IR/ModuleSlotTracker.h" 55 #include "llvm/IR/Type.h" 56 #include "llvm/IR/Value.h" 57 #include "llvm/IR/ValueSymbolTable.h" 58 #include "llvm/MC/LaneBitmask.h" 59 #include "llvm/MC/MCContext.h" 60 #include "llvm/MC/MCDwarf.h" 61 #include "llvm/MC/MCInstrDesc.h" 62 #include "llvm/Support/AtomicOrdering.h" 63 #include "llvm/Support/BranchProbability.h" 64 #include "llvm/Support/Casting.h" 65 #include "llvm/Support/ErrorHandling.h" 66 #include "llvm/Support/MemoryBuffer.h" 67 #include "llvm/Support/SMLoc.h" 68 #include "llvm/Support/SourceMgr.h" 69 #include "llvm/Target/TargetMachine.h" 70 #include <cassert> 71 #include <cctype> 72 #include <cstddef> 73 #include <cstdint> 74 #include <limits> 75 #include <string> 76 #include <utility> 77 78 using namespace llvm; 79 80 void PerTargetMIParsingState::setTarget( 81 const TargetSubtargetInfo &NewSubtarget) { 82 83 // If the subtarget changed, over conservatively assume everything is invalid. 84 if (&Subtarget == &NewSubtarget) 85 return; 86 87 Names2InstrOpCodes.clear(); 88 Names2Regs.clear(); 89 Names2RegMasks.clear(); 90 Names2SubRegIndices.clear(); 91 Names2TargetIndices.clear(); 92 Names2DirectTargetFlags.clear(); 93 Names2BitmaskTargetFlags.clear(); 94 Names2MMOTargetFlags.clear(); 95 96 initNames2RegClasses(); 97 initNames2RegBanks(); 98 } 99 100 void PerTargetMIParsingState::initNames2Regs() { 101 if (!Names2Regs.empty()) 102 return; 103 104 // The '%noreg' register is the register 0. 105 Names2Regs.insert(std::make_pair("noreg", 0)); 106 const auto *TRI = Subtarget.getRegisterInfo(); 107 assert(TRI && "Expected target register info"); 108 109 for (unsigned I = 0, E = TRI->getNumRegs(); I < E; ++I) { 110 bool WasInserted = 111 Names2Regs.insert(std::make_pair(StringRef(TRI->getName(I)).lower(), I)) 112 .second; 113 (void)WasInserted; 114 assert(WasInserted && "Expected registers to be unique case-insensitively"); 115 } 116 } 117 118 bool PerTargetMIParsingState::getRegisterByName(StringRef RegName, 119 Register &Reg) { 120 initNames2Regs(); 121 auto RegInfo = Names2Regs.find(RegName); 122 if (RegInfo == Names2Regs.end()) 123 return true; 124 Reg = RegInfo->getValue(); 125 return false; 126 } 127 128 bool PerTargetMIParsingState::getVRegFlagValue(StringRef FlagName, 129 uint8_t &FlagValue) const { 130 const auto *TRI = Subtarget.getRegisterInfo(); 131 std::optional<uint8_t> FV = TRI->getVRegFlagValue(FlagName); 132 if (!FV) 133 return true; 134 FlagValue = *FV; 135 return false; 136 } 137 138 void PerTargetMIParsingState::initNames2InstrOpCodes() { 139 if (!Names2InstrOpCodes.empty()) 140 return; 141 const auto *TII = Subtarget.getInstrInfo(); 142 assert(TII && "Expected target instruction info"); 143 for (unsigned I = 0, E = TII->getNumOpcodes(); I < E; ++I) 144 Names2InstrOpCodes.insert(std::make_pair(StringRef(TII->getName(I)), I)); 145 } 146 147 bool PerTargetMIParsingState::parseInstrName(StringRef InstrName, 148 unsigned &OpCode) { 149 initNames2InstrOpCodes(); 150 auto InstrInfo = Names2InstrOpCodes.find(InstrName); 151 if (InstrInfo == Names2InstrOpCodes.end()) 152 return true; 153 OpCode = InstrInfo->getValue(); 154 return false; 155 } 156 157 void PerTargetMIParsingState::initNames2RegMasks() { 158 if (!Names2RegMasks.empty()) 159 return; 160 const auto *TRI = Subtarget.getRegisterInfo(); 161 assert(TRI && "Expected target register info"); 162 ArrayRef<const uint32_t *> RegMasks = TRI->getRegMasks(); 163 ArrayRef<const char *> RegMaskNames = TRI->getRegMaskNames(); 164 assert(RegMasks.size() == RegMaskNames.size()); 165 for (size_t I = 0, E = RegMasks.size(); I < E; ++I) 166 Names2RegMasks.insert( 167 std::make_pair(StringRef(RegMaskNames[I]).lower(), RegMasks[I])); 168 } 169 170 const uint32_t *PerTargetMIParsingState::getRegMask(StringRef Identifier) { 171 initNames2RegMasks(); 172 auto RegMaskInfo = Names2RegMasks.find(Identifier); 173 if (RegMaskInfo == Names2RegMasks.end()) 174 return nullptr; 175 return RegMaskInfo->getValue(); 176 } 177 178 void PerTargetMIParsingState::initNames2SubRegIndices() { 179 if (!Names2SubRegIndices.empty()) 180 return; 181 const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo(); 182 for (unsigned I = 1, E = TRI->getNumSubRegIndices(); I < E; ++I) 183 Names2SubRegIndices.insert( 184 std::make_pair(TRI->getSubRegIndexName(I), I)); 185 } 186 187 unsigned PerTargetMIParsingState::getSubRegIndex(StringRef Name) { 188 initNames2SubRegIndices(); 189 auto SubRegInfo = Names2SubRegIndices.find(Name); 190 if (SubRegInfo == Names2SubRegIndices.end()) 191 return 0; 192 return SubRegInfo->getValue(); 193 } 194 195 void PerTargetMIParsingState::initNames2TargetIndices() { 196 if (!Names2TargetIndices.empty()) 197 return; 198 const auto *TII = Subtarget.getInstrInfo(); 199 assert(TII && "Expected target instruction info"); 200 auto Indices = TII->getSerializableTargetIndices(); 201 for (const auto &I : Indices) 202 Names2TargetIndices.insert(std::make_pair(StringRef(I.second), I.first)); 203 } 204 205 bool PerTargetMIParsingState::getTargetIndex(StringRef Name, int &Index) { 206 initNames2TargetIndices(); 207 auto IndexInfo = Names2TargetIndices.find(Name); 208 if (IndexInfo == Names2TargetIndices.end()) 209 return true; 210 Index = IndexInfo->second; 211 return false; 212 } 213 214 void PerTargetMIParsingState::initNames2DirectTargetFlags() { 215 if (!Names2DirectTargetFlags.empty()) 216 return; 217 218 const auto *TII = Subtarget.getInstrInfo(); 219 assert(TII && "Expected target instruction info"); 220 auto Flags = TII->getSerializableDirectMachineOperandTargetFlags(); 221 for (const auto &I : Flags) 222 Names2DirectTargetFlags.insert( 223 std::make_pair(StringRef(I.second), I.first)); 224 } 225 226 bool PerTargetMIParsingState::getDirectTargetFlag(StringRef Name, 227 unsigned &Flag) { 228 initNames2DirectTargetFlags(); 229 auto FlagInfo = Names2DirectTargetFlags.find(Name); 230 if (FlagInfo == Names2DirectTargetFlags.end()) 231 return true; 232 Flag = FlagInfo->second; 233 return false; 234 } 235 236 void PerTargetMIParsingState::initNames2BitmaskTargetFlags() { 237 if (!Names2BitmaskTargetFlags.empty()) 238 return; 239 240 const auto *TII = Subtarget.getInstrInfo(); 241 assert(TII && "Expected target instruction info"); 242 auto Flags = TII->getSerializableBitmaskMachineOperandTargetFlags(); 243 for (const auto &I : Flags) 244 Names2BitmaskTargetFlags.insert( 245 std::make_pair(StringRef(I.second), I.first)); 246 } 247 248 bool PerTargetMIParsingState::getBitmaskTargetFlag(StringRef Name, 249 unsigned &Flag) { 250 initNames2BitmaskTargetFlags(); 251 auto FlagInfo = Names2BitmaskTargetFlags.find(Name); 252 if (FlagInfo == Names2BitmaskTargetFlags.end()) 253 return true; 254 Flag = FlagInfo->second; 255 return false; 256 } 257 258 void PerTargetMIParsingState::initNames2MMOTargetFlags() { 259 if (!Names2MMOTargetFlags.empty()) 260 return; 261 262 const auto *TII = Subtarget.getInstrInfo(); 263 assert(TII && "Expected target instruction info"); 264 auto Flags = TII->getSerializableMachineMemOperandTargetFlags(); 265 for (const auto &I : Flags) 266 Names2MMOTargetFlags.insert(std::make_pair(StringRef(I.second), I.first)); 267 } 268 269 bool PerTargetMIParsingState::getMMOTargetFlag(StringRef Name, 270 MachineMemOperand::Flags &Flag) { 271 initNames2MMOTargetFlags(); 272 auto FlagInfo = Names2MMOTargetFlags.find(Name); 273 if (FlagInfo == Names2MMOTargetFlags.end()) 274 return true; 275 Flag = FlagInfo->second; 276 return false; 277 } 278 279 void PerTargetMIParsingState::initNames2RegClasses() { 280 if (!Names2RegClasses.empty()) 281 return; 282 283 const TargetRegisterInfo *TRI = Subtarget.getRegisterInfo(); 284 for (unsigned I = 0, E = TRI->getNumRegClasses(); I < E; ++I) { 285 const auto *RC = TRI->getRegClass(I); 286 Names2RegClasses.insert( 287 std::make_pair(StringRef(TRI->getRegClassName(RC)).lower(), RC)); 288 } 289 } 290 291 void PerTargetMIParsingState::initNames2RegBanks() { 292 if (!Names2RegBanks.empty()) 293 return; 294 295 const RegisterBankInfo *RBI = Subtarget.getRegBankInfo(); 296 // If the target does not support GlobalISel, we may not have a 297 // register bank info. 298 if (!RBI) 299 return; 300 301 for (unsigned I = 0, E = RBI->getNumRegBanks(); I < E; ++I) { 302 const auto &RegBank = RBI->getRegBank(I); 303 Names2RegBanks.insert( 304 std::make_pair(StringRef(RegBank.getName()).lower(), &RegBank)); 305 } 306 } 307 308 const TargetRegisterClass * 309 PerTargetMIParsingState::getRegClass(StringRef Name) { 310 auto RegClassInfo = Names2RegClasses.find(Name); 311 if (RegClassInfo == Names2RegClasses.end()) 312 return nullptr; 313 return RegClassInfo->getValue(); 314 } 315 316 const RegisterBank *PerTargetMIParsingState::getRegBank(StringRef Name) { 317 auto RegBankInfo = Names2RegBanks.find(Name); 318 if (RegBankInfo == Names2RegBanks.end()) 319 return nullptr; 320 return RegBankInfo->getValue(); 321 } 322 323 PerFunctionMIParsingState::PerFunctionMIParsingState(MachineFunction &MF, 324 SourceMgr &SM, const SlotMapping &IRSlots, PerTargetMIParsingState &T) 325 : MF(MF), SM(&SM), IRSlots(IRSlots), Target(T) { 326 } 327 328 VRegInfo &PerFunctionMIParsingState::getVRegInfo(Register Num) { 329 auto I = VRegInfos.try_emplace(Num); 330 if (I.second) { 331 MachineRegisterInfo &MRI = MF.getRegInfo(); 332 VRegInfo *Info = new (Allocator) VRegInfo; 333 Info->VReg = MRI.createIncompleteVirtualRegister(); 334 I.first->second = Info; 335 } 336 return *I.first->second; 337 } 338 339 VRegInfo &PerFunctionMIParsingState::getVRegInfoNamed(StringRef RegName) { 340 assert(RegName != "" && "Expected named reg."); 341 342 auto I = VRegInfosNamed.try_emplace(RegName.str()); 343 if (I.second) { 344 VRegInfo *Info = new (Allocator) VRegInfo; 345 Info->VReg = MF.getRegInfo().createIncompleteVirtualRegister(RegName); 346 I.first->second = Info; 347 } 348 return *I.first->second; 349 } 350 351 static void mapValueToSlot(const Value *V, ModuleSlotTracker &MST, 352 DenseMap<unsigned, const Value *> &Slots2Values) { 353 int Slot = MST.getLocalSlot(V); 354 if (Slot == -1) 355 return; 356 Slots2Values.insert(std::make_pair(unsigned(Slot), V)); 357 } 358 359 /// Creates the mapping from slot numbers to function's unnamed IR values. 360 static void initSlots2Values(const Function &F, 361 DenseMap<unsigned, const Value *> &Slots2Values) { 362 ModuleSlotTracker MST(F.getParent(), /*ShouldInitializeAllMetadata=*/false); 363 MST.incorporateFunction(F); 364 for (const auto &Arg : F.args()) 365 mapValueToSlot(&Arg, MST, Slots2Values); 366 for (const auto &BB : F) { 367 mapValueToSlot(&BB, MST, Slots2Values); 368 for (const auto &I : BB) 369 mapValueToSlot(&I, MST, Slots2Values); 370 } 371 } 372 373 const Value* PerFunctionMIParsingState::getIRValue(unsigned Slot) { 374 if (Slots2Values.empty()) 375 initSlots2Values(MF.getFunction(), Slots2Values); 376 return Slots2Values.lookup(Slot); 377 } 378 379 namespace { 380 381 /// A wrapper struct around the 'MachineOperand' struct that includes a source 382 /// range and other attributes. 383 struct ParsedMachineOperand { 384 MachineOperand Operand; 385 StringRef::iterator Begin; 386 StringRef::iterator End; 387 std::optional<unsigned> TiedDefIdx; 388 389 ParsedMachineOperand(const MachineOperand &Operand, StringRef::iterator Begin, 390 StringRef::iterator End, 391 std::optional<unsigned> &TiedDefIdx) 392 : Operand(Operand), Begin(Begin), End(End), TiedDefIdx(TiedDefIdx) { 393 if (TiedDefIdx) 394 assert(Operand.isReg() && Operand.isUse() && 395 "Only used register operands can be tied"); 396 } 397 }; 398 399 class MIParser { 400 MachineFunction &MF; 401 SMDiagnostic &Error; 402 StringRef Source, CurrentSource; 403 SMRange SourceRange; 404 MIToken Token; 405 PerFunctionMIParsingState &PFS; 406 /// Maps from slot numbers to function's unnamed basic blocks. 407 DenseMap<unsigned, const BasicBlock *> Slots2BasicBlocks; 408 409 public: 410 MIParser(PerFunctionMIParsingState &PFS, SMDiagnostic &Error, 411 StringRef Source); 412 MIParser(PerFunctionMIParsingState &PFS, SMDiagnostic &Error, 413 StringRef Source, SMRange SourceRange); 414 415 /// \p SkipChar gives the number of characters to skip before looking 416 /// for the next token. 417 void lex(unsigned SkipChar = 0); 418 419 /// Report an error at the current location with the given message. 420 /// 421 /// This function always return true. 422 bool error(const Twine &Msg); 423 424 /// Report an error at the given location with the given message. 425 /// 426 /// This function always return true. 427 bool error(StringRef::iterator Loc, const Twine &Msg); 428 429 bool 430 parseBasicBlockDefinitions(DenseMap<unsigned, MachineBasicBlock *> &MBBSlots); 431 bool parseBasicBlocks(); 432 bool parse(MachineInstr *&MI); 433 bool parseStandaloneMBB(MachineBasicBlock *&MBB); 434 bool parseStandaloneNamedRegister(Register &Reg); 435 bool parseStandaloneVirtualRegister(VRegInfo *&Info); 436 bool parseStandaloneRegister(Register &Reg); 437 bool parseStandaloneStackObject(int &FI); 438 bool parseStandaloneMDNode(MDNode *&Node); 439 bool parseMachineMetadata(); 440 bool parseMDTuple(MDNode *&MD, bool IsDistinct); 441 bool parseMDNodeVector(SmallVectorImpl<Metadata *> &Elts); 442 bool parseMetadata(Metadata *&MD); 443 444 bool 445 parseBasicBlockDefinition(DenseMap<unsigned, MachineBasicBlock *> &MBBSlots); 446 bool parseBasicBlock(MachineBasicBlock &MBB, 447 MachineBasicBlock *&AddFalthroughFrom); 448 bool parseBasicBlockLiveins(MachineBasicBlock &MBB); 449 bool parseBasicBlockSuccessors(MachineBasicBlock &MBB); 450 451 bool parseNamedRegister(Register &Reg); 452 bool parseVirtualRegister(VRegInfo *&Info); 453 bool parseNamedVirtualRegister(VRegInfo *&Info); 454 bool parseRegister(Register &Reg, VRegInfo *&VRegInfo); 455 bool parseRegisterFlag(unsigned &Flags); 456 bool parseRegisterClassOrBank(VRegInfo &RegInfo); 457 bool parseSubRegisterIndex(unsigned &SubReg); 458 bool parseRegisterTiedDefIndex(unsigned &TiedDefIdx); 459 bool parseRegisterOperand(MachineOperand &Dest, 460 std::optional<unsigned> &TiedDefIdx, 461 bool IsDef = false); 462 bool parseImmediateOperand(MachineOperand &Dest); 463 bool parseIRConstant(StringRef::iterator Loc, StringRef StringValue, 464 const Constant *&C); 465 bool parseIRConstant(StringRef::iterator Loc, const Constant *&C); 466 bool parseLowLevelType(StringRef::iterator Loc, LLT &Ty); 467 bool parseTypedImmediateOperand(MachineOperand &Dest); 468 bool parseFPImmediateOperand(MachineOperand &Dest); 469 bool parseMBBReference(MachineBasicBlock *&MBB); 470 bool parseMBBOperand(MachineOperand &Dest); 471 bool parseStackFrameIndex(int &FI); 472 bool parseStackObjectOperand(MachineOperand &Dest); 473 bool parseFixedStackFrameIndex(int &FI); 474 bool parseFixedStackObjectOperand(MachineOperand &Dest); 475 bool parseGlobalValue(GlobalValue *&GV); 476 bool parseGlobalAddressOperand(MachineOperand &Dest); 477 bool parseConstantPoolIndexOperand(MachineOperand &Dest); 478 bool parseSubRegisterIndexOperand(MachineOperand &Dest); 479 bool parseJumpTableIndexOperand(MachineOperand &Dest); 480 bool parseExternalSymbolOperand(MachineOperand &Dest); 481 bool parseMCSymbolOperand(MachineOperand &Dest); 482 [[nodiscard]] bool parseMDNode(MDNode *&Node); 483 bool parseDIExpression(MDNode *&Expr); 484 bool parseDILocation(MDNode *&Expr); 485 bool parseMetadataOperand(MachineOperand &Dest); 486 bool parseCFIOffset(int &Offset); 487 bool parseCFIRegister(unsigned &Reg); 488 bool parseCFIAddressSpace(unsigned &AddressSpace); 489 bool parseCFIEscapeValues(std::string& Values); 490 bool parseCFIOperand(MachineOperand &Dest); 491 bool parseIRBlock(BasicBlock *&BB, const Function &F); 492 bool parseBlockAddressOperand(MachineOperand &Dest); 493 bool parseIntrinsicOperand(MachineOperand &Dest); 494 bool parsePredicateOperand(MachineOperand &Dest); 495 bool parseShuffleMaskOperand(MachineOperand &Dest); 496 bool parseTargetIndexOperand(MachineOperand &Dest); 497 bool parseDbgInstrRefOperand(MachineOperand &Dest); 498 bool parseCustomRegisterMaskOperand(MachineOperand &Dest); 499 bool parseLiveoutRegisterMaskOperand(MachineOperand &Dest); 500 bool parseMachineOperand(const unsigned OpCode, const unsigned OpIdx, 501 MachineOperand &Dest, 502 std::optional<unsigned> &TiedDefIdx); 503 bool parseMachineOperandAndTargetFlags(const unsigned OpCode, 504 const unsigned OpIdx, 505 MachineOperand &Dest, 506 std::optional<unsigned> &TiedDefIdx); 507 bool parseOffset(int64_t &Offset); 508 bool parseIRBlockAddressTaken(BasicBlock *&BB); 509 bool parseAlignment(uint64_t &Alignment); 510 bool parseAddrspace(unsigned &Addrspace); 511 bool parseSectionID(std::optional<MBBSectionID> &SID); 512 bool parseBBID(std::optional<UniqueBBID> &BBID); 513 bool parseCallFrameSize(unsigned &CallFrameSize); 514 bool parseOperandsOffset(MachineOperand &Op); 515 bool parseIRValue(const Value *&V); 516 bool parseMemoryOperandFlag(MachineMemOperand::Flags &Flags); 517 bool parseMemoryPseudoSourceValue(const PseudoSourceValue *&PSV); 518 bool parseMachinePointerInfo(MachinePointerInfo &Dest); 519 bool parseOptionalScope(LLVMContext &Context, SyncScope::ID &SSID); 520 bool parseOptionalAtomicOrdering(AtomicOrdering &Order); 521 bool parseMachineMemoryOperand(MachineMemOperand *&Dest); 522 bool parsePreOrPostInstrSymbol(MCSymbol *&Symbol); 523 bool parseHeapAllocMarker(MDNode *&Node); 524 bool parsePCSections(MDNode *&Node); 525 526 bool parseTargetImmMnemonic(const unsigned OpCode, const unsigned OpIdx, 527 MachineOperand &Dest, const MIRFormatter &MF); 528 529 private: 530 /// Convert the integer literal in the current token into an unsigned integer. 531 /// 532 /// Return true if an error occurred. 533 bool getUnsigned(unsigned &Result); 534 535 /// Convert the integer literal in the current token into an uint64. 536 /// 537 /// Return true if an error occurred. 538 bool getUint64(uint64_t &Result); 539 540 /// Convert the hexadecimal literal in the current token into an unsigned 541 /// APInt with a minimum bitwidth required to represent the value. 542 /// 543 /// Return true if the literal does not represent an integer value. 544 bool getHexUint(APInt &Result); 545 546 /// If the current token is of the given kind, consume it and return false. 547 /// Otherwise report an error and return true. 548 bool expectAndConsume(MIToken::TokenKind TokenKind); 549 550 /// If the current token is of the given kind, consume it and return true. 551 /// Otherwise return false. 552 bool consumeIfPresent(MIToken::TokenKind TokenKind); 553 554 bool parseInstruction(unsigned &OpCode, unsigned &Flags); 555 556 bool assignRegisterTies(MachineInstr &MI, 557 ArrayRef<ParsedMachineOperand> Operands); 558 559 bool verifyImplicitOperands(ArrayRef<ParsedMachineOperand> Operands, 560 const MCInstrDesc &MCID); 561 562 const BasicBlock *getIRBlock(unsigned Slot); 563 const BasicBlock *getIRBlock(unsigned Slot, const Function &F); 564 565 /// Get or create an MCSymbol for a given name. 566 MCSymbol *getOrCreateMCSymbol(StringRef Name); 567 568 /// parseStringConstant 569 /// ::= StringConstant 570 bool parseStringConstant(std::string &Result); 571 572 /// Map the location in the MI string to the corresponding location specified 573 /// in `SourceRange`. 574 SMLoc mapSMLoc(StringRef::iterator Loc); 575 }; 576 577 } // end anonymous namespace 578 579 MIParser::MIParser(PerFunctionMIParsingState &PFS, SMDiagnostic &Error, 580 StringRef Source) 581 : MF(PFS.MF), Error(Error), Source(Source), CurrentSource(Source), PFS(PFS) 582 {} 583 584 MIParser::MIParser(PerFunctionMIParsingState &PFS, SMDiagnostic &Error, 585 StringRef Source, SMRange SourceRange) 586 : MF(PFS.MF), Error(Error), Source(Source), CurrentSource(Source), 587 SourceRange(SourceRange), PFS(PFS) {} 588 589 void MIParser::lex(unsigned SkipChar) { 590 CurrentSource = lexMIToken( 591 CurrentSource.substr(SkipChar), Token, 592 [this](StringRef::iterator Loc, const Twine &Msg) { error(Loc, Msg); }); 593 } 594 595 bool MIParser::error(const Twine &Msg) { return error(Token.location(), Msg); } 596 597 bool MIParser::error(StringRef::iterator Loc, const Twine &Msg) { 598 const SourceMgr &SM = *PFS.SM; 599 assert(Loc >= Source.data() && Loc <= (Source.data() + Source.size())); 600 const MemoryBuffer &Buffer = *SM.getMemoryBuffer(SM.getMainFileID()); 601 if (Loc >= Buffer.getBufferStart() && Loc <= Buffer.getBufferEnd()) { 602 // Create an ordinary diagnostic when the source manager's buffer is the 603 // source string. 604 Error = SM.GetMessage(SMLoc::getFromPointer(Loc), SourceMgr::DK_Error, Msg); 605 return true; 606 } 607 // Create a diagnostic for a YAML string literal. 608 Error = SMDiagnostic(SM, SMLoc(), Buffer.getBufferIdentifier(), 1, 609 Loc - Source.data(), SourceMgr::DK_Error, Msg.str(), 610 Source, {}, {}); 611 return true; 612 } 613 614 SMLoc MIParser::mapSMLoc(StringRef::iterator Loc) { 615 assert(SourceRange.isValid() && "Invalid source range"); 616 assert(Loc >= Source.data() && Loc <= (Source.data() + Source.size())); 617 return SMLoc::getFromPointer(SourceRange.Start.getPointer() + 618 (Loc - Source.data())); 619 } 620 621 typedef function_ref<bool(StringRef::iterator Loc, const Twine &)> 622 ErrorCallbackType; 623 624 static const char *toString(MIToken::TokenKind TokenKind) { 625 switch (TokenKind) { 626 case MIToken::comma: 627 return "','"; 628 case MIToken::equal: 629 return "'='"; 630 case MIToken::colon: 631 return "':'"; 632 case MIToken::lparen: 633 return "'('"; 634 case MIToken::rparen: 635 return "')'"; 636 default: 637 return "<unknown token>"; 638 } 639 } 640 641 bool MIParser::expectAndConsume(MIToken::TokenKind TokenKind) { 642 if (Token.isNot(TokenKind)) 643 return error(Twine("expected ") + toString(TokenKind)); 644 lex(); 645 return false; 646 } 647 648 bool MIParser::consumeIfPresent(MIToken::TokenKind TokenKind) { 649 if (Token.isNot(TokenKind)) 650 return false; 651 lex(); 652 return true; 653 } 654 655 // Parse Machine Basic Block Section ID. 656 bool MIParser::parseSectionID(std::optional<MBBSectionID> &SID) { 657 assert(Token.is(MIToken::kw_bbsections)); 658 lex(); 659 if (Token.is(MIToken::IntegerLiteral)) { 660 unsigned Value = 0; 661 if (getUnsigned(Value)) 662 return error("Unknown Section ID"); 663 SID = MBBSectionID{Value}; 664 } else { 665 const StringRef &S = Token.stringValue(); 666 if (S == "Exception") 667 SID = MBBSectionID::ExceptionSectionID; 668 else if (S == "Cold") 669 SID = MBBSectionID::ColdSectionID; 670 else 671 return error("Unknown Section ID"); 672 } 673 lex(); 674 return false; 675 } 676 677 // Parse Machine Basic Block ID. 678 bool MIParser::parseBBID(std::optional<UniqueBBID> &BBID) { 679 assert(Token.is(MIToken::kw_bb_id)); 680 lex(); 681 unsigned BaseID = 0; 682 unsigned CloneID = 0; 683 if (getUnsigned(BaseID)) 684 return error("Unknown BB ID"); 685 lex(); 686 if (Token.is(MIToken::IntegerLiteral)) { 687 if (getUnsigned(CloneID)) 688 return error("Unknown Clone ID"); 689 lex(); 690 } 691 BBID = {BaseID, CloneID}; 692 return false; 693 } 694 695 // Parse basic block call frame size. 696 bool MIParser::parseCallFrameSize(unsigned &CallFrameSize) { 697 assert(Token.is(MIToken::kw_call_frame_size)); 698 lex(); 699 unsigned Value = 0; 700 if (getUnsigned(Value)) 701 return error("Unknown call frame size"); 702 CallFrameSize = Value; 703 lex(); 704 return false; 705 } 706 707 bool MIParser::parseBasicBlockDefinition( 708 DenseMap<unsigned, MachineBasicBlock *> &MBBSlots) { 709 assert(Token.is(MIToken::MachineBasicBlockLabel)); 710 unsigned ID = 0; 711 if (getUnsigned(ID)) 712 return true; 713 auto Loc = Token.location(); 714 auto Name = Token.stringValue(); 715 lex(); 716 bool MachineBlockAddressTaken = false; 717 BasicBlock *AddressTakenIRBlock = nullptr; 718 bool IsLandingPad = false; 719 bool IsInlineAsmBrIndirectTarget = false; 720 bool IsEHFuncletEntry = false; 721 std::optional<MBBSectionID> SectionID; 722 uint64_t Alignment = 0; 723 std::optional<UniqueBBID> BBID; 724 unsigned CallFrameSize = 0; 725 BasicBlock *BB = nullptr; 726 if (consumeIfPresent(MIToken::lparen)) { 727 do { 728 // TODO: Report an error when multiple same attributes are specified. 729 switch (Token.kind()) { 730 case MIToken::kw_machine_block_address_taken: 731 MachineBlockAddressTaken = true; 732 lex(); 733 break; 734 case MIToken::kw_ir_block_address_taken: 735 if (parseIRBlockAddressTaken(AddressTakenIRBlock)) 736 return true; 737 break; 738 case MIToken::kw_landing_pad: 739 IsLandingPad = true; 740 lex(); 741 break; 742 case MIToken::kw_inlineasm_br_indirect_target: 743 IsInlineAsmBrIndirectTarget = true; 744 lex(); 745 break; 746 case MIToken::kw_ehfunclet_entry: 747 IsEHFuncletEntry = true; 748 lex(); 749 break; 750 case MIToken::kw_align: 751 if (parseAlignment(Alignment)) 752 return true; 753 break; 754 case MIToken::IRBlock: 755 case MIToken::NamedIRBlock: 756 // TODO: Report an error when both name and ir block are specified. 757 if (parseIRBlock(BB, MF.getFunction())) 758 return true; 759 lex(); 760 break; 761 case MIToken::kw_bbsections: 762 if (parseSectionID(SectionID)) 763 return true; 764 break; 765 case MIToken::kw_bb_id: 766 if (parseBBID(BBID)) 767 return true; 768 break; 769 case MIToken::kw_call_frame_size: 770 if (parseCallFrameSize(CallFrameSize)) 771 return true; 772 break; 773 default: 774 break; 775 } 776 } while (consumeIfPresent(MIToken::comma)); 777 if (expectAndConsume(MIToken::rparen)) 778 return true; 779 } 780 if (expectAndConsume(MIToken::colon)) 781 return true; 782 783 if (!Name.empty()) { 784 BB = dyn_cast_or_null<BasicBlock>( 785 MF.getFunction().getValueSymbolTable()->lookup(Name)); 786 if (!BB) 787 return error(Loc, Twine("basic block '") + Name + 788 "' is not defined in the function '" + 789 MF.getName() + "'"); 790 } 791 auto *MBB = MF.CreateMachineBasicBlock(BB, BBID); 792 MF.insert(MF.end(), MBB); 793 bool WasInserted = MBBSlots.insert(std::make_pair(ID, MBB)).second; 794 if (!WasInserted) 795 return error(Loc, Twine("redefinition of machine basic block with id #") + 796 Twine(ID)); 797 if (Alignment) 798 MBB->setAlignment(Align(Alignment)); 799 if (MachineBlockAddressTaken) 800 MBB->setMachineBlockAddressTaken(); 801 if (AddressTakenIRBlock) 802 MBB->setAddressTakenIRBlock(AddressTakenIRBlock); 803 MBB->setIsEHPad(IsLandingPad); 804 MBB->setIsInlineAsmBrIndirectTarget(IsInlineAsmBrIndirectTarget); 805 MBB->setIsEHFuncletEntry(IsEHFuncletEntry); 806 if (SectionID) { 807 MBB->setSectionID(*SectionID); 808 MF.setBBSectionsType(BasicBlockSection::List); 809 } 810 MBB->setCallFrameSize(CallFrameSize); 811 return false; 812 } 813 814 bool MIParser::parseBasicBlockDefinitions( 815 DenseMap<unsigned, MachineBasicBlock *> &MBBSlots) { 816 lex(); 817 // Skip until the first machine basic block. 818 while (Token.is(MIToken::Newline)) 819 lex(); 820 if (Token.isErrorOrEOF()) 821 return Token.isError(); 822 if (Token.isNot(MIToken::MachineBasicBlockLabel)) 823 return error("expected a basic block definition before instructions"); 824 unsigned BraceDepth = 0; 825 do { 826 if (parseBasicBlockDefinition(MBBSlots)) 827 return true; 828 bool IsAfterNewline = false; 829 // Skip until the next machine basic block. 830 while (true) { 831 if ((Token.is(MIToken::MachineBasicBlockLabel) && IsAfterNewline) || 832 Token.isErrorOrEOF()) 833 break; 834 else if (Token.is(MIToken::MachineBasicBlockLabel)) 835 return error("basic block definition should be located at the start of " 836 "the line"); 837 else if (consumeIfPresent(MIToken::Newline)) { 838 IsAfterNewline = true; 839 continue; 840 } 841 IsAfterNewline = false; 842 if (Token.is(MIToken::lbrace)) 843 ++BraceDepth; 844 if (Token.is(MIToken::rbrace)) { 845 if (!BraceDepth) 846 return error("extraneous closing brace ('}')"); 847 --BraceDepth; 848 } 849 lex(); 850 } 851 // Verify that we closed all of the '{' at the end of a file or a block. 852 if (!Token.isError() && BraceDepth) 853 return error("expected '}'"); // FIXME: Report a note that shows '{'. 854 } while (!Token.isErrorOrEOF()); 855 return Token.isError(); 856 } 857 858 bool MIParser::parseBasicBlockLiveins(MachineBasicBlock &MBB) { 859 assert(Token.is(MIToken::kw_liveins)); 860 lex(); 861 if (expectAndConsume(MIToken::colon)) 862 return true; 863 if (Token.isNewlineOrEOF()) // Allow an empty list of liveins. 864 return false; 865 do { 866 if (Token.isNot(MIToken::NamedRegister)) 867 return error("expected a named register"); 868 Register Reg; 869 if (parseNamedRegister(Reg)) 870 return true; 871 lex(); 872 LaneBitmask Mask = LaneBitmask::getAll(); 873 if (consumeIfPresent(MIToken::colon)) { 874 // Parse lane mask. 875 if (Token.isNot(MIToken::IntegerLiteral) && 876 Token.isNot(MIToken::HexLiteral)) 877 return error("expected a lane mask"); 878 static_assert(sizeof(LaneBitmask::Type) == sizeof(uint64_t), 879 "Use correct get-function for lane mask"); 880 LaneBitmask::Type V; 881 if (getUint64(V)) 882 return error("invalid lane mask value"); 883 Mask = LaneBitmask(V); 884 lex(); 885 } 886 MBB.addLiveIn(Reg, Mask); 887 } while (consumeIfPresent(MIToken::comma)); 888 return false; 889 } 890 891 bool MIParser::parseBasicBlockSuccessors(MachineBasicBlock &MBB) { 892 assert(Token.is(MIToken::kw_successors)); 893 lex(); 894 if (expectAndConsume(MIToken::colon)) 895 return true; 896 if (Token.isNewlineOrEOF()) // Allow an empty list of successors. 897 return false; 898 do { 899 if (Token.isNot(MIToken::MachineBasicBlock)) 900 return error("expected a machine basic block reference"); 901 MachineBasicBlock *SuccMBB = nullptr; 902 if (parseMBBReference(SuccMBB)) 903 return true; 904 lex(); 905 unsigned Weight = 0; 906 if (consumeIfPresent(MIToken::lparen)) { 907 if (Token.isNot(MIToken::IntegerLiteral) && 908 Token.isNot(MIToken::HexLiteral)) 909 return error("expected an integer literal after '('"); 910 if (getUnsigned(Weight)) 911 return true; 912 lex(); 913 if (expectAndConsume(MIToken::rparen)) 914 return true; 915 } 916 MBB.addSuccessor(SuccMBB, BranchProbability::getRaw(Weight)); 917 } while (consumeIfPresent(MIToken::comma)); 918 MBB.normalizeSuccProbs(); 919 return false; 920 } 921 922 bool MIParser::parseBasicBlock(MachineBasicBlock &MBB, 923 MachineBasicBlock *&AddFalthroughFrom) { 924 // Skip the definition. 925 assert(Token.is(MIToken::MachineBasicBlockLabel)); 926 lex(); 927 if (consumeIfPresent(MIToken::lparen)) { 928 while (Token.isNot(MIToken::rparen) && !Token.isErrorOrEOF()) 929 lex(); 930 consumeIfPresent(MIToken::rparen); 931 } 932 consumeIfPresent(MIToken::colon); 933 934 // Parse the liveins and successors. 935 // N.B: Multiple lists of successors and liveins are allowed and they're 936 // merged into one. 937 // Example: 938 // liveins: $edi 939 // liveins: $esi 940 // 941 // is equivalent to 942 // liveins: $edi, $esi 943 bool ExplicitSuccessors = false; 944 while (true) { 945 if (Token.is(MIToken::kw_successors)) { 946 if (parseBasicBlockSuccessors(MBB)) 947 return true; 948 ExplicitSuccessors = true; 949 } else if (Token.is(MIToken::kw_liveins)) { 950 if (parseBasicBlockLiveins(MBB)) 951 return true; 952 } else if (consumeIfPresent(MIToken::Newline)) { 953 continue; 954 } else 955 break; 956 if (!Token.isNewlineOrEOF()) 957 return error("expected line break at the end of a list"); 958 lex(); 959 } 960 961 // Parse the instructions. 962 bool IsInBundle = false; 963 MachineInstr *PrevMI = nullptr; 964 while (!Token.is(MIToken::MachineBasicBlockLabel) && 965 !Token.is(MIToken::Eof)) { 966 if (consumeIfPresent(MIToken::Newline)) 967 continue; 968 if (consumeIfPresent(MIToken::rbrace)) { 969 // The first parsing pass should verify that all closing '}' have an 970 // opening '{'. 971 assert(IsInBundle); 972 IsInBundle = false; 973 continue; 974 } 975 MachineInstr *MI = nullptr; 976 if (parse(MI)) 977 return true; 978 MBB.insert(MBB.end(), MI); 979 if (IsInBundle) { 980 PrevMI->setFlag(MachineInstr::BundledSucc); 981 MI->setFlag(MachineInstr::BundledPred); 982 } 983 PrevMI = MI; 984 if (Token.is(MIToken::lbrace)) { 985 if (IsInBundle) 986 return error("nested instruction bundles are not allowed"); 987 lex(); 988 // This instruction is the start of the bundle. 989 MI->setFlag(MachineInstr::BundledSucc); 990 IsInBundle = true; 991 if (!Token.is(MIToken::Newline)) 992 // The next instruction can be on the same line. 993 continue; 994 } 995 assert(Token.isNewlineOrEOF() && "MI is not fully parsed"); 996 lex(); 997 } 998 999 // Construct successor list by searching for basic block machine operands. 1000 if (!ExplicitSuccessors) { 1001 SmallVector<MachineBasicBlock*,4> Successors; 1002 bool IsFallthrough; 1003 guessSuccessors(MBB, Successors, IsFallthrough); 1004 for (MachineBasicBlock *Succ : Successors) 1005 MBB.addSuccessor(Succ); 1006 1007 if (IsFallthrough) { 1008 AddFalthroughFrom = &MBB; 1009 } else { 1010 MBB.normalizeSuccProbs(); 1011 } 1012 } 1013 1014 return false; 1015 } 1016 1017 bool MIParser::parseBasicBlocks() { 1018 lex(); 1019 // Skip until the first machine basic block. 1020 while (Token.is(MIToken::Newline)) 1021 lex(); 1022 if (Token.isErrorOrEOF()) 1023 return Token.isError(); 1024 // The first parsing pass should have verified that this token is a MBB label 1025 // in the 'parseBasicBlockDefinitions' method. 1026 assert(Token.is(MIToken::MachineBasicBlockLabel)); 1027 MachineBasicBlock *AddFalthroughFrom = nullptr; 1028 do { 1029 MachineBasicBlock *MBB = nullptr; 1030 if (parseMBBReference(MBB)) 1031 return true; 1032 if (AddFalthroughFrom) { 1033 if (!AddFalthroughFrom->isSuccessor(MBB)) 1034 AddFalthroughFrom->addSuccessor(MBB); 1035 AddFalthroughFrom->normalizeSuccProbs(); 1036 AddFalthroughFrom = nullptr; 1037 } 1038 if (parseBasicBlock(*MBB, AddFalthroughFrom)) 1039 return true; 1040 // The method 'parseBasicBlock' should parse the whole block until the next 1041 // block or the end of file. 1042 assert(Token.is(MIToken::MachineBasicBlockLabel) || Token.is(MIToken::Eof)); 1043 } while (Token.isNot(MIToken::Eof)); 1044 return false; 1045 } 1046 1047 bool MIParser::parse(MachineInstr *&MI) { 1048 // Parse any register operands before '=' 1049 MachineOperand MO = MachineOperand::CreateImm(0); 1050 SmallVector<ParsedMachineOperand, 8> Operands; 1051 while (Token.isRegister() || Token.isRegisterFlag()) { 1052 auto Loc = Token.location(); 1053 std::optional<unsigned> TiedDefIdx; 1054 if (parseRegisterOperand(MO, TiedDefIdx, /*IsDef=*/true)) 1055 return true; 1056 Operands.push_back( 1057 ParsedMachineOperand(MO, Loc, Token.location(), TiedDefIdx)); 1058 if (Token.isNot(MIToken::comma)) 1059 break; 1060 lex(); 1061 } 1062 if (!Operands.empty() && expectAndConsume(MIToken::equal)) 1063 return true; 1064 1065 unsigned OpCode, Flags = 0; 1066 if (Token.isError() || parseInstruction(OpCode, Flags)) 1067 return true; 1068 1069 // Parse the remaining machine operands. 1070 while (!Token.isNewlineOrEOF() && Token.isNot(MIToken::kw_pre_instr_symbol) && 1071 Token.isNot(MIToken::kw_post_instr_symbol) && 1072 Token.isNot(MIToken::kw_heap_alloc_marker) && 1073 Token.isNot(MIToken::kw_pcsections) && 1074 Token.isNot(MIToken::kw_cfi_type) && 1075 Token.isNot(MIToken::kw_debug_location) && 1076 Token.isNot(MIToken::kw_debug_instr_number) && 1077 Token.isNot(MIToken::coloncolon) && Token.isNot(MIToken::lbrace)) { 1078 auto Loc = Token.location(); 1079 std::optional<unsigned> TiedDefIdx; 1080 if (parseMachineOperandAndTargetFlags(OpCode, Operands.size(), MO, TiedDefIdx)) 1081 return true; 1082 Operands.push_back( 1083 ParsedMachineOperand(MO, Loc, Token.location(), TiedDefIdx)); 1084 if (Token.isNewlineOrEOF() || Token.is(MIToken::coloncolon) || 1085 Token.is(MIToken::lbrace)) 1086 break; 1087 if (Token.isNot(MIToken::comma)) 1088 return error("expected ',' before the next machine operand"); 1089 lex(); 1090 } 1091 1092 MCSymbol *PreInstrSymbol = nullptr; 1093 if (Token.is(MIToken::kw_pre_instr_symbol)) 1094 if (parsePreOrPostInstrSymbol(PreInstrSymbol)) 1095 return true; 1096 MCSymbol *PostInstrSymbol = nullptr; 1097 if (Token.is(MIToken::kw_post_instr_symbol)) 1098 if (parsePreOrPostInstrSymbol(PostInstrSymbol)) 1099 return true; 1100 MDNode *HeapAllocMarker = nullptr; 1101 if (Token.is(MIToken::kw_heap_alloc_marker)) 1102 if (parseHeapAllocMarker(HeapAllocMarker)) 1103 return true; 1104 MDNode *PCSections = nullptr; 1105 if (Token.is(MIToken::kw_pcsections)) 1106 if (parsePCSections(PCSections)) 1107 return true; 1108 1109 unsigned CFIType = 0; 1110 if (Token.is(MIToken::kw_cfi_type)) { 1111 lex(); 1112 if (Token.isNot(MIToken::IntegerLiteral)) 1113 return error("expected an integer literal after 'cfi-type'"); 1114 // getUnsigned is sufficient for 32-bit integers. 1115 if (getUnsigned(CFIType)) 1116 return true; 1117 lex(); 1118 // Lex past trailing comma if present. 1119 if (Token.is(MIToken::comma)) 1120 lex(); 1121 } 1122 1123 unsigned InstrNum = 0; 1124 if (Token.is(MIToken::kw_debug_instr_number)) { 1125 lex(); 1126 if (Token.isNot(MIToken::IntegerLiteral)) 1127 return error("expected an integer literal after 'debug-instr-number'"); 1128 if (getUnsigned(InstrNum)) 1129 return true; 1130 lex(); 1131 // Lex past trailing comma if present. 1132 if (Token.is(MIToken::comma)) 1133 lex(); 1134 } 1135 1136 DebugLoc DebugLocation; 1137 if (Token.is(MIToken::kw_debug_location)) { 1138 lex(); 1139 MDNode *Node = nullptr; 1140 if (Token.is(MIToken::exclaim)) { 1141 if (parseMDNode(Node)) 1142 return true; 1143 } else if (Token.is(MIToken::md_dilocation)) { 1144 if (parseDILocation(Node)) 1145 return true; 1146 } else 1147 return error("expected a metadata node after 'debug-location'"); 1148 if (!isa<DILocation>(Node)) 1149 return error("referenced metadata is not a DILocation"); 1150 DebugLocation = DebugLoc(Node); 1151 } 1152 1153 // Parse the machine memory operands. 1154 SmallVector<MachineMemOperand *, 2> MemOperands; 1155 if (Token.is(MIToken::coloncolon)) { 1156 lex(); 1157 while (!Token.isNewlineOrEOF()) { 1158 MachineMemOperand *MemOp = nullptr; 1159 if (parseMachineMemoryOperand(MemOp)) 1160 return true; 1161 MemOperands.push_back(MemOp); 1162 if (Token.isNewlineOrEOF()) 1163 break; 1164 if (Token.isNot(MIToken::comma)) 1165 return error("expected ',' before the next machine memory operand"); 1166 lex(); 1167 } 1168 } 1169 1170 const auto &MCID = MF.getSubtarget().getInstrInfo()->get(OpCode); 1171 if (!MCID.isVariadic()) { 1172 // FIXME: Move the implicit operand verification to the machine verifier. 1173 if (verifyImplicitOperands(Operands, MCID)) 1174 return true; 1175 } 1176 1177 MI = MF.CreateMachineInstr(MCID, DebugLocation, /*NoImplicit=*/true); 1178 MI->setFlags(Flags); 1179 1180 // Don't check the operands make sense, let the verifier catch any 1181 // improprieties. 1182 for (const auto &Operand : Operands) 1183 MI->addOperand(MF, Operand.Operand); 1184 1185 if (assignRegisterTies(*MI, Operands)) 1186 return true; 1187 if (PreInstrSymbol) 1188 MI->setPreInstrSymbol(MF, PreInstrSymbol); 1189 if (PostInstrSymbol) 1190 MI->setPostInstrSymbol(MF, PostInstrSymbol); 1191 if (HeapAllocMarker) 1192 MI->setHeapAllocMarker(MF, HeapAllocMarker); 1193 if (PCSections) 1194 MI->setPCSections(MF, PCSections); 1195 if (CFIType) 1196 MI->setCFIType(MF, CFIType); 1197 if (!MemOperands.empty()) 1198 MI->setMemRefs(MF, MemOperands); 1199 if (InstrNum) 1200 MI->setDebugInstrNum(InstrNum); 1201 return false; 1202 } 1203 1204 bool MIParser::parseStandaloneMBB(MachineBasicBlock *&MBB) { 1205 lex(); 1206 if (Token.isNot(MIToken::MachineBasicBlock)) 1207 return error("expected a machine basic block reference"); 1208 if (parseMBBReference(MBB)) 1209 return true; 1210 lex(); 1211 if (Token.isNot(MIToken::Eof)) 1212 return error( 1213 "expected end of string after the machine basic block reference"); 1214 return false; 1215 } 1216 1217 bool MIParser::parseStandaloneNamedRegister(Register &Reg) { 1218 lex(); 1219 if (Token.isNot(MIToken::NamedRegister)) 1220 return error("expected a named register"); 1221 if (parseNamedRegister(Reg)) 1222 return true; 1223 lex(); 1224 if (Token.isNot(MIToken::Eof)) 1225 return error("expected end of string after the register reference"); 1226 return false; 1227 } 1228 1229 bool MIParser::parseStandaloneVirtualRegister(VRegInfo *&Info) { 1230 lex(); 1231 if (Token.isNot(MIToken::VirtualRegister)) 1232 return error("expected a virtual register"); 1233 if (parseVirtualRegister(Info)) 1234 return true; 1235 lex(); 1236 if (Token.isNot(MIToken::Eof)) 1237 return error("expected end of string after the register reference"); 1238 return false; 1239 } 1240 1241 bool MIParser::parseStandaloneRegister(Register &Reg) { 1242 lex(); 1243 if (Token.isNot(MIToken::NamedRegister) && 1244 Token.isNot(MIToken::VirtualRegister)) 1245 return error("expected either a named or virtual register"); 1246 1247 VRegInfo *Info; 1248 if (parseRegister(Reg, Info)) 1249 return true; 1250 1251 lex(); 1252 if (Token.isNot(MIToken::Eof)) 1253 return error("expected end of string after the register reference"); 1254 return false; 1255 } 1256 1257 bool MIParser::parseStandaloneStackObject(int &FI) { 1258 lex(); 1259 if (Token.isNot(MIToken::StackObject)) 1260 return error("expected a stack object"); 1261 if (parseStackFrameIndex(FI)) 1262 return true; 1263 if (Token.isNot(MIToken::Eof)) 1264 return error("expected end of string after the stack object reference"); 1265 return false; 1266 } 1267 1268 bool MIParser::parseStandaloneMDNode(MDNode *&Node) { 1269 lex(); 1270 if (Token.is(MIToken::exclaim)) { 1271 if (parseMDNode(Node)) 1272 return true; 1273 } else if (Token.is(MIToken::md_diexpr)) { 1274 if (parseDIExpression(Node)) 1275 return true; 1276 } else if (Token.is(MIToken::md_dilocation)) { 1277 if (parseDILocation(Node)) 1278 return true; 1279 } else 1280 return error("expected a metadata node"); 1281 if (Token.isNot(MIToken::Eof)) 1282 return error("expected end of string after the metadata node"); 1283 return false; 1284 } 1285 1286 bool MIParser::parseMachineMetadata() { 1287 lex(); 1288 if (Token.isNot(MIToken::exclaim)) 1289 return error("expected a metadata node"); 1290 1291 lex(); 1292 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isSigned()) 1293 return error("expected metadata id after '!'"); 1294 unsigned ID = 0; 1295 if (getUnsigned(ID)) 1296 return true; 1297 lex(); 1298 if (expectAndConsume(MIToken::equal)) 1299 return true; 1300 bool IsDistinct = Token.is(MIToken::kw_distinct); 1301 if (IsDistinct) 1302 lex(); 1303 if (Token.isNot(MIToken::exclaim)) 1304 return error("expected a metadata node"); 1305 lex(); 1306 1307 MDNode *MD; 1308 if (parseMDTuple(MD, IsDistinct)) 1309 return true; 1310 1311 auto FI = PFS.MachineForwardRefMDNodes.find(ID); 1312 if (FI != PFS.MachineForwardRefMDNodes.end()) { 1313 FI->second.first->replaceAllUsesWith(MD); 1314 PFS.MachineForwardRefMDNodes.erase(FI); 1315 1316 assert(PFS.MachineMetadataNodes[ID] == MD && "Tracking VH didn't work"); 1317 } else { 1318 auto [It, Inserted] = PFS.MachineMetadataNodes.try_emplace(ID); 1319 if (!Inserted) 1320 return error("Metadata id is already used"); 1321 It->second.reset(MD); 1322 } 1323 1324 return false; 1325 } 1326 1327 bool MIParser::parseMDTuple(MDNode *&MD, bool IsDistinct) { 1328 SmallVector<Metadata *, 16> Elts; 1329 if (parseMDNodeVector(Elts)) 1330 return true; 1331 MD = (IsDistinct ? MDTuple::getDistinct 1332 : MDTuple::get)(MF.getFunction().getContext(), Elts); 1333 return false; 1334 } 1335 1336 bool MIParser::parseMDNodeVector(SmallVectorImpl<Metadata *> &Elts) { 1337 if (Token.isNot(MIToken::lbrace)) 1338 return error("expected '{' here"); 1339 lex(); 1340 1341 if (Token.is(MIToken::rbrace)) { 1342 lex(); 1343 return false; 1344 } 1345 1346 do { 1347 Metadata *MD; 1348 if (parseMetadata(MD)) 1349 return true; 1350 1351 Elts.push_back(MD); 1352 1353 if (Token.isNot(MIToken::comma)) 1354 break; 1355 lex(); 1356 } while (true); 1357 1358 if (Token.isNot(MIToken::rbrace)) 1359 return error("expected end of metadata node"); 1360 lex(); 1361 1362 return false; 1363 } 1364 1365 // ::= !42 1366 // ::= !"string" 1367 bool MIParser::parseMetadata(Metadata *&MD) { 1368 if (Token.isNot(MIToken::exclaim)) 1369 return error("expected '!' here"); 1370 lex(); 1371 1372 if (Token.is(MIToken::StringConstant)) { 1373 std::string Str; 1374 if (parseStringConstant(Str)) 1375 return true; 1376 MD = MDString::get(MF.getFunction().getContext(), Str); 1377 return false; 1378 } 1379 1380 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isSigned()) 1381 return error("expected metadata id after '!'"); 1382 1383 SMLoc Loc = mapSMLoc(Token.location()); 1384 1385 unsigned ID = 0; 1386 if (getUnsigned(ID)) 1387 return true; 1388 lex(); 1389 1390 auto NodeInfo = PFS.IRSlots.MetadataNodes.find(ID); 1391 if (NodeInfo != PFS.IRSlots.MetadataNodes.end()) { 1392 MD = NodeInfo->second.get(); 1393 return false; 1394 } 1395 // Check machine metadata. 1396 NodeInfo = PFS.MachineMetadataNodes.find(ID); 1397 if (NodeInfo != PFS.MachineMetadataNodes.end()) { 1398 MD = NodeInfo->second.get(); 1399 return false; 1400 } 1401 // Forward reference. 1402 auto &FwdRef = PFS.MachineForwardRefMDNodes[ID]; 1403 FwdRef = std::make_pair( 1404 MDTuple::getTemporary(MF.getFunction().getContext(), {}), Loc); 1405 PFS.MachineMetadataNodes[ID].reset(FwdRef.first.get()); 1406 MD = FwdRef.first.get(); 1407 1408 return false; 1409 } 1410 1411 static const char *printImplicitRegisterFlag(const MachineOperand &MO) { 1412 assert(MO.isImplicit()); 1413 return MO.isDef() ? "implicit-def" : "implicit"; 1414 } 1415 1416 static std::string getRegisterName(const TargetRegisterInfo *TRI, 1417 Register Reg) { 1418 assert(Reg.isPhysical() && "expected phys reg"); 1419 return StringRef(TRI->getName(Reg)).lower(); 1420 } 1421 1422 /// Return true if the parsed machine operands contain a given machine operand. 1423 static bool isImplicitOperandIn(const MachineOperand &ImplicitOperand, 1424 ArrayRef<ParsedMachineOperand> Operands) { 1425 for (const auto &I : Operands) { 1426 if (ImplicitOperand.isIdenticalTo(I.Operand)) 1427 return true; 1428 } 1429 return false; 1430 } 1431 1432 bool MIParser::verifyImplicitOperands(ArrayRef<ParsedMachineOperand> Operands, 1433 const MCInstrDesc &MCID) { 1434 if (MCID.isCall()) 1435 // We can't verify call instructions as they can contain arbitrary implicit 1436 // register and register mask operands. 1437 return false; 1438 1439 // Gather all the expected implicit operands. 1440 SmallVector<MachineOperand, 4> ImplicitOperands; 1441 for (MCPhysReg ImpDef : MCID.implicit_defs()) 1442 ImplicitOperands.push_back(MachineOperand::CreateReg(ImpDef, true, true)); 1443 for (MCPhysReg ImpUse : MCID.implicit_uses()) 1444 ImplicitOperands.push_back(MachineOperand::CreateReg(ImpUse, false, true)); 1445 1446 const auto *TRI = MF.getSubtarget().getRegisterInfo(); 1447 assert(TRI && "Expected target register info"); 1448 for (const auto &I : ImplicitOperands) { 1449 if (isImplicitOperandIn(I, Operands)) 1450 continue; 1451 return error(Operands.empty() ? Token.location() : Operands.back().End, 1452 Twine("missing implicit register operand '") + 1453 printImplicitRegisterFlag(I) + " $" + 1454 getRegisterName(TRI, I.getReg()) + "'"); 1455 } 1456 return false; 1457 } 1458 1459 bool MIParser::parseInstruction(unsigned &OpCode, unsigned &Flags) { 1460 // Allow frame and fast math flags for OPCODE 1461 // clang-format off 1462 while (Token.is(MIToken::kw_frame_setup) || 1463 Token.is(MIToken::kw_frame_destroy) || 1464 Token.is(MIToken::kw_nnan) || 1465 Token.is(MIToken::kw_ninf) || 1466 Token.is(MIToken::kw_nsz) || 1467 Token.is(MIToken::kw_arcp) || 1468 Token.is(MIToken::kw_contract) || 1469 Token.is(MIToken::kw_afn) || 1470 Token.is(MIToken::kw_reassoc) || 1471 Token.is(MIToken::kw_nuw) || 1472 Token.is(MIToken::kw_nsw) || 1473 Token.is(MIToken::kw_exact) || 1474 Token.is(MIToken::kw_nofpexcept) || 1475 Token.is(MIToken::kw_noconvergent) || 1476 Token.is(MIToken::kw_unpredictable) || 1477 Token.is(MIToken::kw_nneg) || 1478 Token.is(MIToken::kw_disjoint) || 1479 Token.is(MIToken::kw_nusw) || 1480 Token.is(MIToken::kw_samesign)) { 1481 // clang-format on 1482 // Mine frame and fast math flags 1483 if (Token.is(MIToken::kw_frame_setup)) 1484 Flags |= MachineInstr::FrameSetup; 1485 if (Token.is(MIToken::kw_frame_destroy)) 1486 Flags |= MachineInstr::FrameDestroy; 1487 if (Token.is(MIToken::kw_nnan)) 1488 Flags |= MachineInstr::FmNoNans; 1489 if (Token.is(MIToken::kw_ninf)) 1490 Flags |= MachineInstr::FmNoInfs; 1491 if (Token.is(MIToken::kw_nsz)) 1492 Flags |= MachineInstr::FmNsz; 1493 if (Token.is(MIToken::kw_arcp)) 1494 Flags |= MachineInstr::FmArcp; 1495 if (Token.is(MIToken::kw_contract)) 1496 Flags |= MachineInstr::FmContract; 1497 if (Token.is(MIToken::kw_afn)) 1498 Flags |= MachineInstr::FmAfn; 1499 if (Token.is(MIToken::kw_reassoc)) 1500 Flags |= MachineInstr::FmReassoc; 1501 if (Token.is(MIToken::kw_nuw)) 1502 Flags |= MachineInstr::NoUWrap; 1503 if (Token.is(MIToken::kw_nsw)) 1504 Flags |= MachineInstr::NoSWrap; 1505 if (Token.is(MIToken::kw_exact)) 1506 Flags |= MachineInstr::IsExact; 1507 if (Token.is(MIToken::kw_nofpexcept)) 1508 Flags |= MachineInstr::NoFPExcept; 1509 if (Token.is(MIToken::kw_unpredictable)) 1510 Flags |= MachineInstr::Unpredictable; 1511 if (Token.is(MIToken::kw_noconvergent)) 1512 Flags |= MachineInstr::NoConvergent; 1513 if (Token.is(MIToken::kw_nneg)) 1514 Flags |= MachineInstr::NonNeg; 1515 if (Token.is(MIToken::kw_disjoint)) 1516 Flags |= MachineInstr::Disjoint; 1517 if (Token.is(MIToken::kw_nusw)) 1518 Flags |= MachineInstr::NoUSWrap; 1519 if (Token.is(MIToken::kw_samesign)) 1520 Flags |= MachineInstr::SameSign; 1521 1522 lex(); 1523 } 1524 if (Token.isNot(MIToken::Identifier)) 1525 return error("expected a machine instruction"); 1526 StringRef InstrName = Token.stringValue(); 1527 if (PFS.Target.parseInstrName(InstrName, OpCode)) 1528 return error(Twine("unknown machine instruction name '") + InstrName + "'"); 1529 lex(); 1530 return false; 1531 } 1532 1533 bool MIParser::parseNamedRegister(Register &Reg) { 1534 assert(Token.is(MIToken::NamedRegister) && "Needs NamedRegister token"); 1535 StringRef Name = Token.stringValue(); 1536 if (PFS.Target.getRegisterByName(Name, Reg)) 1537 return error(Twine("unknown register name '") + Name + "'"); 1538 return false; 1539 } 1540 1541 bool MIParser::parseNamedVirtualRegister(VRegInfo *&Info) { 1542 assert(Token.is(MIToken::NamedVirtualRegister) && "Expected NamedVReg token"); 1543 StringRef Name = Token.stringValue(); 1544 // TODO: Check that the VReg name is not the same as a physical register name. 1545 // If it is, then print a warning (when warnings are implemented). 1546 Info = &PFS.getVRegInfoNamed(Name); 1547 return false; 1548 } 1549 1550 bool MIParser::parseVirtualRegister(VRegInfo *&Info) { 1551 if (Token.is(MIToken::NamedVirtualRegister)) 1552 return parseNamedVirtualRegister(Info); 1553 assert(Token.is(MIToken::VirtualRegister) && "Needs VirtualRegister token"); 1554 unsigned ID; 1555 if (getUnsigned(ID)) 1556 return true; 1557 Info = &PFS.getVRegInfo(ID); 1558 return false; 1559 } 1560 1561 bool MIParser::parseRegister(Register &Reg, VRegInfo *&Info) { 1562 switch (Token.kind()) { 1563 case MIToken::underscore: 1564 Reg = 0; 1565 return false; 1566 case MIToken::NamedRegister: 1567 return parseNamedRegister(Reg); 1568 case MIToken::NamedVirtualRegister: 1569 case MIToken::VirtualRegister: 1570 if (parseVirtualRegister(Info)) 1571 return true; 1572 Reg = Info->VReg; 1573 return false; 1574 // TODO: Parse other register kinds. 1575 default: 1576 llvm_unreachable("The current token should be a register"); 1577 } 1578 } 1579 1580 bool MIParser::parseRegisterClassOrBank(VRegInfo &RegInfo) { 1581 if (Token.isNot(MIToken::Identifier) && Token.isNot(MIToken::underscore)) 1582 return error("expected '_', register class, or register bank name"); 1583 StringRef::iterator Loc = Token.location(); 1584 StringRef Name = Token.stringValue(); 1585 1586 // Was it a register class? 1587 const TargetRegisterClass *RC = PFS.Target.getRegClass(Name); 1588 if (RC) { 1589 lex(); 1590 1591 switch (RegInfo.Kind) { 1592 case VRegInfo::UNKNOWN: 1593 case VRegInfo::NORMAL: 1594 RegInfo.Kind = VRegInfo::NORMAL; 1595 if (RegInfo.Explicit && RegInfo.D.RC != RC) { 1596 const TargetRegisterInfo &TRI = *MF.getSubtarget().getRegisterInfo(); 1597 return error(Loc, Twine("conflicting register classes, previously: ") + 1598 Twine(TRI.getRegClassName(RegInfo.D.RC))); 1599 } 1600 RegInfo.D.RC = RC; 1601 RegInfo.Explicit = true; 1602 return false; 1603 1604 case VRegInfo::GENERIC: 1605 case VRegInfo::REGBANK: 1606 return error(Loc, "register class specification on generic register"); 1607 } 1608 llvm_unreachable("Unexpected register kind"); 1609 } 1610 1611 // Should be a register bank or a generic register. 1612 const RegisterBank *RegBank = nullptr; 1613 if (Name != "_") { 1614 RegBank = PFS.Target.getRegBank(Name); 1615 if (!RegBank) 1616 return error(Loc, "expected '_', register class, or register bank name"); 1617 } 1618 1619 lex(); 1620 1621 switch (RegInfo.Kind) { 1622 case VRegInfo::UNKNOWN: 1623 case VRegInfo::GENERIC: 1624 case VRegInfo::REGBANK: 1625 RegInfo.Kind = RegBank ? VRegInfo::REGBANK : VRegInfo::GENERIC; 1626 if (RegInfo.Explicit && RegInfo.D.RegBank != RegBank) 1627 return error(Loc, "conflicting generic register banks"); 1628 RegInfo.D.RegBank = RegBank; 1629 RegInfo.Explicit = true; 1630 return false; 1631 1632 case VRegInfo::NORMAL: 1633 return error(Loc, "register bank specification on normal register"); 1634 } 1635 llvm_unreachable("Unexpected register kind"); 1636 } 1637 1638 bool MIParser::parseRegisterFlag(unsigned &Flags) { 1639 const unsigned OldFlags = Flags; 1640 switch (Token.kind()) { 1641 case MIToken::kw_implicit: 1642 Flags |= RegState::Implicit; 1643 break; 1644 case MIToken::kw_implicit_define: 1645 Flags |= RegState::ImplicitDefine; 1646 break; 1647 case MIToken::kw_def: 1648 Flags |= RegState::Define; 1649 break; 1650 case MIToken::kw_dead: 1651 Flags |= RegState::Dead; 1652 break; 1653 case MIToken::kw_killed: 1654 Flags |= RegState::Kill; 1655 break; 1656 case MIToken::kw_undef: 1657 Flags |= RegState::Undef; 1658 break; 1659 case MIToken::kw_internal: 1660 Flags |= RegState::InternalRead; 1661 break; 1662 case MIToken::kw_early_clobber: 1663 Flags |= RegState::EarlyClobber; 1664 break; 1665 case MIToken::kw_debug_use: 1666 Flags |= RegState::Debug; 1667 break; 1668 case MIToken::kw_renamable: 1669 Flags |= RegState::Renamable; 1670 break; 1671 default: 1672 llvm_unreachable("The current token should be a register flag"); 1673 } 1674 if (OldFlags == Flags) 1675 // We know that the same flag is specified more than once when the flags 1676 // weren't modified. 1677 return error("duplicate '" + Token.stringValue() + "' register flag"); 1678 lex(); 1679 return false; 1680 } 1681 1682 bool MIParser::parseSubRegisterIndex(unsigned &SubReg) { 1683 assert(Token.is(MIToken::dot)); 1684 lex(); 1685 if (Token.isNot(MIToken::Identifier)) 1686 return error("expected a subregister index after '.'"); 1687 auto Name = Token.stringValue(); 1688 SubReg = PFS.Target.getSubRegIndex(Name); 1689 if (!SubReg) 1690 return error(Twine("use of unknown subregister index '") + Name + "'"); 1691 lex(); 1692 return false; 1693 } 1694 1695 bool MIParser::parseRegisterTiedDefIndex(unsigned &TiedDefIdx) { 1696 if (!consumeIfPresent(MIToken::kw_tied_def)) 1697 return true; 1698 if (Token.isNot(MIToken::IntegerLiteral)) 1699 return error("expected an integer literal after 'tied-def'"); 1700 if (getUnsigned(TiedDefIdx)) 1701 return true; 1702 lex(); 1703 if (expectAndConsume(MIToken::rparen)) 1704 return true; 1705 return false; 1706 } 1707 1708 bool MIParser::assignRegisterTies(MachineInstr &MI, 1709 ArrayRef<ParsedMachineOperand> Operands) { 1710 SmallVector<std::pair<unsigned, unsigned>, 4> TiedRegisterPairs; 1711 for (unsigned I = 0, E = Operands.size(); I != E; ++I) { 1712 if (!Operands[I].TiedDefIdx) 1713 continue; 1714 // The parser ensures that this operand is a register use, so we just have 1715 // to check the tied-def operand. 1716 unsigned DefIdx = *Operands[I].TiedDefIdx; 1717 if (DefIdx >= E) 1718 return error(Operands[I].Begin, 1719 Twine("use of invalid tied-def operand index '" + 1720 Twine(DefIdx) + "'; instruction has only ") + 1721 Twine(E) + " operands"); 1722 const auto &DefOperand = Operands[DefIdx].Operand; 1723 if (!DefOperand.isReg() || !DefOperand.isDef()) 1724 // FIXME: add note with the def operand. 1725 return error(Operands[I].Begin, 1726 Twine("use of invalid tied-def operand index '") + 1727 Twine(DefIdx) + "'; the operand #" + Twine(DefIdx) + 1728 " isn't a defined register"); 1729 // Check that the tied-def operand wasn't tied elsewhere. 1730 for (const auto &TiedPair : TiedRegisterPairs) { 1731 if (TiedPair.first == DefIdx) 1732 return error(Operands[I].Begin, 1733 Twine("the tied-def operand #") + Twine(DefIdx) + 1734 " is already tied with another register operand"); 1735 } 1736 TiedRegisterPairs.push_back(std::make_pair(DefIdx, I)); 1737 } 1738 // FIXME: Verify that for non INLINEASM instructions, the def and use tied 1739 // indices must be less than tied max. 1740 for (const auto &TiedPair : TiedRegisterPairs) 1741 MI.tieOperands(TiedPair.first, TiedPair.second); 1742 return false; 1743 } 1744 1745 bool MIParser::parseRegisterOperand(MachineOperand &Dest, 1746 std::optional<unsigned> &TiedDefIdx, 1747 bool IsDef) { 1748 unsigned Flags = IsDef ? RegState::Define : 0; 1749 while (Token.isRegisterFlag()) { 1750 if (parseRegisterFlag(Flags)) 1751 return true; 1752 } 1753 if (!Token.isRegister()) 1754 return error("expected a register after register flags"); 1755 Register Reg; 1756 VRegInfo *RegInfo; 1757 if (parseRegister(Reg, RegInfo)) 1758 return true; 1759 lex(); 1760 unsigned SubReg = 0; 1761 if (Token.is(MIToken::dot)) { 1762 if (parseSubRegisterIndex(SubReg)) 1763 return true; 1764 if (!Reg.isVirtual()) 1765 return error("subregister index expects a virtual register"); 1766 } 1767 if (Token.is(MIToken::colon)) { 1768 if (!Reg.isVirtual()) 1769 return error("register class specification expects a virtual register"); 1770 lex(); 1771 if (parseRegisterClassOrBank(*RegInfo)) 1772 return true; 1773 } 1774 MachineRegisterInfo &MRI = MF.getRegInfo(); 1775 if ((Flags & RegState::Define) == 0) { 1776 if (consumeIfPresent(MIToken::lparen)) { 1777 unsigned Idx; 1778 if (!parseRegisterTiedDefIndex(Idx)) 1779 TiedDefIdx = Idx; 1780 else { 1781 // Try a redundant low-level type. 1782 LLT Ty; 1783 if (parseLowLevelType(Token.location(), Ty)) 1784 return error("expected tied-def or low-level type after '('"); 1785 1786 if (expectAndConsume(MIToken::rparen)) 1787 return true; 1788 1789 if (MRI.getType(Reg).isValid() && MRI.getType(Reg) != Ty) 1790 return error("inconsistent type for generic virtual register"); 1791 1792 MRI.setRegClassOrRegBank(Reg, static_cast<RegisterBank *>(nullptr)); 1793 MRI.setType(Reg, Ty); 1794 MRI.noteNewVirtualRegister(Reg); 1795 } 1796 } 1797 } else if (consumeIfPresent(MIToken::lparen)) { 1798 // Virtual registers may have a tpe with GlobalISel. 1799 if (!Reg.isVirtual()) 1800 return error("unexpected type on physical register"); 1801 1802 LLT Ty; 1803 if (parseLowLevelType(Token.location(), Ty)) 1804 return true; 1805 1806 if (expectAndConsume(MIToken::rparen)) 1807 return true; 1808 1809 if (MRI.getType(Reg).isValid() && MRI.getType(Reg) != Ty) 1810 return error("inconsistent type for generic virtual register"); 1811 1812 MRI.setRegClassOrRegBank(Reg, static_cast<RegisterBank *>(nullptr)); 1813 MRI.setType(Reg, Ty); 1814 } else if (Reg.isVirtual()) { 1815 // Generic virtual registers must have a type. 1816 // If we end up here this means the type hasn't been specified and 1817 // this is bad! 1818 if (RegInfo->Kind == VRegInfo::GENERIC || 1819 RegInfo->Kind == VRegInfo::REGBANK) 1820 return error("generic virtual registers must have a type"); 1821 } 1822 1823 if (Flags & RegState::Define) { 1824 if (Flags & RegState::Kill) 1825 return error("cannot have a killed def operand"); 1826 } else { 1827 if (Flags & RegState::Dead) 1828 return error("cannot have a dead use operand"); 1829 } 1830 1831 Dest = MachineOperand::CreateReg( 1832 Reg, Flags & RegState::Define, Flags & RegState::Implicit, 1833 Flags & RegState::Kill, Flags & RegState::Dead, Flags & RegState::Undef, 1834 Flags & RegState::EarlyClobber, SubReg, Flags & RegState::Debug, 1835 Flags & RegState::InternalRead, Flags & RegState::Renamable); 1836 1837 return false; 1838 } 1839 1840 bool MIParser::parseImmediateOperand(MachineOperand &Dest) { 1841 assert(Token.is(MIToken::IntegerLiteral)); 1842 const APSInt &Int = Token.integerValue(); 1843 if (auto SImm = Int.trySExtValue(); Int.isSigned() && SImm.has_value()) 1844 Dest = MachineOperand::CreateImm(*SImm); 1845 else if (auto UImm = Int.tryZExtValue(); !Int.isSigned() && UImm.has_value()) 1846 Dest = MachineOperand::CreateImm(*UImm); 1847 else 1848 return error("integer literal is too large to be an immediate operand"); 1849 lex(); 1850 return false; 1851 } 1852 1853 bool MIParser::parseTargetImmMnemonic(const unsigned OpCode, 1854 const unsigned OpIdx, 1855 MachineOperand &Dest, 1856 const MIRFormatter &MF) { 1857 assert(Token.is(MIToken::dot)); 1858 auto Loc = Token.location(); // record start position 1859 size_t Len = 1; // for "." 1860 lex(); 1861 1862 // Handle the case that mnemonic starts with number. 1863 if (Token.is(MIToken::IntegerLiteral)) { 1864 Len += Token.range().size(); 1865 lex(); 1866 } 1867 1868 StringRef Src; 1869 if (Token.is(MIToken::comma)) 1870 Src = StringRef(Loc, Len); 1871 else { 1872 assert(Token.is(MIToken::Identifier)); 1873 Src = StringRef(Loc, Len + Token.stringValue().size()); 1874 } 1875 int64_t Val; 1876 if (MF.parseImmMnemonic(OpCode, OpIdx, Src, Val, 1877 [this](StringRef::iterator Loc, const Twine &Msg) 1878 -> bool { return error(Loc, Msg); })) 1879 return true; 1880 1881 Dest = MachineOperand::CreateImm(Val); 1882 if (!Token.is(MIToken::comma)) 1883 lex(); 1884 return false; 1885 } 1886 1887 static bool parseIRConstant(StringRef::iterator Loc, StringRef StringValue, 1888 PerFunctionMIParsingState &PFS, const Constant *&C, 1889 ErrorCallbackType ErrCB) { 1890 auto Source = StringValue.str(); // The source has to be null terminated. 1891 SMDiagnostic Err; 1892 C = parseConstantValue(Source, Err, *PFS.MF.getFunction().getParent(), 1893 &PFS.IRSlots); 1894 if (!C) 1895 return ErrCB(Loc + Err.getColumnNo(), Err.getMessage()); 1896 return false; 1897 } 1898 1899 bool MIParser::parseIRConstant(StringRef::iterator Loc, StringRef StringValue, 1900 const Constant *&C) { 1901 return ::parseIRConstant( 1902 Loc, StringValue, PFS, C, 1903 [this](StringRef::iterator Loc, const Twine &Msg) -> bool { 1904 return error(Loc, Msg); 1905 }); 1906 } 1907 1908 bool MIParser::parseIRConstant(StringRef::iterator Loc, const Constant *&C) { 1909 if (parseIRConstant(Loc, StringRef(Loc, Token.range().end() - Loc), C)) 1910 return true; 1911 lex(); 1912 return false; 1913 } 1914 1915 // See LLT implementation for bit size limits. 1916 static bool verifyScalarSize(uint64_t Size) { 1917 return Size != 0 && isUInt<16>(Size); 1918 } 1919 1920 static bool verifyVectorElementCount(uint64_t NumElts) { 1921 return NumElts != 0 && isUInt<16>(NumElts); 1922 } 1923 1924 static bool verifyAddrSpace(uint64_t AddrSpace) { 1925 return isUInt<24>(AddrSpace); 1926 } 1927 1928 bool MIParser::parseLowLevelType(StringRef::iterator Loc, LLT &Ty) { 1929 if (Token.range().front() == 's' || Token.range().front() == 'p') { 1930 StringRef SizeStr = Token.range().drop_front(); 1931 if (SizeStr.size() == 0 || !llvm::all_of(SizeStr, isdigit)) 1932 return error("expected integers after 's'/'p' type character"); 1933 } 1934 1935 if (Token.range().front() == 's') { 1936 auto ScalarSize = APSInt(Token.range().drop_front()).getZExtValue(); 1937 if (ScalarSize) { 1938 if (!verifyScalarSize(ScalarSize)) 1939 return error("invalid size for scalar type"); 1940 Ty = LLT::scalar(ScalarSize); 1941 } else { 1942 Ty = LLT::token(); 1943 } 1944 lex(); 1945 return false; 1946 } else if (Token.range().front() == 'p') { 1947 const DataLayout &DL = MF.getDataLayout(); 1948 uint64_t AS = APSInt(Token.range().drop_front()).getZExtValue(); 1949 if (!verifyAddrSpace(AS)) 1950 return error("invalid address space number"); 1951 1952 Ty = LLT::pointer(AS, DL.getPointerSizeInBits(AS)); 1953 lex(); 1954 return false; 1955 } 1956 1957 // Now we're looking for a vector. 1958 if (Token.isNot(MIToken::less)) 1959 return error(Loc, "expected sN, pA, <M x sN>, <M x pA>, <vscale x M x sN>, " 1960 "or <vscale x M x pA> for GlobalISel type"); 1961 lex(); 1962 1963 bool HasVScale = 1964 Token.is(MIToken::Identifier) && Token.stringValue() == "vscale"; 1965 if (HasVScale) { 1966 lex(); 1967 if (Token.isNot(MIToken::Identifier) || Token.stringValue() != "x") 1968 return error("expected <vscale x M x sN> or <vscale x M x pA>"); 1969 lex(); 1970 } 1971 1972 auto GetError = [this, &HasVScale, Loc]() { 1973 if (HasVScale) 1974 return error( 1975 Loc, "expected <vscale x M x sN> or <vscale M x pA> for vector type"); 1976 return error(Loc, "expected <M x sN> or <M x pA> for vector type"); 1977 }; 1978 1979 if (Token.isNot(MIToken::IntegerLiteral)) 1980 return GetError(); 1981 uint64_t NumElements = Token.integerValue().getZExtValue(); 1982 if (!verifyVectorElementCount(NumElements)) 1983 return error("invalid number of vector elements"); 1984 1985 lex(); 1986 1987 if (Token.isNot(MIToken::Identifier) || Token.stringValue() != "x") 1988 return GetError(); 1989 lex(); 1990 1991 if (Token.range().front() != 's' && Token.range().front() != 'p') 1992 return GetError(); 1993 1994 StringRef SizeStr = Token.range().drop_front(); 1995 if (SizeStr.size() == 0 || !llvm::all_of(SizeStr, isdigit)) 1996 return error("expected integers after 's'/'p' type character"); 1997 1998 if (Token.range().front() == 's') { 1999 auto ScalarSize = APSInt(Token.range().drop_front()).getZExtValue(); 2000 if (!verifyScalarSize(ScalarSize)) 2001 return error("invalid size for scalar element in vector"); 2002 Ty = LLT::scalar(ScalarSize); 2003 } else if (Token.range().front() == 'p') { 2004 const DataLayout &DL = MF.getDataLayout(); 2005 uint64_t AS = APSInt(Token.range().drop_front()).getZExtValue(); 2006 if (!verifyAddrSpace(AS)) 2007 return error("invalid address space number"); 2008 2009 Ty = LLT::pointer(AS, DL.getPointerSizeInBits(AS)); 2010 } else 2011 return GetError(); 2012 lex(); 2013 2014 if (Token.isNot(MIToken::greater)) 2015 return GetError(); 2016 2017 lex(); 2018 2019 Ty = LLT::vector(ElementCount::get(NumElements, HasVScale), Ty); 2020 return false; 2021 } 2022 2023 bool MIParser::parseTypedImmediateOperand(MachineOperand &Dest) { 2024 assert(Token.is(MIToken::Identifier)); 2025 StringRef TypeStr = Token.range(); 2026 if (TypeStr.front() != 'i' && TypeStr.front() != 's' && 2027 TypeStr.front() != 'p') 2028 return error( 2029 "a typed immediate operand should start with one of 'i', 's', or 'p'"); 2030 StringRef SizeStr = Token.range().drop_front(); 2031 if (SizeStr.size() == 0 || !llvm::all_of(SizeStr, isdigit)) 2032 return error("expected integers after 'i'/'s'/'p' type character"); 2033 2034 auto Loc = Token.location(); 2035 lex(); 2036 if (Token.isNot(MIToken::IntegerLiteral)) { 2037 if (Token.isNot(MIToken::Identifier) || 2038 !(Token.range() == "true" || Token.range() == "false")) 2039 return error("expected an integer literal"); 2040 } 2041 const Constant *C = nullptr; 2042 if (parseIRConstant(Loc, C)) 2043 return true; 2044 Dest = MachineOperand::CreateCImm(cast<ConstantInt>(C)); 2045 return false; 2046 } 2047 2048 bool MIParser::parseFPImmediateOperand(MachineOperand &Dest) { 2049 auto Loc = Token.location(); 2050 lex(); 2051 if (Token.isNot(MIToken::FloatingPointLiteral) && 2052 Token.isNot(MIToken::HexLiteral)) 2053 return error("expected a floating point literal"); 2054 const Constant *C = nullptr; 2055 if (parseIRConstant(Loc, C)) 2056 return true; 2057 Dest = MachineOperand::CreateFPImm(cast<ConstantFP>(C)); 2058 return false; 2059 } 2060 2061 static bool getHexUint(const MIToken &Token, APInt &Result) { 2062 assert(Token.is(MIToken::HexLiteral)); 2063 StringRef S = Token.range(); 2064 assert(S[0] == '0' && tolower(S[1]) == 'x'); 2065 // This could be a floating point literal with a special prefix. 2066 if (!isxdigit(S[2])) 2067 return true; 2068 StringRef V = S.substr(2); 2069 APInt A(V.size()*4, V, 16); 2070 2071 // If A is 0, then A.getActiveBits() is 0. This isn't a valid bitwidth. Make 2072 // sure it isn't the case before constructing result. 2073 unsigned NumBits = (A == 0) ? 32 : A.getActiveBits(); 2074 Result = APInt(NumBits, ArrayRef<uint64_t>(A.getRawData(), A.getNumWords())); 2075 return false; 2076 } 2077 2078 static bool getUnsigned(const MIToken &Token, unsigned &Result, 2079 ErrorCallbackType ErrCB) { 2080 if (Token.hasIntegerValue()) { 2081 const uint64_t Limit = uint64_t(std::numeric_limits<unsigned>::max()) + 1; 2082 uint64_t Val64 = Token.integerValue().getLimitedValue(Limit); 2083 if (Val64 == Limit) 2084 return ErrCB(Token.location(), "expected 32-bit integer (too large)"); 2085 Result = Val64; 2086 return false; 2087 } 2088 if (Token.is(MIToken::HexLiteral)) { 2089 APInt A; 2090 if (getHexUint(Token, A)) 2091 return true; 2092 if (A.getBitWidth() > 32) 2093 return ErrCB(Token.location(), "expected 32-bit integer (too large)"); 2094 Result = A.getZExtValue(); 2095 return false; 2096 } 2097 return true; 2098 } 2099 2100 bool MIParser::getUnsigned(unsigned &Result) { 2101 return ::getUnsigned( 2102 Token, Result, [this](StringRef::iterator Loc, const Twine &Msg) -> bool { 2103 return error(Loc, Msg); 2104 }); 2105 } 2106 2107 bool MIParser::parseMBBReference(MachineBasicBlock *&MBB) { 2108 assert(Token.is(MIToken::MachineBasicBlock) || 2109 Token.is(MIToken::MachineBasicBlockLabel)); 2110 unsigned Number; 2111 if (getUnsigned(Number)) 2112 return true; 2113 auto MBBInfo = PFS.MBBSlots.find(Number); 2114 if (MBBInfo == PFS.MBBSlots.end()) 2115 return error(Twine("use of undefined machine basic block #") + 2116 Twine(Number)); 2117 MBB = MBBInfo->second; 2118 // TODO: Only parse the name if it's a MachineBasicBlockLabel. Deprecate once 2119 // we drop the <irname> from the bb.<id>.<irname> format. 2120 if (!Token.stringValue().empty() && Token.stringValue() != MBB->getName()) 2121 return error(Twine("the name of machine basic block #") + Twine(Number) + 2122 " isn't '" + Token.stringValue() + "'"); 2123 return false; 2124 } 2125 2126 bool MIParser::parseMBBOperand(MachineOperand &Dest) { 2127 MachineBasicBlock *MBB; 2128 if (parseMBBReference(MBB)) 2129 return true; 2130 Dest = MachineOperand::CreateMBB(MBB); 2131 lex(); 2132 return false; 2133 } 2134 2135 bool MIParser::parseStackFrameIndex(int &FI) { 2136 assert(Token.is(MIToken::StackObject)); 2137 unsigned ID; 2138 if (getUnsigned(ID)) 2139 return true; 2140 auto ObjectInfo = PFS.StackObjectSlots.find(ID); 2141 if (ObjectInfo == PFS.StackObjectSlots.end()) 2142 return error(Twine("use of undefined stack object '%stack.") + Twine(ID) + 2143 "'"); 2144 StringRef Name; 2145 if (const auto *Alloca = 2146 MF.getFrameInfo().getObjectAllocation(ObjectInfo->second)) 2147 Name = Alloca->getName(); 2148 if (!Token.stringValue().empty() && Token.stringValue() != Name) 2149 return error(Twine("the name of the stack object '%stack.") + Twine(ID) + 2150 "' isn't '" + Token.stringValue() + "'"); 2151 lex(); 2152 FI = ObjectInfo->second; 2153 return false; 2154 } 2155 2156 bool MIParser::parseStackObjectOperand(MachineOperand &Dest) { 2157 int FI; 2158 if (parseStackFrameIndex(FI)) 2159 return true; 2160 Dest = MachineOperand::CreateFI(FI); 2161 return false; 2162 } 2163 2164 bool MIParser::parseFixedStackFrameIndex(int &FI) { 2165 assert(Token.is(MIToken::FixedStackObject)); 2166 unsigned ID; 2167 if (getUnsigned(ID)) 2168 return true; 2169 auto ObjectInfo = PFS.FixedStackObjectSlots.find(ID); 2170 if (ObjectInfo == PFS.FixedStackObjectSlots.end()) 2171 return error(Twine("use of undefined fixed stack object '%fixed-stack.") + 2172 Twine(ID) + "'"); 2173 lex(); 2174 FI = ObjectInfo->second; 2175 return false; 2176 } 2177 2178 bool MIParser::parseFixedStackObjectOperand(MachineOperand &Dest) { 2179 int FI; 2180 if (parseFixedStackFrameIndex(FI)) 2181 return true; 2182 Dest = MachineOperand::CreateFI(FI); 2183 return false; 2184 } 2185 2186 static bool parseGlobalValue(const MIToken &Token, 2187 PerFunctionMIParsingState &PFS, GlobalValue *&GV, 2188 ErrorCallbackType ErrCB) { 2189 switch (Token.kind()) { 2190 case MIToken::NamedGlobalValue: { 2191 const Module *M = PFS.MF.getFunction().getParent(); 2192 GV = M->getNamedValue(Token.stringValue()); 2193 if (!GV) 2194 return ErrCB(Token.location(), Twine("use of undefined global value '") + 2195 Token.range() + "'"); 2196 break; 2197 } 2198 case MIToken::GlobalValue: { 2199 unsigned GVIdx; 2200 if (getUnsigned(Token, GVIdx, ErrCB)) 2201 return true; 2202 GV = PFS.IRSlots.GlobalValues.get(GVIdx); 2203 if (!GV) 2204 return ErrCB(Token.location(), Twine("use of undefined global value '@") + 2205 Twine(GVIdx) + "'"); 2206 break; 2207 } 2208 default: 2209 llvm_unreachable("The current token should be a global value"); 2210 } 2211 return false; 2212 } 2213 2214 bool MIParser::parseGlobalValue(GlobalValue *&GV) { 2215 return ::parseGlobalValue( 2216 Token, PFS, GV, 2217 [this](StringRef::iterator Loc, const Twine &Msg) -> bool { 2218 return error(Loc, Msg); 2219 }); 2220 } 2221 2222 bool MIParser::parseGlobalAddressOperand(MachineOperand &Dest) { 2223 GlobalValue *GV = nullptr; 2224 if (parseGlobalValue(GV)) 2225 return true; 2226 lex(); 2227 Dest = MachineOperand::CreateGA(GV, /*Offset=*/0); 2228 if (parseOperandsOffset(Dest)) 2229 return true; 2230 return false; 2231 } 2232 2233 bool MIParser::parseConstantPoolIndexOperand(MachineOperand &Dest) { 2234 assert(Token.is(MIToken::ConstantPoolItem)); 2235 unsigned ID; 2236 if (getUnsigned(ID)) 2237 return true; 2238 auto ConstantInfo = PFS.ConstantPoolSlots.find(ID); 2239 if (ConstantInfo == PFS.ConstantPoolSlots.end()) 2240 return error("use of undefined constant '%const." + Twine(ID) + "'"); 2241 lex(); 2242 Dest = MachineOperand::CreateCPI(ID, /*Offset=*/0); 2243 if (parseOperandsOffset(Dest)) 2244 return true; 2245 return false; 2246 } 2247 2248 bool MIParser::parseJumpTableIndexOperand(MachineOperand &Dest) { 2249 assert(Token.is(MIToken::JumpTableIndex)); 2250 unsigned ID; 2251 if (getUnsigned(ID)) 2252 return true; 2253 auto JumpTableEntryInfo = PFS.JumpTableSlots.find(ID); 2254 if (JumpTableEntryInfo == PFS.JumpTableSlots.end()) 2255 return error("use of undefined jump table '%jump-table." + Twine(ID) + "'"); 2256 lex(); 2257 Dest = MachineOperand::CreateJTI(JumpTableEntryInfo->second); 2258 return false; 2259 } 2260 2261 bool MIParser::parseExternalSymbolOperand(MachineOperand &Dest) { 2262 assert(Token.is(MIToken::ExternalSymbol)); 2263 const char *Symbol = MF.createExternalSymbolName(Token.stringValue()); 2264 lex(); 2265 Dest = MachineOperand::CreateES(Symbol); 2266 if (parseOperandsOffset(Dest)) 2267 return true; 2268 return false; 2269 } 2270 2271 bool MIParser::parseMCSymbolOperand(MachineOperand &Dest) { 2272 assert(Token.is(MIToken::MCSymbol)); 2273 MCSymbol *Symbol = getOrCreateMCSymbol(Token.stringValue()); 2274 lex(); 2275 Dest = MachineOperand::CreateMCSymbol(Symbol); 2276 if (parseOperandsOffset(Dest)) 2277 return true; 2278 return false; 2279 } 2280 2281 bool MIParser::parseSubRegisterIndexOperand(MachineOperand &Dest) { 2282 assert(Token.is(MIToken::SubRegisterIndex)); 2283 StringRef Name = Token.stringValue(); 2284 unsigned SubRegIndex = PFS.Target.getSubRegIndex(Token.stringValue()); 2285 if (SubRegIndex == 0) 2286 return error(Twine("unknown subregister index '") + Name + "'"); 2287 lex(); 2288 Dest = MachineOperand::CreateImm(SubRegIndex); 2289 return false; 2290 } 2291 2292 bool MIParser::parseMDNode(MDNode *&Node) { 2293 assert(Token.is(MIToken::exclaim)); 2294 2295 auto Loc = Token.location(); 2296 lex(); 2297 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isSigned()) 2298 return error("expected metadata id after '!'"); 2299 unsigned ID; 2300 if (getUnsigned(ID)) 2301 return true; 2302 auto NodeInfo = PFS.IRSlots.MetadataNodes.find(ID); 2303 if (NodeInfo == PFS.IRSlots.MetadataNodes.end()) { 2304 NodeInfo = PFS.MachineMetadataNodes.find(ID); 2305 if (NodeInfo == PFS.MachineMetadataNodes.end()) 2306 return error(Loc, "use of undefined metadata '!" + Twine(ID) + "'"); 2307 } 2308 lex(); 2309 Node = NodeInfo->second.get(); 2310 return false; 2311 } 2312 2313 bool MIParser::parseDIExpression(MDNode *&Expr) { 2314 unsigned Read; 2315 Expr = llvm::parseDIExpressionBodyAtBeginning( 2316 CurrentSource, Read, Error, *PFS.MF.getFunction().getParent(), 2317 &PFS.IRSlots); 2318 CurrentSource = CurrentSource.substr(Read); 2319 lex(); 2320 if (!Expr) 2321 return error(Error.getMessage()); 2322 return false; 2323 } 2324 2325 bool MIParser::parseDILocation(MDNode *&Loc) { 2326 assert(Token.is(MIToken::md_dilocation)); 2327 lex(); 2328 2329 bool HaveLine = false; 2330 unsigned Line = 0; 2331 unsigned Column = 0; 2332 MDNode *Scope = nullptr; 2333 MDNode *InlinedAt = nullptr; 2334 bool ImplicitCode = false; 2335 uint64_t AtomGroup = 0; 2336 uint64_t AtomRank = 0; 2337 2338 if (expectAndConsume(MIToken::lparen)) 2339 return true; 2340 2341 if (Token.isNot(MIToken::rparen)) { 2342 do { 2343 if (Token.is(MIToken::Identifier)) { 2344 if (Token.stringValue() == "line") { 2345 lex(); 2346 if (expectAndConsume(MIToken::colon)) 2347 return true; 2348 if (Token.isNot(MIToken::IntegerLiteral) || 2349 Token.integerValue().isSigned()) 2350 return error("expected unsigned integer"); 2351 Line = Token.integerValue().getZExtValue(); 2352 HaveLine = true; 2353 lex(); 2354 continue; 2355 } 2356 if (Token.stringValue() == "column") { 2357 lex(); 2358 if (expectAndConsume(MIToken::colon)) 2359 return true; 2360 if (Token.isNot(MIToken::IntegerLiteral) || 2361 Token.integerValue().isSigned()) 2362 return error("expected unsigned integer"); 2363 Column = Token.integerValue().getZExtValue(); 2364 lex(); 2365 continue; 2366 } 2367 if (Token.stringValue() == "scope") { 2368 lex(); 2369 if (expectAndConsume(MIToken::colon)) 2370 return true; 2371 if (parseMDNode(Scope)) 2372 return error("expected metadata node"); 2373 if (!isa<DIScope>(Scope)) 2374 return error("expected DIScope node"); 2375 continue; 2376 } 2377 if (Token.stringValue() == "inlinedAt") { 2378 lex(); 2379 if (expectAndConsume(MIToken::colon)) 2380 return true; 2381 if (Token.is(MIToken::exclaim)) { 2382 if (parseMDNode(InlinedAt)) 2383 return true; 2384 } else if (Token.is(MIToken::md_dilocation)) { 2385 if (parseDILocation(InlinedAt)) 2386 return true; 2387 } else 2388 return error("expected metadata node"); 2389 if (!isa<DILocation>(InlinedAt)) 2390 return error("expected DILocation node"); 2391 continue; 2392 } 2393 if (Token.stringValue() == "isImplicitCode") { 2394 lex(); 2395 if (expectAndConsume(MIToken::colon)) 2396 return true; 2397 if (!Token.is(MIToken::Identifier)) 2398 return error("expected true/false"); 2399 // As far as I can see, we don't have any existing need for parsing 2400 // true/false in MIR yet. Do it ad-hoc until there's something else 2401 // that needs it. 2402 if (Token.stringValue() == "true") 2403 ImplicitCode = true; 2404 else if (Token.stringValue() == "false") 2405 ImplicitCode = false; 2406 else 2407 return error("expected true/false"); 2408 lex(); 2409 continue; 2410 } 2411 if (Token.stringValue() == "atomGroup") { 2412 lex(); 2413 if (expectAndConsume(MIToken::colon)) 2414 return true; 2415 if (Token.isNot(MIToken::IntegerLiteral) || 2416 Token.integerValue().isSigned()) 2417 return error("expected unsigned integer"); 2418 AtomGroup = Token.integerValue().getZExtValue(); 2419 lex(); 2420 continue; 2421 } 2422 if (Token.stringValue() == "atomRank") { 2423 lex(); 2424 if (expectAndConsume(MIToken::colon)) 2425 return true; 2426 if (Token.isNot(MIToken::IntegerLiteral) || 2427 Token.integerValue().isSigned()) 2428 return error("expected unsigned integer"); 2429 AtomRank = Token.integerValue().getZExtValue(); 2430 lex(); 2431 continue; 2432 } 2433 } 2434 return error(Twine("invalid DILocation argument '") + 2435 Token.stringValue() + "'"); 2436 } while (consumeIfPresent(MIToken::comma)); 2437 } 2438 2439 if (expectAndConsume(MIToken::rparen)) 2440 return true; 2441 2442 if (!HaveLine) 2443 return error("DILocation requires line number"); 2444 if (!Scope) 2445 return error("DILocation requires a scope"); 2446 2447 Loc = DILocation::get(MF.getFunction().getContext(), Line, Column, Scope, 2448 InlinedAt, ImplicitCode, AtomGroup, AtomRank); 2449 return false; 2450 } 2451 2452 bool MIParser::parseMetadataOperand(MachineOperand &Dest) { 2453 MDNode *Node = nullptr; 2454 if (Token.is(MIToken::exclaim)) { 2455 if (parseMDNode(Node)) 2456 return true; 2457 } else if (Token.is(MIToken::md_diexpr)) { 2458 if (parseDIExpression(Node)) 2459 return true; 2460 } 2461 Dest = MachineOperand::CreateMetadata(Node); 2462 return false; 2463 } 2464 2465 bool MIParser::parseCFIOffset(int &Offset) { 2466 if (Token.isNot(MIToken::IntegerLiteral)) 2467 return error("expected a cfi offset"); 2468 if (Token.integerValue().getSignificantBits() > 32) 2469 return error("expected a 32 bit integer (the cfi offset is too large)"); 2470 Offset = (int)Token.integerValue().getExtValue(); 2471 lex(); 2472 return false; 2473 } 2474 2475 bool MIParser::parseCFIRegister(unsigned &Reg) { 2476 if (Token.isNot(MIToken::NamedRegister)) 2477 return error("expected a cfi register"); 2478 Register LLVMReg; 2479 if (parseNamedRegister(LLVMReg)) 2480 return true; 2481 const auto *TRI = MF.getSubtarget().getRegisterInfo(); 2482 assert(TRI && "Expected target register info"); 2483 int DwarfReg = TRI->getDwarfRegNum(LLVMReg, true); 2484 if (DwarfReg < 0) 2485 return error("invalid DWARF register"); 2486 Reg = (unsigned)DwarfReg; 2487 lex(); 2488 return false; 2489 } 2490 2491 bool MIParser::parseCFIAddressSpace(unsigned &AddressSpace) { 2492 if (Token.isNot(MIToken::IntegerLiteral)) 2493 return error("expected a cfi address space literal"); 2494 if (Token.integerValue().isSigned()) 2495 return error("expected an unsigned integer (cfi address space)"); 2496 AddressSpace = Token.integerValue().getZExtValue(); 2497 lex(); 2498 return false; 2499 } 2500 2501 bool MIParser::parseCFIEscapeValues(std::string &Values) { 2502 do { 2503 if (Token.isNot(MIToken::HexLiteral)) 2504 return error("expected a hexadecimal literal"); 2505 unsigned Value; 2506 if (getUnsigned(Value)) 2507 return true; 2508 if (Value > UINT8_MAX) 2509 return error("expected a 8-bit integer (too large)"); 2510 Values.push_back(static_cast<uint8_t>(Value)); 2511 lex(); 2512 } while (consumeIfPresent(MIToken::comma)); 2513 return false; 2514 } 2515 2516 bool MIParser::parseCFIOperand(MachineOperand &Dest) { 2517 auto Kind = Token.kind(); 2518 lex(); 2519 int Offset; 2520 unsigned Reg; 2521 unsigned AddressSpace; 2522 unsigned CFIIndex; 2523 switch (Kind) { 2524 case MIToken::kw_cfi_same_value: 2525 if (parseCFIRegister(Reg)) 2526 return true; 2527 CFIIndex = MF.addFrameInst(MCCFIInstruction::createSameValue(nullptr, Reg)); 2528 break; 2529 case MIToken::kw_cfi_offset: 2530 if (parseCFIRegister(Reg) || expectAndConsume(MIToken::comma) || 2531 parseCFIOffset(Offset)) 2532 return true; 2533 CFIIndex = 2534 MF.addFrameInst(MCCFIInstruction::createOffset(nullptr, Reg, Offset)); 2535 break; 2536 case MIToken::kw_cfi_rel_offset: 2537 if (parseCFIRegister(Reg) || expectAndConsume(MIToken::comma) || 2538 parseCFIOffset(Offset)) 2539 return true; 2540 CFIIndex = MF.addFrameInst( 2541 MCCFIInstruction::createRelOffset(nullptr, Reg, Offset)); 2542 break; 2543 case MIToken::kw_cfi_def_cfa_register: 2544 if (parseCFIRegister(Reg)) 2545 return true; 2546 CFIIndex = 2547 MF.addFrameInst(MCCFIInstruction::createDefCfaRegister(nullptr, Reg)); 2548 break; 2549 case MIToken::kw_cfi_def_cfa_offset: 2550 if (parseCFIOffset(Offset)) 2551 return true; 2552 CFIIndex = 2553 MF.addFrameInst(MCCFIInstruction::cfiDefCfaOffset(nullptr, Offset)); 2554 break; 2555 case MIToken::kw_cfi_adjust_cfa_offset: 2556 if (parseCFIOffset(Offset)) 2557 return true; 2558 CFIIndex = MF.addFrameInst( 2559 MCCFIInstruction::createAdjustCfaOffset(nullptr, Offset)); 2560 break; 2561 case MIToken::kw_cfi_def_cfa: 2562 if (parseCFIRegister(Reg) || expectAndConsume(MIToken::comma) || 2563 parseCFIOffset(Offset)) 2564 return true; 2565 CFIIndex = 2566 MF.addFrameInst(MCCFIInstruction::cfiDefCfa(nullptr, Reg, Offset)); 2567 break; 2568 case MIToken::kw_cfi_llvm_def_aspace_cfa: 2569 if (parseCFIRegister(Reg) || expectAndConsume(MIToken::comma) || 2570 parseCFIOffset(Offset) || expectAndConsume(MIToken::comma) || 2571 parseCFIAddressSpace(AddressSpace)) 2572 return true; 2573 CFIIndex = MF.addFrameInst(MCCFIInstruction::createLLVMDefAspaceCfa( 2574 nullptr, Reg, Offset, AddressSpace, SMLoc())); 2575 break; 2576 case MIToken::kw_cfi_remember_state: 2577 CFIIndex = MF.addFrameInst(MCCFIInstruction::createRememberState(nullptr)); 2578 break; 2579 case MIToken::kw_cfi_restore: 2580 if (parseCFIRegister(Reg)) 2581 return true; 2582 CFIIndex = MF.addFrameInst(MCCFIInstruction::createRestore(nullptr, Reg)); 2583 break; 2584 case MIToken::kw_cfi_restore_state: 2585 CFIIndex = MF.addFrameInst(MCCFIInstruction::createRestoreState(nullptr)); 2586 break; 2587 case MIToken::kw_cfi_undefined: 2588 if (parseCFIRegister(Reg)) 2589 return true; 2590 CFIIndex = MF.addFrameInst(MCCFIInstruction::createUndefined(nullptr, Reg)); 2591 break; 2592 case MIToken::kw_cfi_register: { 2593 unsigned Reg2; 2594 if (parseCFIRegister(Reg) || expectAndConsume(MIToken::comma) || 2595 parseCFIRegister(Reg2)) 2596 return true; 2597 2598 CFIIndex = 2599 MF.addFrameInst(MCCFIInstruction::createRegister(nullptr, Reg, Reg2)); 2600 break; 2601 } 2602 case MIToken::kw_cfi_window_save: 2603 CFIIndex = MF.addFrameInst(MCCFIInstruction::createWindowSave(nullptr)); 2604 break; 2605 case MIToken::kw_cfi_aarch64_negate_ra_sign_state: 2606 CFIIndex = MF.addFrameInst(MCCFIInstruction::createNegateRAState(nullptr)); 2607 break; 2608 case MIToken::kw_cfi_aarch64_negate_ra_sign_state_with_pc: 2609 CFIIndex = 2610 MF.addFrameInst(MCCFIInstruction::createNegateRAStateWithPC(nullptr)); 2611 break; 2612 case MIToken::kw_cfi_escape: { 2613 std::string Values; 2614 if (parseCFIEscapeValues(Values)) 2615 return true; 2616 CFIIndex = MF.addFrameInst(MCCFIInstruction::createEscape(nullptr, Values)); 2617 break; 2618 } 2619 default: 2620 // TODO: Parse the other CFI operands. 2621 llvm_unreachable("The current token should be a cfi operand"); 2622 } 2623 Dest = MachineOperand::CreateCFIIndex(CFIIndex); 2624 return false; 2625 } 2626 2627 bool MIParser::parseIRBlock(BasicBlock *&BB, const Function &F) { 2628 switch (Token.kind()) { 2629 case MIToken::NamedIRBlock: { 2630 BB = dyn_cast_or_null<BasicBlock>( 2631 F.getValueSymbolTable()->lookup(Token.stringValue())); 2632 if (!BB) 2633 return error(Twine("use of undefined IR block '") + Token.range() + "'"); 2634 break; 2635 } 2636 case MIToken::IRBlock: { 2637 unsigned SlotNumber = 0; 2638 if (getUnsigned(SlotNumber)) 2639 return true; 2640 BB = const_cast<BasicBlock *>(getIRBlock(SlotNumber, F)); 2641 if (!BB) 2642 return error(Twine("use of undefined IR block '%ir-block.") + 2643 Twine(SlotNumber) + "'"); 2644 break; 2645 } 2646 default: 2647 llvm_unreachable("The current token should be an IR block reference"); 2648 } 2649 return false; 2650 } 2651 2652 bool MIParser::parseBlockAddressOperand(MachineOperand &Dest) { 2653 assert(Token.is(MIToken::kw_blockaddress)); 2654 lex(); 2655 if (expectAndConsume(MIToken::lparen)) 2656 return true; 2657 if (Token.isNot(MIToken::GlobalValue) && 2658 Token.isNot(MIToken::NamedGlobalValue)) 2659 return error("expected a global value"); 2660 GlobalValue *GV = nullptr; 2661 if (parseGlobalValue(GV)) 2662 return true; 2663 auto *F = dyn_cast<Function>(GV); 2664 if (!F) 2665 return error("expected an IR function reference"); 2666 lex(); 2667 if (expectAndConsume(MIToken::comma)) 2668 return true; 2669 BasicBlock *BB = nullptr; 2670 if (Token.isNot(MIToken::IRBlock) && Token.isNot(MIToken::NamedIRBlock)) 2671 return error("expected an IR block reference"); 2672 if (parseIRBlock(BB, *F)) 2673 return true; 2674 lex(); 2675 if (expectAndConsume(MIToken::rparen)) 2676 return true; 2677 Dest = MachineOperand::CreateBA(BlockAddress::get(F, BB), /*Offset=*/0); 2678 if (parseOperandsOffset(Dest)) 2679 return true; 2680 return false; 2681 } 2682 2683 bool MIParser::parseIntrinsicOperand(MachineOperand &Dest) { 2684 assert(Token.is(MIToken::kw_intrinsic)); 2685 lex(); 2686 if (expectAndConsume(MIToken::lparen)) 2687 return error("expected syntax intrinsic(@llvm.whatever)"); 2688 2689 if (Token.isNot(MIToken::NamedGlobalValue)) 2690 return error("expected syntax intrinsic(@llvm.whatever)"); 2691 2692 std::string Name = std::string(Token.stringValue()); 2693 lex(); 2694 2695 if (expectAndConsume(MIToken::rparen)) 2696 return error("expected ')' to terminate intrinsic name"); 2697 2698 // Find out what intrinsic we're dealing with. 2699 Intrinsic::ID ID = Intrinsic::lookupIntrinsicID(Name); 2700 if (ID == Intrinsic::not_intrinsic) 2701 return error("unknown intrinsic name"); 2702 Dest = MachineOperand::CreateIntrinsicID(ID); 2703 2704 return false; 2705 } 2706 2707 bool MIParser::parsePredicateOperand(MachineOperand &Dest) { 2708 assert(Token.is(MIToken::kw_intpred) || Token.is(MIToken::kw_floatpred)); 2709 bool IsFloat = Token.is(MIToken::kw_floatpred); 2710 lex(); 2711 2712 if (expectAndConsume(MIToken::lparen)) 2713 return error("expected syntax intpred(whatever) or floatpred(whatever"); 2714 2715 if (Token.isNot(MIToken::Identifier)) 2716 return error("whatever"); 2717 2718 CmpInst::Predicate Pred; 2719 if (IsFloat) { 2720 Pred = StringSwitch<CmpInst::Predicate>(Token.stringValue()) 2721 .Case("false", CmpInst::FCMP_FALSE) 2722 .Case("oeq", CmpInst::FCMP_OEQ) 2723 .Case("ogt", CmpInst::FCMP_OGT) 2724 .Case("oge", CmpInst::FCMP_OGE) 2725 .Case("olt", CmpInst::FCMP_OLT) 2726 .Case("ole", CmpInst::FCMP_OLE) 2727 .Case("one", CmpInst::FCMP_ONE) 2728 .Case("ord", CmpInst::FCMP_ORD) 2729 .Case("uno", CmpInst::FCMP_UNO) 2730 .Case("ueq", CmpInst::FCMP_UEQ) 2731 .Case("ugt", CmpInst::FCMP_UGT) 2732 .Case("uge", CmpInst::FCMP_UGE) 2733 .Case("ult", CmpInst::FCMP_ULT) 2734 .Case("ule", CmpInst::FCMP_ULE) 2735 .Case("une", CmpInst::FCMP_UNE) 2736 .Case("true", CmpInst::FCMP_TRUE) 2737 .Default(CmpInst::BAD_FCMP_PREDICATE); 2738 if (!CmpInst::isFPPredicate(Pred)) 2739 return error("invalid floating-point predicate"); 2740 } else { 2741 Pred = StringSwitch<CmpInst::Predicate>(Token.stringValue()) 2742 .Case("eq", CmpInst::ICMP_EQ) 2743 .Case("ne", CmpInst::ICMP_NE) 2744 .Case("sgt", CmpInst::ICMP_SGT) 2745 .Case("sge", CmpInst::ICMP_SGE) 2746 .Case("slt", CmpInst::ICMP_SLT) 2747 .Case("sle", CmpInst::ICMP_SLE) 2748 .Case("ugt", CmpInst::ICMP_UGT) 2749 .Case("uge", CmpInst::ICMP_UGE) 2750 .Case("ult", CmpInst::ICMP_ULT) 2751 .Case("ule", CmpInst::ICMP_ULE) 2752 .Default(CmpInst::BAD_ICMP_PREDICATE); 2753 if (!CmpInst::isIntPredicate(Pred)) 2754 return error("invalid integer predicate"); 2755 } 2756 2757 lex(); 2758 Dest = MachineOperand::CreatePredicate(Pred); 2759 if (expectAndConsume(MIToken::rparen)) 2760 return error("predicate should be terminated by ')'."); 2761 2762 return false; 2763 } 2764 2765 bool MIParser::parseShuffleMaskOperand(MachineOperand &Dest) { 2766 assert(Token.is(MIToken::kw_shufflemask)); 2767 2768 lex(); 2769 if (expectAndConsume(MIToken::lparen)) 2770 return error("expected syntax shufflemask(<integer or undef>, ...)"); 2771 2772 SmallVector<int, 32> ShufMask; 2773 do { 2774 if (Token.is(MIToken::kw_undef)) { 2775 ShufMask.push_back(-1); 2776 } else if (Token.is(MIToken::IntegerLiteral)) { 2777 const APSInt &Int = Token.integerValue(); 2778 ShufMask.push_back(Int.getExtValue()); 2779 } else 2780 return error("expected integer constant"); 2781 2782 lex(); 2783 } while (consumeIfPresent(MIToken::comma)); 2784 2785 if (expectAndConsume(MIToken::rparen)) 2786 return error("shufflemask should be terminated by ')'."); 2787 2788 ArrayRef<int> MaskAlloc = MF.allocateShuffleMask(ShufMask); 2789 Dest = MachineOperand::CreateShuffleMask(MaskAlloc); 2790 return false; 2791 } 2792 2793 bool MIParser::parseDbgInstrRefOperand(MachineOperand &Dest) { 2794 assert(Token.is(MIToken::kw_dbg_instr_ref)); 2795 2796 lex(); 2797 if (expectAndConsume(MIToken::lparen)) 2798 return error("expected syntax dbg-instr-ref(<unsigned>, <unsigned>)"); 2799 2800 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isNegative()) 2801 return error("expected unsigned integer for instruction index"); 2802 uint64_t InstrIdx = Token.integerValue().getZExtValue(); 2803 assert(InstrIdx <= std::numeric_limits<unsigned>::max() && 2804 "Instruction reference's instruction index is too large"); 2805 lex(); 2806 2807 if (expectAndConsume(MIToken::comma)) 2808 return error("expected syntax dbg-instr-ref(<unsigned>, <unsigned>)"); 2809 2810 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isNegative()) 2811 return error("expected unsigned integer for operand index"); 2812 uint64_t OpIdx = Token.integerValue().getZExtValue(); 2813 assert(OpIdx <= std::numeric_limits<unsigned>::max() && 2814 "Instruction reference's operand index is too large"); 2815 lex(); 2816 2817 if (expectAndConsume(MIToken::rparen)) 2818 return error("expected syntax dbg-instr-ref(<unsigned>, <unsigned>)"); 2819 2820 Dest = MachineOperand::CreateDbgInstrRef(InstrIdx, OpIdx); 2821 return false; 2822 } 2823 2824 bool MIParser::parseTargetIndexOperand(MachineOperand &Dest) { 2825 assert(Token.is(MIToken::kw_target_index)); 2826 lex(); 2827 if (expectAndConsume(MIToken::lparen)) 2828 return true; 2829 if (Token.isNot(MIToken::Identifier)) 2830 return error("expected the name of the target index"); 2831 int Index = 0; 2832 if (PFS.Target.getTargetIndex(Token.stringValue(), Index)) 2833 return error("use of undefined target index '" + Token.stringValue() + "'"); 2834 lex(); 2835 if (expectAndConsume(MIToken::rparen)) 2836 return true; 2837 Dest = MachineOperand::CreateTargetIndex(unsigned(Index), /*Offset=*/0); 2838 if (parseOperandsOffset(Dest)) 2839 return true; 2840 return false; 2841 } 2842 2843 bool MIParser::parseCustomRegisterMaskOperand(MachineOperand &Dest) { 2844 assert(Token.stringValue() == "CustomRegMask" && "Expected a custom RegMask"); 2845 lex(); 2846 if (expectAndConsume(MIToken::lparen)) 2847 return true; 2848 2849 uint32_t *Mask = MF.allocateRegMask(); 2850 do { 2851 if (Token.isNot(MIToken::rparen)) { 2852 if (Token.isNot(MIToken::NamedRegister)) 2853 return error("expected a named register"); 2854 Register Reg; 2855 if (parseNamedRegister(Reg)) 2856 return true; 2857 lex(); 2858 Mask[Reg.id() / 32] |= 1U << (Reg.id() % 32); 2859 } 2860 2861 // TODO: Report an error if the same register is used more than once. 2862 } while (consumeIfPresent(MIToken::comma)); 2863 2864 if (expectAndConsume(MIToken::rparen)) 2865 return true; 2866 Dest = MachineOperand::CreateRegMask(Mask); 2867 return false; 2868 } 2869 2870 bool MIParser::parseLiveoutRegisterMaskOperand(MachineOperand &Dest) { 2871 assert(Token.is(MIToken::kw_liveout)); 2872 uint32_t *Mask = MF.allocateRegMask(); 2873 lex(); 2874 if (expectAndConsume(MIToken::lparen)) 2875 return true; 2876 while (true) { 2877 if (Token.isNot(MIToken::NamedRegister)) 2878 return error("expected a named register"); 2879 Register Reg; 2880 if (parseNamedRegister(Reg)) 2881 return true; 2882 lex(); 2883 Mask[Reg.id() / 32] |= 1U << (Reg.id() % 32); 2884 // TODO: Report an error if the same register is used more than once. 2885 if (Token.isNot(MIToken::comma)) 2886 break; 2887 lex(); 2888 } 2889 if (expectAndConsume(MIToken::rparen)) 2890 return true; 2891 Dest = MachineOperand::CreateRegLiveOut(Mask); 2892 return false; 2893 } 2894 2895 bool MIParser::parseMachineOperand(const unsigned OpCode, const unsigned OpIdx, 2896 MachineOperand &Dest, 2897 std::optional<unsigned> &TiedDefIdx) { 2898 switch (Token.kind()) { 2899 case MIToken::kw_implicit: 2900 case MIToken::kw_implicit_define: 2901 case MIToken::kw_def: 2902 case MIToken::kw_dead: 2903 case MIToken::kw_killed: 2904 case MIToken::kw_undef: 2905 case MIToken::kw_internal: 2906 case MIToken::kw_early_clobber: 2907 case MIToken::kw_debug_use: 2908 case MIToken::kw_renamable: 2909 case MIToken::underscore: 2910 case MIToken::NamedRegister: 2911 case MIToken::VirtualRegister: 2912 case MIToken::NamedVirtualRegister: 2913 return parseRegisterOperand(Dest, TiedDefIdx); 2914 case MIToken::IntegerLiteral: 2915 return parseImmediateOperand(Dest); 2916 case MIToken::kw_half: 2917 case MIToken::kw_bfloat: 2918 case MIToken::kw_float: 2919 case MIToken::kw_double: 2920 case MIToken::kw_x86_fp80: 2921 case MIToken::kw_fp128: 2922 case MIToken::kw_ppc_fp128: 2923 return parseFPImmediateOperand(Dest); 2924 case MIToken::MachineBasicBlock: 2925 return parseMBBOperand(Dest); 2926 case MIToken::StackObject: 2927 return parseStackObjectOperand(Dest); 2928 case MIToken::FixedStackObject: 2929 return parseFixedStackObjectOperand(Dest); 2930 case MIToken::GlobalValue: 2931 case MIToken::NamedGlobalValue: 2932 return parseGlobalAddressOperand(Dest); 2933 case MIToken::ConstantPoolItem: 2934 return parseConstantPoolIndexOperand(Dest); 2935 case MIToken::JumpTableIndex: 2936 return parseJumpTableIndexOperand(Dest); 2937 case MIToken::ExternalSymbol: 2938 return parseExternalSymbolOperand(Dest); 2939 case MIToken::MCSymbol: 2940 return parseMCSymbolOperand(Dest); 2941 case MIToken::SubRegisterIndex: 2942 return parseSubRegisterIndexOperand(Dest); 2943 case MIToken::md_diexpr: 2944 case MIToken::exclaim: 2945 return parseMetadataOperand(Dest); 2946 case MIToken::kw_cfi_same_value: 2947 case MIToken::kw_cfi_offset: 2948 case MIToken::kw_cfi_rel_offset: 2949 case MIToken::kw_cfi_def_cfa_register: 2950 case MIToken::kw_cfi_def_cfa_offset: 2951 case MIToken::kw_cfi_adjust_cfa_offset: 2952 case MIToken::kw_cfi_escape: 2953 case MIToken::kw_cfi_def_cfa: 2954 case MIToken::kw_cfi_llvm_def_aspace_cfa: 2955 case MIToken::kw_cfi_register: 2956 case MIToken::kw_cfi_remember_state: 2957 case MIToken::kw_cfi_restore: 2958 case MIToken::kw_cfi_restore_state: 2959 case MIToken::kw_cfi_undefined: 2960 case MIToken::kw_cfi_window_save: 2961 case MIToken::kw_cfi_aarch64_negate_ra_sign_state: 2962 case MIToken::kw_cfi_aarch64_negate_ra_sign_state_with_pc: 2963 return parseCFIOperand(Dest); 2964 case MIToken::kw_blockaddress: 2965 return parseBlockAddressOperand(Dest); 2966 case MIToken::kw_intrinsic: 2967 return parseIntrinsicOperand(Dest); 2968 case MIToken::kw_target_index: 2969 return parseTargetIndexOperand(Dest); 2970 case MIToken::kw_liveout: 2971 return parseLiveoutRegisterMaskOperand(Dest); 2972 case MIToken::kw_floatpred: 2973 case MIToken::kw_intpred: 2974 return parsePredicateOperand(Dest); 2975 case MIToken::kw_shufflemask: 2976 return parseShuffleMaskOperand(Dest); 2977 case MIToken::kw_dbg_instr_ref: 2978 return parseDbgInstrRefOperand(Dest); 2979 case MIToken::Error: 2980 return true; 2981 case MIToken::Identifier: 2982 if (const auto *RegMask = PFS.Target.getRegMask(Token.stringValue())) { 2983 Dest = MachineOperand::CreateRegMask(RegMask); 2984 lex(); 2985 break; 2986 } else if (Token.stringValue() == "CustomRegMask") { 2987 return parseCustomRegisterMaskOperand(Dest); 2988 } else 2989 return parseTypedImmediateOperand(Dest); 2990 case MIToken::dot: { 2991 const auto *TII = MF.getSubtarget().getInstrInfo(); 2992 if (const auto *Formatter = TII->getMIRFormatter()) { 2993 return parseTargetImmMnemonic(OpCode, OpIdx, Dest, *Formatter); 2994 } 2995 [[fallthrough]]; 2996 } 2997 default: 2998 // FIXME: Parse the MCSymbol machine operand. 2999 return error("expected a machine operand"); 3000 } 3001 return false; 3002 } 3003 3004 bool MIParser::parseMachineOperandAndTargetFlags( 3005 const unsigned OpCode, const unsigned OpIdx, MachineOperand &Dest, 3006 std::optional<unsigned> &TiedDefIdx) { 3007 unsigned TF = 0; 3008 bool HasTargetFlags = false; 3009 if (Token.is(MIToken::kw_target_flags)) { 3010 HasTargetFlags = true; 3011 lex(); 3012 if (expectAndConsume(MIToken::lparen)) 3013 return true; 3014 if (Token.isNot(MIToken::Identifier)) 3015 return error("expected the name of the target flag"); 3016 if (PFS.Target.getDirectTargetFlag(Token.stringValue(), TF)) { 3017 if (PFS.Target.getBitmaskTargetFlag(Token.stringValue(), TF)) 3018 return error("use of undefined target flag '" + Token.stringValue() + 3019 "'"); 3020 } 3021 lex(); 3022 while (Token.is(MIToken::comma)) { 3023 lex(); 3024 if (Token.isNot(MIToken::Identifier)) 3025 return error("expected the name of the target flag"); 3026 unsigned BitFlag = 0; 3027 if (PFS.Target.getBitmaskTargetFlag(Token.stringValue(), BitFlag)) 3028 return error("use of undefined target flag '" + Token.stringValue() + 3029 "'"); 3030 // TODO: Report an error when using a duplicate bit target flag. 3031 TF |= BitFlag; 3032 lex(); 3033 } 3034 if (expectAndConsume(MIToken::rparen)) 3035 return true; 3036 } 3037 auto Loc = Token.location(); 3038 if (parseMachineOperand(OpCode, OpIdx, Dest, TiedDefIdx)) 3039 return true; 3040 if (!HasTargetFlags) 3041 return false; 3042 if (Dest.isReg()) 3043 return error(Loc, "register operands can't have target flags"); 3044 Dest.setTargetFlags(TF); 3045 return false; 3046 } 3047 3048 bool MIParser::parseOffset(int64_t &Offset) { 3049 if (Token.isNot(MIToken::plus) && Token.isNot(MIToken::minus)) 3050 return false; 3051 StringRef Sign = Token.range(); 3052 bool IsNegative = Token.is(MIToken::minus); 3053 lex(); 3054 if (Token.isNot(MIToken::IntegerLiteral)) 3055 return error("expected an integer literal after '" + Sign + "'"); 3056 if (Token.integerValue().getSignificantBits() > 64) 3057 return error("expected 64-bit integer (too large)"); 3058 Offset = Token.integerValue().getExtValue(); 3059 if (IsNegative) 3060 Offset = -Offset; 3061 lex(); 3062 return false; 3063 } 3064 3065 bool MIParser::parseIRBlockAddressTaken(BasicBlock *&BB) { 3066 assert(Token.is(MIToken::kw_ir_block_address_taken)); 3067 lex(); 3068 if (Token.isNot(MIToken::IRBlock) && Token.isNot(MIToken::NamedIRBlock)) 3069 return error("expected basic block after 'ir_block_address_taken'"); 3070 3071 if (parseIRBlock(BB, MF.getFunction())) 3072 return true; 3073 3074 lex(); 3075 return false; 3076 } 3077 3078 bool MIParser::parseAlignment(uint64_t &Alignment) { 3079 assert(Token.is(MIToken::kw_align) || Token.is(MIToken::kw_basealign)); 3080 lex(); 3081 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isSigned()) 3082 return error("expected an integer literal after 'align'"); 3083 if (getUint64(Alignment)) 3084 return true; 3085 lex(); 3086 3087 if (!isPowerOf2_64(Alignment)) 3088 return error("expected a power-of-2 literal after 'align'"); 3089 3090 return false; 3091 } 3092 3093 bool MIParser::parseAddrspace(unsigned &Addrspace) { 3094 assert(Token.is(MIToken::kw_addrspace)); 3095 lex(); 3096 if (Token.isNot(MIToken::IntegerLiteral) || Token.integerValue().isSigned()) 3097 return error("expected an integer literal after 'addrspace'"); 3098 if (getUnsigned(Addrspace)) 3099 return true; 3100 lex(); 3101 return false; 3102 } 3103 3104 bool MIParser::parseOperandsOffset(MachineOperand &Op) { 3105 int64_t Offset = 0; 3106 if (parseOffset(Offset)) 3107 return true; 3108 Op.setOffset(Offset); 3109 return false; 3110 } 3111 3112 static bool parseIRValue(const MIToken &Token, PerFunctionMIParsingState &PFS, 3113 const Value *&V, ErrorCallbackType ErrCB) { 3114 switch (Token.kind()) { 3115 case MIToken::NamedIRValue: { 3116 V = PFS.MF.getFunction().getValueSymbolTable()->lookup(Token.stringValue()); 3117 break; 3118 } 3119 case MIToken::IRValue: { 3120 unsigned SlotNumber = 0; 3121 if (getUnsigned(Token, SlotNumber, ErrCB)) 3122 return true; 3123 V = PFS.getIRValue(SlotNumber); 3124 break; 3125 } 3126 case MIToken::NamedGlobalValue: 3127 case MIToken::GlobalValue: { 3128 GlobalValue *GV = nullptr; 3129 if (parseGlobalValue(Token, PFS, GV, ErrCB)) 3130 return true; 3131 V = GV; 3132 break; 3133 } 3134 case MIToken::QuotedIRValue: { 3135 const Constant *C = nullptr; 3136 if (parseIRConstant(Token.location(), Token.stringValue(), PFS, C, ErrCB)) 3137 return true; 3138 V = C; 3139 break; 3140 } 3141 case MIToken::kw_unknown_address: 3142 V = nullptr; 3143 return false; 3144 default: 3145 llvm_unreachable("The current token should be an IR block reference"); 3146 } 3147 if (!V) 3148 return ErrCB(Token.location(), Twine("use of undefined IR value '") + Token.range() + "'"); 3149 return false; 3150 } 3151 3152 bool MIParser::parseIRValue(const Value *&V) { 3153 return ::parseIRValue( 3154 Token, PFS, V, [this](StringRef::iterator Loc, const Twine &Msg) -> bool { 3155 return error(Loc, Msg); 3156 }); 3157 } 3158 3159 bool MIParser::getUint64(uint64_t &Result) { 3160 if (Token.hasIntegerValue()) { 3161 if (Token.integerValue().getActiveBits() > 64) 3162 return error("expected 64-bit integer (too large)"); 3163 Result = Token.integerValue().getZExtValue(); 3164 return false; 3165 } 3166 if (Token.is(MIToken::HexLiteral)) { 3167 APInt A; 3168 if (getHexUint(A)) 3169 return true; 3170 if (A.getBitWidth() > 64) 3171 return error("expected 64-bit integer (too large)"); 3172 Result = A.getZExtValue(); 3173 return false; 3174 } 3175 return true; 3176 } 3177 3178 bool MIParser::getHexUint(APInt &Result) { 3179 return ::getHexUint(Token, Result); 3180 } 3181 3182 bool MIParser::parseMemoryOperandFlag(MachineMemOperand::Flags &Flags) { 3183 const auto OldFlags = Flags; 3184 switch (Token.kind()) { 3185 case MIToken::kw_volatile: 3186 Flags |= MachineMemOperand::MOVolatile; 3187 break; 3188 case MIToken::kw_non_temporal: 3189 Flags |= MachineMemOperand::MONonTemporal; 3190 break; 3191 case MIToken::kw_dereferenceable: 3192 Flags |= MachineMemOperand::MODereferenceable; 3193 break; 3194 case MIToken::kw_invariant: 3195 Flags |= MachineMemOperand::MOInvariant; 3196 break; 3197 case MIToken::StringConstant: { 3198 MachineMemOperand::Flags TF; 3199 if (PFS.Target.getMMOTargetFlag(Token.stringValue(), TF)) 3200 return error("use of undefined target MMO flag '" + Token.stringValue() + 3201 "'"); 3202 Flags |= TF; 3203 break; 3204 } 3205 default: 3206 llvm_unreachable("The current token should be a memory operand flag"); 3207 } 3208 if (OldFlags == Flags) 3209 // We know that the same flag is specified more than once when the flags 3210 // weren't modified. 3211 return error("duplicate '" + Token.stringValue() + "' memory operand flag"); 3212 lex(); 3213 return false; 3214 } 3215 3216 bool MIParser::parseMemoryPseudoSourceValue(const PseudoSourceValue *&PSV) { 3217 switch (Token.kind()) { 3218 case MIToken::kw_stack: 3219 PSV = MF.getPSVManager().getStack(); 3220 break; 3221 case MIToken::kw_got: 3222 PSV = MF.getPSVManager().getGOT(); 3223 break; 3224 case MIToken::kw_jump_table: 3225 PSV = MF.getPSVManager().getJumpTable(); 3226 break; 3227 case MIToken::kw_constant_pool: 3228 PSV = MF.getPSVManager().getConstantPool(); 3229 break; 3230 case MIToken::FixedStackObject: { 3231 int FI; 3232 if (parseFixedStackFrameIndex(FI)) 3233 return true; 3234 PSV = MF.getPSVManager().getFixedStack(FI); 3235 // The token was already consumed, so use return here instead of break. 3236 return false; 3237 } 3238 case MIToken::StackObject: { 3239 int FI; 3240 if (parseStackFrameIndex(FI)) 3241 return true; 3242 PSV = MF.getPSVManager().getFixedStack(FI); 3243 // The token was already consumed, so use return here instead of break. 3244 return false; 3245 } 3246 case MIToken::kw_call_entry: 3247 lex(); 3248 switch (Token.kind()) { 3249 case MIToken::GlobalValue: 3250 case MIToken::NamedGlobalValue: { 3251 GlobalValue *GV = nullptr; 3252 if (parseGlobalValue(GV)) 3253 return true; 3254 PSV = MF.getPSVManager().getGlobalValueCallEntry(GV); 3255 break; 3256 } 3257 case MIToken::ExternalSymbol: 3258 PSV = MF.getPSVManager().getExternalSymbolCallEntry( 3259 MF.createExternalSymbolName(Token.stringValue())); 3260 break; 3261 default: 3262 return error( 3263 "expected a global value or an external symbol after 'call-entry'"); 3264 } 3265 break; 3266 case MIToken::kw_custom: { 3267 lex(); 3268 const auto *TII = MF.getSubtarget().getInstrInfo(); 3269 if (const auto *Formatter = TII->getMIRFormatter()) { 3270 if (Formatter->parseCustomPseudoSourceValue( 3271 Token.stringValue(), MF, PFS, PSV, 3272 [this](StringRef::iterator Loc, const Twine &Msg) -> bool { 3273 return error(Loc, Msg); 3274 })) 3275 return true; 3276 } else 3277 return error("unable to parse target custom pseudo source value"); 3278 break; 3279 } 3280 default: 3281 llvm_unreachable("The current token should be pseudo source value"); 3282 } 3283 lex(); 3284 return false; 3285 } 3286 3287 bool MIParser::parseMachinePointerInfo(MachinePointerInfo &Dest) { 3288 if (Token.is(MIToken::kw_constant_pool) || Token.is(MIToken::kw_stack) || 3289 Token.is(MIToken::kw_got) || Token.is(MIToken::kw_jump_table) || 3290 Token.is(MIToken::FixedStackObject) || Token.is(MIToken::StackObject) || 3291 Token.is(MIToken::kw_call_entry) || Token.is(MIToken::kw_custom)) { 3292 const PseudoSourceValue *PSV = nullptr; 3293 if (parseMemoryPseudoSourceValue(PSV)) 3294 return true; 3295 int64_t Offset = 0; 3296 if (parseOffset(Offset)) 3297 return true; 3298 Dest = MachinePointerInfo(PSV, Offset); 3299 return false; 3300 } 3301 if (Token.isNot(MIToken::NamedIRValue) && Token.isNot(MIToken::IRValue) && 3302 Token.isNot(MIToken::GlobalValue) && 3303 Token.isNot(MIToken::NamedGlobalValue) && 3304 Token.isNot(MIToken::QuotedIRValue) && 3305 Token.isNot(MIToken::kw_unknown_address)) 3306 return error("expected an IR value reference"); 3307 const Value *V = nullptr; 3308 if (parseIRValue(V)) 3309 return true; 3310 if (V && !V->getType()->isPointerTy()) 3311 return error("expected a pointer IR value"); 3312 lex(); 3313 int64_t Offset = 0; 3314 if (parseOffset(Offset)) 3315 return true; 3316 Dest = MachinePointerInfo(V, Offset); 3317 return false; 3318 } 3319 3320 bool MIParser::parseOptionalScope(LLVMContext &Context, 3321 SyncScope::ID &SSID) { 3322 SSID = SyncScope::System; 3323 if (Token.is(MIToken::Identifier) && Token.stringValue() == "syncscope") { 3324 lex(); 3325 if (expectAndConsume(MIToken::lparen)) 3326 return error("expected '(' in syncscope"); 3327 3328 std::string SSN; 3329 if (parseStringConstant(SSN)) 3330 return true; 3331 3332 SSID = Context.getOrInsertSyncScopeID(SSN); 3333 if (expectAndConsume(MIToken::rparen)) 3334 return error("expected ')' in syncscope"); 3335 } 3336 3337 return false; 3338 } 3339 3340 bool MIParser::parseOptionalAtomicOrdering(AtomicOrdering &Order) { 3341 Order = AtomicOrdering::NotAtomic; 3342 if (Token.isNot(MIToken::Identifier)) 3343 return false; 3344 3345 Order = StringSwitch<AtomicOrdering>(Token.stringValue()) 3346 .Case("unordered", AtomicOrdering::Unordered) 3347 .Case("monotonic", AtomicOrdering::Monotonic) 3348 .Case("acquire", AtomicOrdering::Acquire) 3349 .Case("release", AtomicOrdering::Release) 3350 .Case("acq_rel", AtomicOrdering::AcquireRelease) 3351 .Case("seq_cst", AtomicOrdering::SequentiallyConsistent) 3352 .Default(AtomicOrdering::NotAtomic); 3353 3354 if (Order != AtomicOrdering::NotAtomic) { 3355 lex(); 3356 return false; 3357 } 3358 3359 return error("expected an atomic scope, ordering or a size specification"); 3360 } 3361 3362 bool MIParser::parseMachineMemoryOperand(MachineMemOperand *&Dest) { 3363 if (expectAndConsume(MIToken::lparen)) 3364 return true; 3365 MachineMemOperand::Flags Flags = MachineMemOperand::MONone; 3366 while (Token.isMemoryOperandFlag()) { 3367 if (parseMemoryOperandFlag(Flags)) 3368 return true; 3369 } 3370 if (Token.isNot(MIToken::Identifier) || 3371 (Token.stringValue() != "load" && Token.stringValue() != "store")) 3372 return error("expected 'load' or 'store' memory operation"); 3373 if (Token.stringValue() == "load") 3374 Flags |= MachineMemOperand::MOLoad; 3375 else 3376 Flags |= MachineMemOperand::MOStore; 3377 lex(); 3378 3379 // Optional 'store' for operands that both load and store. 3380 if (Token.is(MIToken::Identifier) && Token.stringValue() == "store") { 3381 Flags |= MachineMemOperand::MOStore; 3382 lex(); 3383 } 3384 3385 // Optional synchronization scope. 3386 SyncScope::ID SSID; 3387 if (parseOptionalScope(MF.getFunction().getContext(), SSID)) 3388 return true; 3389 3390 // Up to two atomic orderings (cmpxchg provides guarantees on failure). 3391 AtomicOrdering Order, FailureOrder; 3392 if (parseOptionalAtomicOrdering(Order)) 3393 return true; 3394 3395 if (parseOptionalAtomicOrdering(FailureOrder)) 3396 return true; 3397 3398 if (Token.isNot(MIToken::IntegerLiteral) && 3399 Token.isNot(MIToken::kw_unknown_size) && 3400 Token.isNot(MIToken::lparen)) 3401 return error("expected memory LLT, the size integer literal or 'unknown-size' after " 3402 "memory operation"); 3403 3404 LLT MemoryType; 3405 if (Token.is(MIToken::IntegerLiteral)) { 3406 uint64_t Size; 3407 if (getUint64(Size)) 3408 return true; 3409 3410 // Convert from bytes to bits for storage. 3411 MemoryType = LLT::scalar(8 * Size); 3412 lex(); 3413 } else if (Token.is(MIToken::kw_unknown_size)) { 3414 lex(); 3415 } else { 3416 if (expectAndConsume(MIToken::lparen)) 3417 return true; 3418 if (parseLowLevelType(Token.location(), MemoryType)) 3419 return true; 3420 if (expectAndConsume(MIToken::rparen)) 3421 return true; 3422 } 3423 3424 MachinePointerInfo Ptr = MachinePointerInfo(); 3425 if (Token.is(MIToken::Identifier)) { 3426 const char *Word = 3427 ((Flags & MachineMemOperand::MOLoad) && 3428 (Flags & MachineMemOperand::MOStore)) 3429 ? "on" 3430 : Flags & MachineMemOperand::MOLoad ? "from" : "into"; 3431 if (Token.stringValue() != Word) 3432 return error(Twine("expected '") + Word + "'"); 3433 lex(); 3434 3435 if (parseMachinePointerInfo(Ptr)) 3436 return true; 3437 } 3438 uint64_t BaseAlignment = 3439 MemoryType.isValid() 3440 ? PowerOf2Ceil(MemoryType.getSizeInBytes().getKnownMinValue()) 3441 : 1; 3442 AAMDNodes AAInfo; 3443 MDNode *Range = nullptr; 3444 while (consumeIfPresent(MIToken::comma)) { 3445 switch (Token.kind()) { 3446 case MIToken::kw_align: { 3447 // align is printed if it is different than size. 3448 uint64_t Alignment; 3449 if (parseAlignment(Alignment)) 3450 return true; 3451 if (Ptr.Offset & (Alignment - 1)) { 3452 // MachineMemOperand::getAlign never returns a value greater than the 3453 // alignment of offset, so this just guards against hand-written MIR 3454 // that specifies a large "align" value when it should probably use 3455 // "basealign" instead. 3456 return error("specified alignment is more aligned than offset"); 3457 } 3458 BaseAlignment = Alignment; 3459 break; 3460 } 3461 case MIToken::kw_basealign: 3462 // basealign is printed if it is different than align. 3463 if (parseAlignment(BaseAlignment)) 3464 return true; 3465 break; 3466 case MIToken::kw_addrspace: 3467 if (parseAddrspace(Ptr.AddrSpace)) 3468 return true; 3469 break; 3470 case MIToken::md_tbaa: 3471 lex(); 3472 if (parseMDNode(AAInfo.TBAA)) 3473 return true; 3474 break; 3475 case MIToken::md_alias_scope: 3476 lex(); 3477 if (parseMDNode(AAInfo.Scope)) 3478 return true; 3479 break; 3480 case MIToken::md_noalias: 3481 lex(); 3482 if (parseMDNode(AAInfo.NoAlias)) 3483 return true; 3484 break; 3485 case MIToken::md_range: 3486 lex(); 3487 if (parseMDNode(Range)) 3488 return true; 3489 break; 3490 // TODO: Report an error on duplicate metadata nodes. 3491 default: 3492 return error("expected 'align' or '!tbaa' or '!alias.scope' or " 3493 "'!noalias' or '!range'"); 3494 } 3495 } 3496 if (expectAndConsume(MIToken::rparen)) 3497 return true; 3498 Dest = MF.getMachineMemOperand(Ptr, Flags, MemoryType, Align(BaseAlignment), 3499 AAInfo, Range, SSID, Order, FailureOrder); 3500 return false; 3501 } 3502 3503 bool MIParser::parsePreOrPostInstrSymbol(MCSymbol *&Symbol) { 3504 assert((Token.is(MIToken::kw_pre_instr_symbol) || 3505 Token.is(MIToken::kw_post_instr_symbol)) && 3506 "Invalid token for a pre- post-instruction symbol!"); 3507 lex(); 3508 if (Token.isNot(MIToken::MCSymbol)) 3509 return error("expected a symbol after 'pre-instr-symbol'"); 3510 Symbol = getOrCreateMCSymbol(Token.stringValue()); 3511 lex(); 3512 if (Token.isNewlineOrEOF() || Token.is(MIToken::coloncolon) || 3513 Token.is(MIToken::lbrace)) 3514 return false; 3515 if (Token.isNot(MIToken::comma)) 3516 return error("expected ',' before the next machine operand"); 3517 lex(); 3518 return false; 3519 } 3520 3521 bool MIParser::parseHeapAllocMarker(MDNode *&Node) { 3522 assert(Token.is(MIToken::kw_heap_alloc_marker) && 3523 "Invalid token for a heap alloc marker!"); 3524 lex(); 3525 if (parseMDNode(Node)) 3526 return true; 3527 if (!Node) 3528 return error("expected a MDNode after 'heap-alloc-marker'"); 3529 if (Token.isNewlineOrEOF() || Token.is(MIToken::coloncolon) || 3530 Token.is(MIToken::lbrace)) 3531 return false; 3532 if (Token.isNot(MIToken::comma)) 3533 return error("expected ',' before the next machine operand"); 3534 lex(); 3535 return false; 3536 } 3537 3538 bool MIParser::parsePCSections(MDNode *&Node) { 3539 assert(Token.is(MIToken::kw_pcsections) && 3540 "Invalid token for a PC sections!"); 3541 lex(); 3542 if (parseMDNode(Node)) 3543 return true; 3544 if (!Node) 3545 return error("expected a MDNode after 'pcsections'"); 3546 if (Token.isNewlineOrEOF() || Token.is(MIToken::coloncolon) || 3547 Token.is(MIToken::lbrace)) 3548 return false; 3549 if (Token.isNot(MIToken::comma)) 3550 return error("expected ',' before the next machine operand"); 3551 lex(); 3552 return false; 3553 } 3554 3555 static void initSlots2BasicBlocks( 3556 const Function &F, 3557 DenseMap<unsigned, const BasicBlock *> &Slots2BasicBlocks) { 3558 ModuleSlotTracker MST(F.getParent(), /*ShouldInitializeAllMetadata=*/false); 3559 MST.incorporateFunction(F); 3560 for (const auto &BB : F) { 3561 if (BB.hasName()) 3562 continue; 3563 int Slot = MST.getLocalSlot(&BB); 3564 if (Slot == -1) 3565 continue; 3566 Slots2BasicBlocks.insert(std::make_pair(unsigned(Slot), &BB)); 3567 } 3568 } 3569 3570 static const BasicBlock *getIRBlockFromSlot( 3571 unsigned Slot, 3572 const DenseMap<unsigned, const BasicBlock *> &Slots2BasicBlocks) { 3573 return Slots2BasicBlocks.lookup(Slot); 3574 } 3575 3576 const BasicBlock *MIParser::getIRBlock(unsigned Slot) { 3577 if (Slots2BasicBlocks.empty()) 3578 initSlots2BasicBlocks(MF.getFunction(), Slots2BasicBlocks); 3579 return getIRBlockFromSlot(Slot, Slots2BasicBlocks); 3580 } 3581 3582 const BasicBlock *MIParser::getIRBlock(unsigned Slot, const Function &F) { 3583 if (&F == &MF.getFunction()) 3584 return getIRBlock(Slot); 3585 DenseMap<unsigned, const BasicBlock *> CustomSlots2BasicBlocks; 3586 initSlots2BasicBlocks(F, CustomSlots2BasicBlocks); 3587 return getIRBlockFromSlot(Slot, CustomSlots2BasicBlocks); 3588 } 3589 3590 MCSymbol *MIParser::getOrCreateMCSymbol(StringRef Name) { 3591 // FIXME: Currently we can't recognize temporary or local symbols and call all 3592 // of the appropriate forms to create them. However, this handles basic cases 3593 // well as most of the special aspects are recognized by a prefix on their 3594 // name, and the input names should already be unique. For test cases, keeping 3595 // the symbol name out of the symbol table isn't terribly important. 3596 return MF.getContext().getOrCreateSymbol(Name); 3597 } 3598 3599 bool MIParser::parseStringConstant(std::string &Result) { 3600 if (Token.isNot(MIToken::StringConstant)) 3601 return error("expected string constant"); 3602 Result = std::string(Token.stringValue()); 3603 lex(); 3604 return false; 3605 } 3606 3607 bool llvm::parseMachineBasicBlockDefinitions(PerFunctionMIParsingState &PFS, 3608 StringRef Src, 3609 SMDiagnostic &Error) { 3610 return MIParser(PFS, Error, Src).parseBasicBlockDefinitions(PFS.MBBSlots); 3611 } 3612 3613 bool llvm::parseMachineInstructions(PerFunctionMIParsingState &PFS, 3614 StringRef Src, SMDiagnostic &Error) { 3615 return MIParser(PFS, Error, Src).parseBasicBlocks(); 3616 } 3617 3618 bool llvm::parseMBBReference(PerFunctionMIParsingState &PFS, 3619 MachineBasicBlock *&MBB, StringRef Src, 3620 SMDiagnostic &Error) { 3621 return MIParser(PFS, Error, Src).parseStandaloneMBB(MBB); 3622 } 3623 3624 bool llvm::parseRegisterReference(PerFunctionMIParsingState &PFS, 3625 Register &Reg, StringRef Src, 3626 SMDiagnostic &Error) { 3627 return MIParser(PFS, Error, Src).parseStandaloneRegister(Reg); 3628 } 3629 3630 bool llvm::parseNamedRegisterReference(PerFunctionMIParsingState &PFS, 3631 Register &Reg, StringRef Src, 3632 SMDiagnostic &Error) { 3633 return MIParser(PFS, Error, Src).parseStandaloneNamedRegister(Reg); 3634 } 3635 3636 bool llvm::parseVirtualRegisterReference(PerFunctionMIParsingState &PFS, 3637 VRegInfo *&Info, StringRef Src, 3638 SMDiagnostic &Error) { 3639 return MIParser(PFS, Error, Src).parseStandaloneVirtualRegister(Info); 3640 } 3641 3642 bool llvm::parseStackObjectReference(PerFunctionMIParsingState &PFS, 3643 int &FI, StringRef Src, 3644 SMDiagnostic &Error) { 3645 return MIParser(PFS, Error, Src).parseStandaloneStackObject(FI); 3646 } 3647 3648 bool llvm::parseMDNode(PerFunctionMIParsingState &PFS, 3649 MDNode *&Node, StringRef Src, SMDiagnostic &Error) { 3650 return MIParser(PFS, Error, Src).parseStandaloneMDNode(Node); 3651 } 3652 3653 bool llvm::parseMachineMetadata(PerFunctionMIParsingState &PFS, StringRef Src, 3654 SMRange SrcRange, SMDiagnostic &Error) { 3655 return MIParser(PFS, Error, Src, SrcRange).parseMachineMetadata(); 3656 } 3657 3658 bool MIRFormatter::parseIRValue(StringRef Src, MachineFunction &MF, 3659 PerFunctionMIParsingState &PFS, const Value *&V, 3660 ErrorCallbackType ErrorCallback) { 3661 MIToken Token; 3662 Src = lexMIToken(Src, Token, [&](StringRef::iterator Loc, const Twine &Msg) { 3663 ErrorCallback(Loc, Msg); 3664 }); 3665 V = nullptr; 3666 3667 return ::parseIRValue(Token, PFS, V, ErrorCallback); 3668 } 3669