10b57cec5SDimitry Andric //===- MILexer.h - Lexer for machine instructions ---------------*- C++ -*-===// 20b57cec5SDimitry Andric // 30b57cec5SDimitry Andric // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 40b57cec5SDimitry Andric // See https://llvm.org/LICENSE.txt for license information. 50b57cec5SDimitry Andric // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 60b57cec5SDimitry Andric // 70b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 80b57cec5SDimitry Andric // 90b57cec5SDimitry Andric // This file declares the function that lexes the machine instruction source 100b57cec5SDimitry Andric // string. 110b57cec5SDimitry Andric // 120b57cec5SDimitry Andric //===----------------------------------------------------------------------===// 130b57cec5SDimitry Andric 140b57cec5SDimitry Andric #ifndef LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H 150b57cec5SDimitry Andric #define LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H 160b57cec5SDimitry Andric 170b57cec5SDimitry Andric #include "llvm/ADT/APSInt.h" 180b57cec5SDimitry Andric #include "llvm/ADT/StringRef.h" 190b57cec5SDimitry Andric #include <string> 200b57cec5SDimitry Andric 210b57cec5SDimitry Andric namespace llvm { 220b57cec5SDimitry Andric 230b57cec5SDimitry Andric class Twine; 240b57cec5SDimitry Andric 250b57cec5SDimitry Andric /// A token produced by the machine instruction lexer. 260b57cec5SDimitry Andric struct MIToken { 270b57cec5SDimitry Andric enum TokenKind { 280b57cec5SDimitry Andric // Markers 290b57cec5SDimitry Andric Eof, 300b57cec5SDimitry Andric Error, 310b57cec5SDimitry Andric Newline, 320b57cec5SDimitry Andric 330b57cec5SDimitry Andric // Tokens with no info. 340b57cec5SDimitry Andric comma, 350b57cec5SDimitry Andric equal, 360b57cec5SDimitry Andric underscore, 370b57cec5SDimitry Andric colon, 380b57cec5SDimitry Andric coloncolon, 390b57cec5SDimitry Andric dot, 400b57cec5SDimitry Andric exclaim, 410b57cec5SDimitry Andric lparen, 420b57cec5SDimitry Andric rparen, 430b57cec5SDimitry Andric lbrace, 440b57cec5SDimitry Andric rbrace, 450b57cec5SDimitry Andric plus, 460b57cec5SDimitry Andric minus, 470b57cec5SDimitry Andric less, 480b57cec5SDimitry Andric greater, 490b57cec5SDimitry Andric 500b57cec5SDimitry Andric // Keywords 510b57cec5SDimitry Andric kw_implicit, 520b57cec5SDimitry Andric kw_implicit_define, 530b57cec5SDimitry Andric kw_def, 540b57cec5SDimitry Andric kw_dead, 550b57cec5SDimitry Andric kw_dereferenceable, 560b57cec5SDimitry Andric kw_killed, 570b57cec5SDimitry Andric kw_undef, 580b57cec5SDimitry Andric kw_internal, 590b57cec5SDimitry Andric kw_early_clobber, 600b57cec5SDimitry Andric kw_debug_use, 610b57cec5SDimitry Andric kw_renamable, 620b57cec5SDimitry Andric kw_tied_def, 630b57cec5SDimitry Andric kw_frame_setup, 640b57cec5SDimitry Andric kw_frame_destroy, 650b57cec5SDimitry Andric kw_nnan, 660b57cec5SDimitry Andric kw_ninf, 670b57cec5SDimitry Andric kw_nsz, 680b57cec5SDimitry Andric kw_arcp, 690b57cec5SDimitry Andric kw_contract, 700b57cec5SDimitry Andric kw_afn, 710b57cec5SDimitry Andric kw_reassoc, 72*0fca6ea1SDimitry Andric kw_nusw, 730b57cec5SDimitry Andric kw_nuw, 740b57cec5SDimitry Andric kw_nsw, 750b57cec5SDimitry Andric kw_exact, 76480093f4SDimitry Andric kw_nofpexcept, 7706c3fb27SDimitry Andric kw_unpredictable, 78*0fca6ea1SDimitry Andric kw_nneg, 79*0fca6ea1SDimitry Andric kw_disjoint, 800b57cec5SDimitry Andric kw_debug_location, 81e8d8bef9SDimitry Andric kw_debug_instr_number, 82bdd1243dSDimitry Andric kw_dbg_instr_ref, 830b57cec5SDimitry Andric kw_cfi_same_value, 840b57cec5SDimitry Andric kw_cfi_offset, 850b57cec5SDimitry Andric kw_cfi_rel_offset, 860b57cec5SDimitry Andric kw_cfi_def_cfa_register, 870b57cec5SDimitry Andric kw_cfi_def_cfa_offset, 880b57cec5SDimitry Andric kw_cfi_adjust_cfa_offset, 890b57cec5SDimitry Andric kw_cfi_escape, 900b57cec5SDimitry Andric kw_cfi_def_cfa, 91fe6060f1SDimitry Andric kw_cfi_llvm_def_aspace_cfa, 920b57cec5SDimitry Andric kw_cfi_register, 930b57cec5SDimitry Andric kw_cfi_remember_state, 940b57cec5SDimitry Andric kw_cfi_restore, 950b57cec5SDimitry Andric kw_cfi_restore_state, 960b57cec5SDimitry Andric kw_cfi_undefined, 970b57cec5SDimitry Andric kw_cfi_window_save, 980b57cec5SDimitry Andric kw_cfi_aarch64_negate_ra_sign_state, 990b57cec5SDimitry Andric kw_blockaddress, 1000b57cec5SDimitry Andric kw_intrinsic, 1010b57cec5SDimitry Andric kw_target_index, 1020b57cec5SDimitry Andric kw_half, 103*0fca6ea1SDimitry Andric kw_bfloat, 1040b57cec5SDimitry Andric kw_float, 1050b57cec5SDimitry Andric kw_double, 1060b57cec5SDimitry Andric kw_x86_fp80, 1070b57cec5SDimitry Andric kw_fp128, 1080b57cec5SDimitry Andric kw_ppc_fp128, 1090b57cec5SDimitry Andric kw_target_flags, 1100b57cec5SDimitry Andric kw_volatile, 1110b57cec5SDimitry Andric kw_non_temporal, 1120b57cec5SDimitry Andric kw_invariant, 1130b57cec5SDimitry Andric kw_align, 114e8d8bef9SDimitry Andric kw_basealign, 1150b57cec5SDimitry Andric kw_addrspace, 1160b57cec5SDimitry Andric kw_stack, 1170b57cec5SDimitry Andric kw_got, 1180b57cec5SDimitry Andric kw_jump_table, 1190b57cec5SDimitry Andric kw_constant_pool, 1200b57cec5SDimitry Andric kw_call_entry, 121480093f4SDimitry Andric kw_custom, 1220b57cec5SDimitry Andric kw_liveout, 1230b57cec5SDimitry Andric kw_landing_pad, 124349cc55cSDimitry Andric kw_inlineasm_br_indirect_target, 1255ffd83dbSDimitry Andric kw_ehfunclet_entry, 1260b57cec5SDimitry Andric kw_liveins, 1270b57cec5SDimitry Andric kw_successors, 1280b57cec5SDimitry Andric kw_floatpred, 1290b57cec5SDimitry Andric kw_intpred, 1308bcb0991SDimitry Andric kw_shufflemask, 1310b57cec5SDimitry Andric kw_pre_instr_symbol, 1320b57cec5SDimitry Andric kw_post_instr_symbol, 133480093f4SDimitry Andric kw_heap_alloc_marker, 134bdd1243dSDimitry Andric kw_pcsections, 135bdd1243dSDimitry Andric kw_cfi_type, 1365ffd83dbSDimitry Andric kw_bbsections, 137bdd1243dSDimitry Andric kw_bb_id, 1380b57cec5SDimitry Andric kw_unknown_size, 139fe6060f1SDimitry Andric kw_unknown_address, 140bdd1243dSDimitry Andric kw_ir_block_address_taken, 141bdd1243dSDimitry Andric kw_machine_block_address_taken, 1425f757f3fSDimitry Andric kw_call_frame_size, 1435f757f3fSDimitry Andric kw_noconvergent, 144fe6060f1SDimitry Andric 145fe6060f1SDimitry Andric // Metadata types. 146fe6060f1SDimitry Andric kw_distinct, 1470b57cec5SDimitry Andric 1480b57cec5SDimitry Andric // Named metadata keywords 1490b57cec5SDimitry Andric md_tbaa, 1500b57cec5SDimitry Andric md_alias_scope, 1510b57cec5SDimitry Andric md_noalias, 1520b57cec5SDimitry Andric md_range, 1530b57cec5SDimitry Andric md_diexpr, 1540b57cec5SDimitry Andric md_dilocation, 1550b57cec5SDimitry Andric 1560b57cec5SDimitry Andric // Identifier tokens 1570b57cec5SDimitry Andric Identifier, 1580b57cec5SDimitry Andric NamedRegister, 1590b57cec5SDimitry Andric NamedVirtualRegister, 1600b57cec5SDimitry Andric MachineBasicBlockLabel, 1610b57cec5SDimitry Andric MachineBasicBlock, 1620b57cec5SDimitry Andric StackObject, 1630b57cec5SDimitry Andric FixedStackObject, 1640b57cec5SDimitry Andric NamedGlobalValue, 1650b57cec5SDimitry Andric GlobalValue, 1660b57cec5SDimitry Andric ExternalSymbol, 1670b57cec5SDimitry Andric MCSymbol, 1680b57cec5SDimitry Andric 1690b57cec5SDimitry Andric // Other tokens 1700b57cec5SDimitry Andric IntegerLiteral, 1710b57cec5SDimitry Andric FloatingPointLiteral, 1720b57cec5SDimitry Andric HexLiteral, 1738bcb0991SDimitry Andric VectorLiteral, 1740b57cec5SDimitry Andric VirtualRegister, 1750b57cec5SDimitry Andric ConstantPoolItem, 1760b57cec5SDimitry Andric JumpTableIndex, 1770b57cec5SDimitry Andric NamedIRBlock, 1780b57cec5SDimitry Andric IRBlock, 1790b57cec5SDimitry Andric NamedIRValue, 1800b57cec5SDimitry Andric IRValue, 1810b57cec5SDimitry Andric QuotedIRValue, // `<constant value>` 1820b57cec5SDimitry Andric SubRegisterIndex, 1830b57cec5SDimitry Andric StringConstant 1840b57cec5SDimitry Andric }; 1850b57cec5SDimitry Andric 1860b57cec5SDimitry Andric private: 1870b57cec5SDimitry Andric TokenKind Kind = Error; 1880b57cec5SDimitry Andric StringRef Range; 1890b57cec5SDimitry Andric StringRef StringValue; 1900b57cec5SDimitry Andric std::string StringValueStorage; 1910b57cec5SDimitry Andric APSInt IntVal; 1920b57cec5SDimitry Andric 1930b57cec5SDimitry Andric public: 1940b57cec5SDimitry Andric MIToken() = default; 1950b57cec5SDimitry Andric 1960b57cec5SDimitry Andric MIToken &reset(TokenKind Kind, StringRef Range); 1970b57cec5SDimitry Andric 1980b57cec5SDimitry Andric MIToken &setStringValue(StringRef StrVal); 1990b57cec5SDimitry Andric MIToken &setOwnedStringValue(std::string StrVal); 2000b57cec5SDimitry Andric MIToken &setIntegerValue(APSInt IntVal); 2010b57cec5SDimitry Andric kindMIToken2020b57cec5SDimitry Andric TokenKind kind() const { return Kind; } 2030b57cec5SDimitry Andric isErrorMIToken2040b57cec5SDimitry Andric bool isError() const { return Kind == Error; } 2050b57cec5SDimitry Andric isNewlineOrEOFMIToken2060b57cec5SDimitry Andric bool isNewlineOrEOF() const { return Kind == Newline || Kind == Eof; } 2070b57cec5SDimitry Andric isErrorOrEOFMIToken2080b57cec5SDimitry Andric bool isErrorOrEOF() const { return Kind == Error || Kind == Eof; } 2090b57cec5SDimitry Andric isRegisterMIToken2100b57cec5SDimitry Andric bool isRegister() const { 2110b57cec5SDimitry Andric return Kind == NamedRegister || Kind == underscore || 2120b57cec5SDimitry Andric Kind == NamedVirtualRegister || Kind == VirtualRegister; 2130b57cec5SDimitry Andric } 2140b57cec5SDimitry Andric isRegisterFlagMIToken2150b57cec5SDimitry Andric bool isRegisterFlag() const { 2160b57cec5SDimitry Andric return Kind == kw_implicit || Kind == kw_implicit_define || 2170b57cec5SDimitry Andric Kind == kw_def || Kind == kw_dead || Kind == kw_killed || 2180b57cec5SDimitry Andric Kind == kw_undef || Kind == kw_internal || 2190b57cec5SDimitry Andric Kind == kw_early_clobber || Kind == kw_debug_use || 2200b57cec5SDimitry Andric Kind == kw_renamable; 2210b57cec5SDimitry Andric } 2220b57cec5SDimitry Andric isMemoryOperandFlagMIToken2230b57cec5SDimitry Andric bool isMemoryOperandFlag() const { 2240b57cec5SDimitry Andric return Kind == kw_volatile || Kind == kw_non_temporal || 2250b57cec5SDimitry Andric Kind == kw_dereferenceable || Kind == kw_invariant || 2260b57cec5SDimitry Andric Kind == StringConstant; 2270b57cec5SDimitry Andric } 2280b57cec5SDimitry Andric isMIToken2290b57cec5SDimitry Andric bool is(TokenKind K) const { return Kind == K; } 2300b57cec5SDimitry Andric isNotMIToken2310b57cec5SDimitry Andric bool isNot(TokenKind K) const { return Kind != K; } 2320b57cec5SDimitry Andric locationMIToken2330b57cec5SDimitry Andric StringRef::iterator location() const { return Range.begin(); } 2340b57cec5SDimitry Andric rangeMIToken2350b57cec5SDimitry Andric StringRef range() const { return Range; } 2360b57cec5SDimitry Andric 2370b57cec5SDimitry Andric /// Return the token's string value. stringValueMIToken2380b57cec5SDimitry Andric StringRef stringValue() const { return StringValue; } 2390b57cec5SDimitry Andric integerValueMIToken2400b57cec5SDimitry Andric const APSInt &integerValue() const { return IntVal; } 2410b57cec5SDimitry Andric hasIntegerValueMIToken2420b57cec5SDimitry Andric bool hasIntegerValue() const { 2430b57cec5SDimitry Andric return Kind == IntegerLiteral || Kind == MachineBasicBlock || 2440b57cec5SDimitry Andric Kind == MachineBasicBlockLabel || Kind == StackObject || 2450b57cec5SDimitry Andric Kind == FixedStackObject || Kind == GlobalValue || 2460b57cec5SDimitry Andric Kind == VirtualRegister || Kind == ConstantPoolItem || 2470b57cec5SDimitry Andric Kind == JumpTableIndex || Kind == IRBlock || Kind == IRValue; 2480b57cec5SDimitry Andric } 2490b57cec5SDimitry Andric }; 2500b57cec5SDimitry Andric 2510b57cec5SDimitry Andric /// Consume a single machine instruction token in the given source and return 2520b57cec5SDimitry Andric /// the remaining source string. 2530b57cec5SDimitry Andric StringRef lexMIToken( 2540b57cec5SDimitry Andric StringRef Source, MIToken &Token, 2550b57cec5SDimitry Andric function_ref<void(StringRef::iterator, const Twine &)> ErrorCallback); 2560b57cec5SDimitry Andric 2570b57cec5SDimitry Andric } // end namespace llvm 2580b57cec5SDimitry Andric 2590b57cec5SDimitry Andric #endif // LLVM_LIB_CODEGEN_MIRPARSER_MILEXER_H 260