//===- RISCVVEmitter.cpp - Generate riscv_vector.h for use with clang -----===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This tablegen backend is responsible for emitting riscv_vector.h which // includes a declaration and definition of each intrinsic functions specified // in https://github.com/riscv/rvv-intrinsic-doc. // // See also the documentation in include/clang/Basic/riscv_vector.td. // //===----------------------------------------------------------------------===// #include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/SmallSet.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/StringMap.h" #include "llvm/ADT/StringSet.h" #include "llvm/ADT/Twine.h" #include "llvm/TableGen/Error.h" #include "llvm/TableGen/Record.h" #include using namespace llvm; using BasicType = char; using VScaleVal = Optional; namespace { // Exponential LMUL struct LMULType { int Log2LMUL; LMULType(int Log2LMUL); // Return the C/C++ string representation of LMUL std::string str() const; Optional getScale(unsigned ElementBitwidth) const; void MulLog2LMUL(int Log2LMUL); LMULType &operator*=(uint32_t RHS); }; // This class is compact representation of a valid and invalid RVVType. class RVVType { enum ScalarTypeKind : uint32_t { Void, Size_t, Ptrdiff_t, UnsignedLong, SignedLong, Boolean, SignedInteger, UnsignedInteger, Float, Invalid, }; BasicType BT; ScalarTypeKind ScalarType = Invalid; LMULType LMUL; bool IsPointer = false; // IsConstant indices are "int", but have the constant expression. bool IsImmediate = false; // Const qualifier for pointer to const object or object of const type. bool IsConstant = false; unsigned ElementBitwidth = 0; VScaleVal Scale = 0; bool Valid; std::string BuiltinStr; std::string ClangBuiltinStr; std::string Str; std::string ShortStr; public: RVVType() : RVVType(BasicType(), 0, StringRef()) {} RVVType(BasicType BT, int Log2LMUL, StringRef prototype); // Return the string representation of a type, which is an encoded string for // passing to the BUILTIN() macro in Builtins.def. const std::string &getBuiltinStr() const { return BuiltinStr; } // Return the clang builtin type for RVV vector type which are used in the // riscv_vector.h header file. const std::string &getClangBuiltinStr() const { return ClangBuiltinStr; } // Return the C/C++ string representation of a type for use in the // riscv_vector.h header file. const std::string &getTypeStr() const { return Str; } // Return the short name of a type for C/C++ name suffix. const std::string &getShortStr() { // Not all types are used in short name, so compute the short name by // demanded. if (ShortStr.empty()) initShortStr(); return ShortStr; } bool isValid() const { return Valid; } bool isScalar() const { return Scale.hasValue() && Scale.getValue() == 0; } bool isVector() const { return Scale.hasValue() && Scale.getValue() != 0; } bool isVector(unsigned Width) const { return isVector() && ElementBitwidth == Width; } bool isFloat() const { return ScalarType == ScalarTypeKind::Float; } bool isSignedInteger() const { return ScalarType == ScalarTypeKind::SignedInteger; } bool isFloatVector(unsigned Width) const { return isVector() && isFloat() && ElementBitwidth == Width; } bool isFloat(unsigned Width) const { return isFloat() && ElementBitwidth == Width; } private: // Verify RVV vector type and set Valid. bool verifyType() const; // Creates a type based on basic types of TypeRange void applyBasicType(); // Applies a prototype modifier to the current type. The result maybe an // invalid type. void applyModifier(StringRef prototype); // Compute and record a string for legal type. void initBuiltinStr(); // Compute and record a builtin RVV vector type string. void initClangBuiltinStr(); // Compute and record a type string for used in the header. void initTypeStr(); // Compute and record a short name of a type for C/C++ name suffix. void initShortStr(); }; using RVVTypePtr = RVVType *; using RVVTypes = std::vector; using RISCVPredefinedMacroT = uint8_t; enum RISCVPredefinedMacro : RISCVPredefinedMacroT { Basic = 0, V = 1 << 1, Zfh = 1 << 2, RV64 = 1 << 3, VectorMaxELen64 = 1 << 4, VectorMaxELenFp32 = 1 << 5, VectorMaxELenFp64 = 1 << 6, }; // TODO refactor RVVIntrinsic class design after support all intrinsic // combination. This represents an instantiation of an intrinsic with a // particular type and prototype class RVVIntrinsic { private: std::string BuiltinName; // Builtin name std::string Name; // C intrinsic name. std::string MangledName; std::string IRName; bool IsMask; bool HasVL; bool HasPolicy; bool HasNoMaskedOverloaded; bool HasAutoDef; // There is automiatic definition in header std::string ManualCodegen; RVVTypePtr OutputType; // Builtin output type RVVTypes InputTypes; // Builtin input types // The types we use to obtain the specific LLVM intrinsic. They are index of // InputTypes. -1 means the return type. std::vector IntrinsicTypes; RISCVPredefinedMacroT RISCVPredefinedMacros = 0; unsigned NF = 1; public: RVVIntrinsic(StringRef Name, StringRef Suffix, StringRef MangledName, StringRef MangledSuffix, StringRef IRName, bool IsMask, bool HasMaskedOffOperand, bool HasVL, bool HasPolicy, bool HasNoMaskedOverloaded, bool HasAutoDef, StringRef ManualCodegen, const RVVTypes &Types, const std::vector &IntrinsicTypes, const std::vector &RequiredFeatures, unsigned NF); ~RVVIntrinsic() = default; StringRef getBuiltinName() const { return BuiltinName; } StringRef getName() const { return Name; } StringRef getMangledName() const { return MangledName; } bool hasVL() const { return HasVL; } bool hasPolicy() const { return HasPolicy; } bool hasNoMaskedOverloaded() const { return HasNoMaskedOverloaded; } bool hasManualCodegen() const { return !ManualCodegen.empty(); } bool hasAutoDef() const { return HasAutoDef; } bool isMask() const { return IsMask; } StringRef getIRName() const { return IRName; } StringRef getManualCodegen() const { return ManualCodegen; } RISCVPredefinedMacroT getRISCVPredefinedMacros() const { return RISCVPredefinedMacros; } unsigned getNF() const { return NF; } const std::vector &getIntrinsicTypes() const { return IntrinsicTypes; } // Return the type string for a BUILTIN() macro in Builtins.def. std::string getBuiltinTypeStr() const; // Emit the code block for switch body in EmitRISCVBuiltinExpr, it should // init the RVVIntrinsic ID and IntrinsicTypes. void emitCodeGenSwitchBody(raw_ostream &o) const; // Emit the macros for mapping C/C++ intrinsic function to builtin functions. void emitIntrinsicFuncDef(raw_ostream &o) const; // Emit the mangled function definition. void emitMangledFuncDef(raw_ostream &o) const; }; class RVVEmitter { private: RecordKeeper &Records; std::string HeaderCode; // Concat BasicType, LMUL and Proto as key StringMap LegalTypes; StringSet<> IllegalTypes; public: RVVEmitter(RecordKeeper &R) : Records(R) {} /// Emit riscv_vector.h void createHeader(raw_ostream &o); /// Emit all the __builtin prototypes and code needed by Sema. void createBuiltins(raw_ostream &o); /// Emit all the information needed to map builtin -> LLVM IR intrinsic. void createCodeGen(raw_ostream &o); std::string getSuffixStr(char Type, int Log2LMUL, StringRef Prototypes); private: /// Create all intrinsics and add them to \p Out void createRVVIntrinsics(std::vector> &Out); /// Create Headers and add them to \p Out void createRVVHeaders(raw_ostream &OS); /// Compute output and input types by applying different config (basic type /// and LMUL with type transformers). It also record result of type in legal /// or illegal set to avoid compute the same config again. The result maybe /// have illegal RVVType. Optional computeTypes(BasicType BT, int Log2LMUL, unsigned NF, ArrayRef PrototypeSeq); Optional computeType(BasicType BT, int Log2LMUL, StringRef Proto); /// Emit Acrh predecessor definitions and body, assume the element of Defs are /// sorted by extension. void emitArchMacroAndBody( std::vector> &Defs, raw_ostream &o, std::function); // Emit the architecture preprocessor definitions. Return true when emits // non-empty string. bool emitMacroRestrictionStr(RISCVPredefinedMacroT PredefinedMacros, raw_ostream &o); // Slice Prototypes string into sub prototype string and process each sub // prototype string individually in the Handler. void parsePrototypes(StringRef Prototypes, std::function Handler); }; } // namespace //===----------------------------------------------------------------------===// // Type implementation //===----------------------------------------------------------------------===// LMULType::LMULType(int NewLog2LMUL) { // Check Log2LMUL is -3, -2, -1, 0, 1, 2, 3 assert(NewLog2LMUL <= 3 && NewLog2LMUL >= -3 && "Bad LMUL number!"); Log2LMUL = NewLog2LMUL; } std::string LMULType::str() const { if (Log2LMUL < 0) return "mf" + utostr(1ULL << (-Log2LMUL)); return "m" + utostr(1ULL << Log2LMUL); } VScaleVal LMULType::getScale(unsigned ElementBitwidth) const { int Log2ScaleResult = 0; switch (ElementBitwidth) { default: break; case 8: Log2ScaleResult = Log2LMUL + 3; break; case 16: Log2ScaleResult = Log2LMUL + 2; break; case 32: Log2ScaleResult = Log2LMUL + 1; break; case 64: Log2ScaleResult = Log2LMUL; break; } // Illegal vscale result would be less than 1 if (Log2ScaleResult < 0) return None; return 1 << Log2ScaleResult; } void LMULType::MulLog2LMUL(int log2LMUL) { Log2LMUL += log2LMUL; } LMULType &LMULType::operator*=(uint32_t RHS) { assert(isPowerOf2_32(RHS)); this->Log2LMUL = this->Log2LMUL + Log2_32(RHS); return *this; } RVVType::RVVType(BasicType BT, int Log2LMUL, StringRef prototype) : BT(BT), LMUL(LMULType(Log2LMUL)) { applyBasicType(); applyModifier(prototype); Valid = verifyType(); if (Valid) { initBuiltinStr(); initTypeStr(); if (isVector()) { initClangBuiltinStr(); } } } // clang-format off // boolean type are encoded the ratio of n (SEW/LMUL) // SEW/LMUL | 1 | 2 | 4 | 8 | 16 | 32 | 64 // c type | vbool64_t | vbool32_t | vbool16_t | vbool8_t | vbool4_t | vbool2_t | vbool1_t // IR type | nxv1i1 | nxv2i1 | nxv4i1 | nxv8i1 | nxv16i1 | nxv32i1 | nxv64i1 // type\lmul | 1/8 | 1/4 | 1/2 | 1 | 2 | 4 | 8 // -------- |------ | -------- | ------- | ------- | -------- | -------- | -------- // i64 | N/A | N/A | N/A | nxv1i64 | nxv2i64 | nxv4i64 | nxv8i64 // i32 | N/A | N/A | nxv1i32 | nxv2i32 | nxv4i32 | nxv8i32 | nxv16i32 // i16 | N/A | nxv1i16 | nxv2i16 | nxv4i16 | nxv8i16 | nxv16i16 | nxv32i16 // i8 | nxv1i8 | nxv2i8 | nxv4i8 | nxv8i8 | nxv16i8 | nxv32i8 | nxv64i8 // double | N/A | N/A | N/A | nxv1f64 | nxv2f64 | nxv4f64 | nxv8f64 // float | N/A | N/A | nxv1f32 | nxv2f32 | nxv4f32 | nxv8f32 | nxv16f32 // half | N/A | nxv1f16 | nxv2f16 | nxv4f16 | nxv8f16 | nxv16f16 | nxv32f16 // clang-format on bool RVVType::verifyType() const { if (ScalarType == Invalid) return false; if (isScalar()) return true; if (!Scale.hasValue()) return false; if (isFloat() && ElementBitwidth == 8) return false; unsigned V = Scale.getValue(); switch (ElementBitwidth) { case 1: case 8: // Check Scale is 1,2,4,8,16,32,64 return (V <= 64 && isPowerOf2_32(V)); case 16: // Check Scale is 1,2,4,8,16,32 return (V <= 32 && isPowerOf2_32(V)); case 32: // Check Scale is 1,2,4,8,16 return (V <= 16 && isPowerOf2_32(V)); case 64: // Check Scale is 1,2,4,8 return (V <= 8 && isPowerOf2_32(V)); } return false; } void RVVType::initBuiltinStr() { assert(isValid() && "RVVType is invalid"); switch (ScalarType) { case ScalarTypeKind::Void: BuiltinStr = "v"; return; case ScalarTypeKind::Size_t: BuiltinStr = "z"; if (IsImmediate) BuiltinStr = "I" + BuiltinStr; if (IsPointer) BuiltinStr += "*"; return; case ScalarTypeKind::Ptrdiff_t: BuiltinStr = "Y"; return; case ScalarTypeKind::UnsignedLong: BuiltinStr = "ULi"; return; case ScalarTypeKind::SignedLong: BuiltinStr = "Li"; return; case ScalarTypeKind::Boolean: assert(ElementBitwidth == 1); BuiltinStr += "b"; break; case ScalarTypeKind::SignedInteger: case ScalarTypeKind::UnsignedInteger: switch (ElementBitwidth) { case 8: BuiltinStr += "c"; break; case 16: BuiltinStr += "s"; break; case 32: BuiltinStr += "i"; break; case 64: BuiltinStr += "Wi"; break; default: llvm_unreachable("Unhandled ElementBitwidth!"); } if (isSignedInteger()) BuiltinStr = "S" + BuiltinStr; else BuiltinStr = "U" + BuiltinStr; break; case ScalarTypeKind::Float: switch (ElementBitwidth) { case 16: BuiltinStr += "x"; break; case 32: BuiltinStr += "f"; break; case 64: BuiltinStr += "d"; break; default: llvm_unreachable("Unhandled ElementBitwidth!"); } break; default: llvm_unreachable("ScalarType is invalid!"); } if (IsImmediate) BuiltinStr = "I" + BuiltinStr; if (isScalar()) { if (IsConstant) BuiltinStr += "C"; if (IsPointer) BuiltinStr += "*"; return; } BuiltinStr = "q" + utostr(Scale.getValue()) + BuiltinStr; // Pointer to vector types. Defined for segment load intrinsics. // segment load intrinsics have pointer type arguments to store the loaded // vector values. if (IsPointer) BuiltinStr += "*"; } void RVVType::initClangBuiltinStr() { assert(isValid() && "RVVType is invalid"); assert(isVector() && "Handle Vector type only"); ClangBuiltinStr = "__rvv_"; switch (ScalarType) { case ScalarTypeKind::Boolean: ClangBuiltinStr += "bool" + utostr(64 / Scale.getValue()) + "_t"; return; case ScalarTypeKind::Float: ClangBuiltinStr += "float"; break; case ScalarTypeKind::SignedInteger: ClangBuiltinStr += "int"; break; case ScalarTypeKind::UnsignedInteger: ClangBuiltinStr += "uint"; break; default: llvm_unreachable("ScalarTypeKind is invalid"); } ClangBuiltinStr += utostr(ElementBitwidth) + LMUL.str() + "_t"; } void RVVType::initTypeStr() { assert(isValid() && "RVVType is invalid"); if (IsConstant) Str += "const "; auto getTypeString = [&](StringRef TypeStr) { if (isScalar()) return Twine(TypeStr + Twine(ElementBitwidth) + "_t").str(); return Twine("v" + TypeStr + Twine(ElementBitwidth) + LMUL.str() + "_t") .str(); }; switch (ScalarType) { case ScalarTypeKind::Void: Str = "void"; return; case ScalarTypeKind::Size_t: Str = "size_t"; if (IsPointer) Str += " *"; return; case ScalarTypeKind::Ptrdiff_t: Str = "ptrdiff_t"; return; case ScalarTypeKind::UnsignedLong: Str = "unsigned long"; return; case ScalarTypeKind::SignedLong: Str = "long"; return; case ScalarTypeKind::Boolean: if (isScalar()) Str += "bool"; else // Vector bool is special case, the formulate is // `vbool_t = MVT::nxv<64/N>i1` ex. vbool16_t = MVT::4i1 Str += "vbool" + utostr(64 / Scale.getValue()) + "_t"; break; case ScalarTypeKind::Float: if (isScalar()) { if (ElementBitwidth == 64) Str += "double"; else if (ElementBitwidth == 32) Str += "float"; else if (ElementBitwidth == 16) Str += "_Float16"; else llvm_unreachable("Unhandled floating type."); } else Str += getTypeString("float"); break; case ScalarTypeKind::SignedInteger: Str += getTypeString("int"); break; case ScalarTypeKind::UnsignedInteger: Str += getTypeString("uint"); break; default: llvm_unreachable("ScalarType is invalid!"); } if (IsPointer) Str += " *"; } void RVVType::initShortStr() { switch (ScalarType) { case ScalarTypeKind::Boolean: assert(isVector()); ShortStr = "b" + utostr(64 / Scale.getValue()); return; case ScalarTypeKind::Float: ShortStr = "f" + utostr(ElementBitwidth); break; case ScalarTypeKind::SignedInteger: ShortStr = "i" + utostr(ElementBitwidth); break; case ScalarTypeKind::UnsignedInteger: ShortStr = "u" + utostr(ElementBitwidth); break; default: PrintFatalError("Unhandled case!"); } if (isVector()) ShortStr += LMUL.str(); } void RVVType::applyBasicType() { switch (BT) { case 'c': ElementBitwidth = 8; ScalarType = ScalarTypeKind::SignedInteger; break; case 's': ElementBitwidth = 16; ScalarType = ScalarTypeKind::SignedInteger; break; case 'i': ElementBitwidth = 32; ScalarType = ScalarTypeKind::SignedInteger; break; case 'l': ElementBitwidth = 64; ScalarType = ScalarTypeKind::SignedInteger; break; case 'x': ElementBitwidth = 16; ScalarType = ScalarTypeKind::Float; break; case 'f': ElementBitwidth = 32; ScalarType = ScalarTypeKind::Float; break; case 'd': ElementBitwidth = 64; ScalarType = ScalarTypeKind::Float; break; default: PrintFatalError("Unhandled type code!"); } assert(ElementBitwidth != 0 && "Bad element bitwidth!"); } void RVVType::applyModifier(StringRef Transformer) { if (Transformer.empty()) return; // Handle primitive type transformer auto PType = Transformer.back(); switch (PType) { case 'e': Scale = 0; break; case 'v': Scale = LMUL.getScale(ElementBitwidth); break; case 'w': ElementBitwidth *= 2; LMUL *= 2; Scale = LMUL.getScale(ElementBitwidth); break; case 'q': ElementBitwidth *= 4; LMUL *= 4; Scale = LMUL.getScale(ElementBitwidth); break; case 'o': ElementBitwidth *= 8; LMUL *= 8; Scale = LMUL.getScale(ElementBitwidth); break; case 'm': ScalarType = ScalarTypeKind::Boolean; Scale = LMUL.getScale(ElementBitwidth); ElementBitwidth = 1; break; case '0': ScalarType = ScalarTypeKind::Void; break; case 'z': ScalarType = ScalarTypeKind::Size_t; break; case 't': ScalarType = ScalarTypeKind::Ptrdiff_t; break; case 'u': ScalarType = ScalarTypeKind::UnsignedLong; break; case 'l': ScalarType = ScalarTypeKind::SignedLong; break; default: PrintFatalError("Illegal primitive type transformers!"); } Transformer = Transformer.drop_back(); // Extract and compute complex type transformer. It can only appear one time. if (Transformer.startswith("(")) { size_t Idx = Transformer.find(')'); assert(Idx != StringRef::npos); StringRef ComplexType = Transformer.slice(1, Idx); Transformer = Transformer.drop_front(Idx + 1); assert(!Transformer.contains('(') && "Only allow one complex type transformer"); auto UpdateAndCheckComplexProto = [&]() { Scale = LMUL.getScale(ElementBitwidth); const StringRef VectorPrototypes("vwqom"); if (!VectorPrototypes.contains(PType)) PrintFatalError("Complex type transformer only supports vector type!"); if (Transformer.find_first_of("PCKWS") != StringRef::npos) PrintFatalError( "Illegal type transformer for Complex type transformer"); }; auto ComputeFixedLog2LMUL = [&](StringRef Value, std::function Compare) { int32_t Log2LMUL; Value.getAsInteger(10, Log2LMUL); if (!Compare(Log2LMUL, LMUL.Log2LMUL)) { ScalarType = Invalid; return false; } // Update new LMUL LMUL = LMULType(Log2LMUL); UpdateAndCheckComplexProto(); return true; }; auto ComplexTT = ComplexType.split(":"); if (ComplexTT.first == "Log2EEW") { uint32_t Log2EEW; ComplexTT.second.getAsInteger(10, Log2EEW); // update new elmul = (eew/sew) * lmul LMUL.MulLog2LMUL(Log2EEW - Log2_32(ElementBitwidth)); // update new eew ElementBitwidth = 1 << Log2EEW; ScalarType = ScalarTypeKind::SignedInteger; UpdateAndCheckComplexProto(); } else if (ComplexTT.first == "FixedSEW") { uint32_t NewSEW; ComplexTT.second.getAsInteger(10, NewSEW); // Set invalid type if src and dst SEW are same. if (ElementBitwidth == NewSEW) { ScalarType = Invalid; return; } // Update new SEW ElementBitwidth = NewSEW; UpdateAndCheckComplexProto(); } else if (ComplexTT.first == "LFixedLog2LMUL") { // New LMUL should be larger than old if (!ComputeFixedLog2LMUL(ComplexTT.second, std::greater())) return; } else if (ComplexTT.first == "SFixedLog2LMUL") { // New LMUL should be smaller than old if (!ComputeFixedLog2LMUL(ComplexTT.second, std::less())) return; } else { PrintFatalError("Illegal complex type transformers!"); } } // Compute the remain type transformers for (char I : Transformer) { switch (I) { case 'P': if (IsConstant) PrintFatalError("'P' transformer cannot be used after 'C'"); if (IsPointer) PrintFatalError("'P' transformer cannot be used twice"); IsPointer = true; break; case 'C': if (IsConstant) PrintFatalError("'C' transformer cannot be used twice"); IsConstant = true; break; case 'K': IsImmediate = true; break; case 'U': ScalarType = ScalarTypeKind::UnsignedInteger; break; case 'I': ScalarType = ScalarTypeKind::SignedInteger; break; case 'F': ScalarType = ScalarTypeKind::Float; break; case 'S': LMUL = LMULType(0); // Update ElementBitwidth need to update Scale too. Scale = LMUL.getScale(ElementBitwidth); break; default: PrintFatalError("Illegal non-primitive type transformer!"); } } } //===----------------------------------------------------------------------===// // RVVIntrinsic implementation //===----------------------------------------------------------------------===// RVVIntrinsic::RVVIntrinsic(StringRef NewName, StringRef Suffix, StringRef NewMangledName, StringRef MangledSuffix, StringRef IRName, bool IsMask, bool HasMaskedOffOperand, bool HasVL, bool HasPolicy, bool HasNoMaskedOverloaded, bool HasAutoDef, StringRef ManualCodegen, const RVVTypes &OutInTypes, const std::vector &NewIntrinsicTypes, const std::vector &RequiredFeatures, unsigned NF) : IRName(IRName), IsMask(IsMask), HasVL(HasVL), HasPolicy(HasPolicy), HasNoMaskedOverloaded(HasNoMaskedOverloaded), HasAutoDef(HasAutoDef), ManualCodegen(ManualCodegen.str()), NF(NF) { // Init BuiltinName, Name and MangledName BuiltinName = NewName.str(); Name = BuiltinName; if (NewMangledName.empty()) MangledName = NewName.split("_").first.str(); else MangledName = NewMangledName.str(); if (!Suffix.empty()) Name += "_" + Suffix.str(); if (!MangledSuffix.empty()) MangledName += "_" + MangledSuffix.str(); if (IsMask) { BuiltinName += "_m"; Name += "_m"; } // Init RISC-V extensions for (const auto &T : OutInTypes) { if (T->isFloatVector(16) || T->isFloat(16)) RISCVPredefinedMacros |= RISCVPredefinedMacro::Zfh; if (T->isFloatVector(32)) RISCVPredefinedMacros |= RISCVPredefinedMacro::VectorMaxELenFp32; if (T->isFloatVector(64)) RISCVPredefinedMacros |= RISCVPredefinedMacro::VectorMaxELenFp64; if (T->isVector(64)) RISCVPredefinedMacros |= RISCVPredefinedMacro::VectorMaxELen64; } for (auto Feature : RequiredFeatures) { if (Feature == "RV64") RISCVPredefinedMacros |= RISCVPredefinedMacro::RV64; // Note: Full multiply instruction (mulh, mulhu, mulhsu, smul) for EEW=64 // require V. if (Feature == "FullMultiply" && (RISCVPredefinedMacros & RISCVPredefinedMacro::VectorMaxELen64)) RISCVPredefinedMacros |= RISCVPredefinedMacro::V; } // Init OutputType and InputTypes OutputType = OutInTypes[0]; InputTypes.assign(OutInTypes.begin() + 1, OutInTypes.end()); // IntrinsicTypes is nonmasked version index. Need to update it // if there is maskedoff operand (It is always in first operand). IntrinsicTypes = NewIntrinsicTypes; if (IsMask && HasMaskedOffOperand) { for (auto &I : IntrinsicTypes) { if (I >= 0) I += NF; } } } std::string RVVIntrinsic::getBuiltinTypeStr() const { std::string S; S += OutputType->getBuiltinStr(); for (const auto &T : InputTypes) { S += T->getBuiltinStr(); } return S; } void RVVIntrinsic::emitCodeGenSwitchBody(raw_ostream &OS) const { if (!getIRName().empty()) OS << " ID = Intrinsic::riscv_" + getIRName() + ";\n"; if (NF >= 2) OS << " NF = " + utostr(getNF()) + ";\n"; if (hasManualCodegen()) { OS << ManualCodegen; OS << "break;\n"; return; } if (isMask()) { if (hasVL()) { OS << " std::rotate(Ops.begin(), Ops.begin() + 1, Ops.end() - 1);\n"; if (hasPolicy()) OS << " Ops.push_back(ConstantInt::get(Ops.back()->getType()," " TAIL_UNDISTURBED));\n"; } else { OS << " std::rotate(Ops.begin(), Ops.begin() + 1, Ops.end());\n"; } } OS << " IntrinsicTypes = {"; ListSeparator LS; for (const auto &Idx : IntrinsicTypes) { if (Idx == -1) OS << LS << "ResultType"; else OS << LS << "Ops[" << Idx << "]->getType()"; } // VL could be i64 or i32, need to encode it in IntrinsicTypes. VL is // always last operand. if (hasVL()) OS << ", Ops.back()->getType()"; OS << "};\n"; OS << " break;\n"; } void RVVIntrinsic::emitIntrinsicFuncDef(raw_ostream &OS) const { OS << "__attribute__((__clang_builtin_alias__("; OS << "__builtin_rvv_" << getBuiltinName() << ")))\n"; OS << OutputType->getTypeStr() << " " << getName() << "("; // Emit function arguments if (!InputTypes.empty()) { ListSeparator LS; for (unsigned i = 0; i < InputTypes.size(); ++i) OS << LS << InputTypes[i]->getTypeStr(); } OS << ");\n"; } void RVVIntrinsic::emitMangledFuncDef(raw_ostream &OS) const { OS << "__attribute__((__clang_builtin_alias__("; OS << "__builtin_rvv_" << getBuiltinName() << ")))\n"; OS << OutputType->getTypeStr() << " " << getMangledName() << "("; // Emit function arguments if (!InputTypes.empty()) { ListSeparator LS; for (unsigned i = 0; i < InputTypes.size(); ++i) OS << LS << InputTypes[i]->getTypeStr(); } OS << ");\n"; } //===----------------------------------------------------------------------===// // RVVEmitter implementation //===----------------------------------------------------------------------===// void RVVEmitter::createHeader(raw_ostream &OS) { OS << "/*===---- riscv_vector.h - RISC-V V-extension RVVIntrinsics " "-------------------===\n" " *\n" " *\n" " * Part of the LLVM Project, under the Apache License v2.0 with LLVM " "Exceptions.\n" " * See https://llvm.org/LICENSE.txt for license information.\n" " * SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception\n" " *\n" " *===-----------------------------------------------------------------" "------===\n" " */\n\n"; OS << "#ifndef __RISCV_VECTOR_H\n"; OS << "#define __RISCV_VECTOR_H\n\n"; OS << "#include \n"; OS << "#include \n\n"; OS << "#ifndef __riscv_vector\n"; OS << "#error \"Vector intrinsics require the vector extension.\"\n"; OS << "#endif\n\n"; OS << "#ifdef __cplusplus\n"; OS << "extern \"C\" {\n"; OS << "#endif\n\n"; createRVVHeaders(OS); std::vector> Defs; createRVVIntrinsics(Defs); // Print header code if (!HeaderCode.empty()) { OS << HeaderCode; } auto printType = [&](auto T) { OS << "typedef " << T->getClangBuiltinStr() << " " << T->getTypeStr() << ";\n"; }; constexpr int Log2LMULs[] = {-3, -2, -1, 0, 1, 2, 3}; // Print RVV boolean types. for (int Log2LMUL : Log2LMULs) { auto T = computeType('c', Log2LMUL, "m"); if (T.hasValue()) printType(T.getValue()); } // Print RVV int/float types. for (char I : StringRef("csil")) { for (int Log2LMUL : Log2LMULs) { auto T = computeType(I, Log2LMUL, "v"); if (T.hasValue()) { printType(T.getValue()); auto UT = computeType(I, Log2LMUL, "Uv"); printType(UT.getValue()); } } } OS << "#if defined(__riscv_zfh)\n"; for (int Log2LMUL : Log2LMULs) { auto T = computeType('x', Log2LMUL, "v"); if (T.hasValue()) printType(T.getValue()); } OS << "#endif\n"; OS << "#if defined(__riscv_f)\n"; for (int Log2LMUL : Log2LMULs) { auto T = computeType('f', Log2LMUL, "v"); if (T.hasValue()) printType(T.getValue()); } OS << "#endif\n"; OS << "#if defined(__riscv_d)\n"; for (int Log2LMUL : Log2LMULs) { auto T = computeType('d', Log2LMUL, "v"); if (T.hasValue()) printType(T.getValue()); } OS << "#endif\n\n"; // The same extension include in the same arch guard marco. llvm::stable_sort(Defs, [](const std::unique_ptr &A, const std::unique_ptr &B) { return A->getRISCVPredefinedMacros() < B->getRISCVPredefinedMacros(); }); OS << "#define __rvv_ai static __inline__\n"; // Print intrinsic functions with macro emitArchMacroAndBody(Defs, OS, [](raw_ostream &OS, const RVVIntrinsic &Inst) { OS << "__rvv_ai "; Inst.emitIntrinsicFuncDef(OS); }); OS << "#undef __rvv_ai\n\n"; OS << "#define __riscv_v_intrinsic_overloading 1\n"; // Print Overloaded APIs OS << "#define __rvv_aio static __inline__ " "__attribute__((__overloadable__))\n"; emitArchMacroAndBody(Defs, OS, [](raw_ostream &OS, const RVVIntrinsic &Inst) { if (!Inst.isMask() && !Inst.hasNoMaskedOverloaded()) return; OS << "__rvv_aio "; Inst.emitMangledFuncDef(OS); }); OS << "#undef __rvv_aio\n"; OS << "\n#ifdef __cplusplus\n"; OS << "}\n"; OS << "#endif // __cplusplus\n"; OS << "#endif // __RISCV_VECTOR_H\n"; } void RVVEmitter::createBuiltins(raw_ostream &OS) { std::vector> Defs; createRVVIntrinsics(Defs); // Map to keep track of which builtin names have already been emitted. StringMap BuiltinMap; OS << "#if defined(TARGET_BUILTIN) && !defined(RISCVV_BUILTIN)\n"; OS << "#define RISCVV_BUILTIN(ID, TYPE, ATTRS) TARGET_BUILTIN(ID, TYPE, " "ATTRS, \"zve32x|v\")\n"; OS << "#endif\n"; for (auto &Def : Defs) { auto P = BuiltinMap.insert(std::make_pair(Def->getBuiltinName(), Def.get())); if (!P.second) { // Verify that this would have produced the same builtin definition. if (P.first->second->hasAutoDef() != Def->hasAutoDef()) { PrintFatalError("Builtin with same name has different hasAutoDef"); } else if (!Def->hasAutoDef() && P.first->second->getBuiltinTypeStr() != Def->getBuiltinTypeStr()) { PrintFatalError("Builtin with same name has different type string"); } continue; } OS << "RISCVV_BUILTIN(__builtin_rvv_" << Def->getBuiltinName() << ",\""; if (!Def->hasAutoDef()) OS << Def->getBuiltinTypeStr(); OS << "\", \"n\")\n"; } OS << "#undef RISCVV_BUILTIN\n"; } void RVVEmitter::createCodeGen(raw_ostream &OS) { std::vector> Defs; createRVVIntrinsics(Defs); // IR name could be empty, use the stable sort preserves the relative order. llvm::stable_sort(Defs, [](const std::unique_ptr &A, const std::unique_ptr &B) { return A->getIRName() < B->getIRName(); }); // Map to keep track of which builtin names have already been emitted. StringMap BuiltinMap; // Print switch body when the ir name or ManualCodegen changes from previous // iteration. RVVIntrinsic *PrevDef = Defs.begin()->get(); for (auto &Def : Defs) { StringRef CurIRName = Def->getIRName(); if (CurIRName != PrevDef->getIRName() || (Def->getManualCodegen() != PrevDef->getManualCodegen())) { PrevDef->emitCodeGenSwitchBody(OS); } PrevDef = Def.get(); auto P = BuiltinMap.insert(std::make_pair(Def->getBuiltinName(), Def.get())); if (P.second) { OS << "case RISCVVector::BI__builtin_rvv_" << Def->getBuiltinName() << ":\n"; continue; } if (P.first->second->getIRName() != Def->getIRName()) PrintFatalError("Builtin with same name has different IRName"); else if (P.first->second->getManualCodegen() != Def->getManualCodegen()) PrintFatalError("Builtin with same name has different ManualCodegen"); else if (P.first->second->getNF() != Def->getNF()) PrintFatalError("Builtin with same name has different NF"); else if (P.first->second->isMask() != Def->isMask()) PrintFatalError("Builtin with same name has different isMask"); else if (P.first->second->hasVL() != Def->hasVL()) PrintFatalError("Builtin with same name has different HasPolicy"); else if (P.first->second->hasPolicy() != Def->hasPolicy()) PrintFatalError("Builtin with same name has different HasPolicy"); else if (P.first->second->getIntrinsicTypes() != Def->getIntrinsicTypes()) PrintFatalError("Builtin with same name has different IntrinsicTypes"); } Defs.back()->emitCodeGenSwitchBody(OS); OS << "\n"; } void RVVEmitter::parsePrototypes(StringRef Prototypes, std::function Handler) { const StringRef Primaries("evwqom0ztul"); while (!Prototypes.empty()) { size_t Idx = 0; // Skip over complex prototype because it could contain primitive type // character. if (Prototypes[0] == '(') Idx = Prototypes.find_first_of(')'); Idx = Prototypes.find_first_of(Primaries, Idx); assert(Idx != StringRef::npos); Handler(Prototypes.slice(0, Idx + 1)); Prototypes = Prototypes.drop_front(Idx + 1); } } std::string RVVEmitter::getSuffixStr(char Type, int Log2LMUL, StringRef Prototypes) { SmallVector SuffixStrs; parsePrototypes(Prototypes, [&](StringRef Proto) { auto T = computeType(Type, Log2LMUL, Proto); SuffixStrs.push_back(T.getValue()->getShortStr()); }); return join(SuffixStrs, "_"); } void RVVEmitter::createRVVIntrinsics( std::vector> &Out) { std::vector RV = Records.getAllDerivedDefinitions("RVVBuiltin"); for (auto *R : RV) { StringRef Name = R->getValueAsString("Name"); StringRef SuffixProto = R->getValueAsString("Suffix"); StringRef MangledName = R->getValueAsString("MangledName"); StringRef MangledSuffixProto = R->getValueAsString("MangledSuffix"); StringRef Prototypes = R->getValueAsString("Prototype"); StringRef TypeRange = R->getValueAsString("TypeRange"); bool HasMask = R->getValueAsBit("HasMask"); bool HasMaskedOffOperand = R->getValueAsBit("HasMaskedOffOperand"); bool HasVL = R->getValueAsBit("HasVL"); bool HasPolicy = R->getValueAsBit("HasPolicy"); bool HasNoMaskedOverloaded = R->getValueAsBit("HasNoMaskedOverloaded"); std::vector Log2LMULList = R->getValueAsListOfInts("Log2LMUL"); StringRef ManualCodegen = R->getValueAsString("ManualCodegen"); StringRef ManualCodegenMask = R->getValueAsString("ManualCodegenMask"); std::vector IntrinsicTypes = R->getValueAsListOfInts("IntrinsicTypes"); std::vector RequiredFeatures = R->getValueAsListOfStrings("RequiredFeatures"); StringRef IRName = R->getValueAsString("IRName"); StringRef IRNameMask = R->getValueAsString("IRNameMask"); unsigned NF = R->getValueAsInt("NF"); StringRef HeaderCodeStr = R->getValueAsString("HeaderCode"); bool HasAutoDef = HeaderCodeStr.empty(); if (!HeaderCodeStr.empty()) { HeaderCode += HeaderCodeStr.str(); } // Parse prototype and create a list of primitive type with transformers // (operand) in ProtoSeq. ProtoSeq[0] is output operand. SmallVector ProtoSeq; parsePrototypes(Prototypes, [&ProtoSeq](StringRef Proto) { ProtoSeq.push_back(Proto.str()); }); // Compute Builtin types SmallVector ProtoMaskSeq = ProtoSeq; if (HasMask) { // If HasMaskedOffOperand, insert result type as first input operand. if (HasMaskedOffOperand) { if (NF == 1) { ProtoMaskSeq.insert(ProtoMaskSeq.begin() + 1, ProtoSeq[0]); } else { // Convert // (void, op0 address, op1 address, ...) // to // (void, op0 address, op1 address, ..., maskedoff0, maskedoff1, ...) for (unsigned I = 0; I < NF; ++I) ProtoMaskSeq.insert( ProtoMaskSeq.begin() + NF + 1, ProtoSeq[1].substr(1)); // Use substr(1) to skip '*' } } if (HasMaskedOffOperand && NF > 1) { // Convert // (void, op0 address, op1 address, ..., maskedoff0, maskedoff1, ...) // to // (void, op0 address, op1 address, ..., mask, maskedoff0, maskedoff1, // ...) ProtoMaskSeq.insert(ProtoMaskSeq.begin() + NF + 1, "m"); } else { // If HasMask, insert 'm' as first input operand. ProtoMaskSeq.insert(ProtoMaskSeq.begin() + 1, "m"); } } // If HasVL, append 'z' to last operand if (HasVL) { ProtoSeq.push_back("z"); ProtoMaskSeq.push_back("z"); } // Create Intrinsics for each type and LMUL. for (char I : TypeRange) { for (int Log2LMUL : Log2LMULList) { Optional Types = computeTypes(I, Log2LMUL, NF, ProtoSeq); // Ignored to create new intrinsic if there are any illegal types. if (!Types.hasValue()) continue; auto SuffixStr = getSuffixStr(I, Log2LMUL, SuffixProto); auto MangledSuffixStr = getSuffixStr(I, Log2LMUL, MangledSuffixProto); // Create a non-mask intrinsic Out.push_back(std::make_unique( Name, SuffixStr, MangledName, MangledSuffixStr, IRName, /*IsMask=*/false, /*HasMaskedOffOperand=*/false, HasVL, HasPolicy, HasNoMaskedOverloaded, HasAutoDef, ManualCodegen, Types.getValue(), IntrinsicTypes, RequiredFeatures, NF)); if (HasMask) { // Create a mask intrinsic Optional MaskTypes = computeTypes(I, Log2LMUL, NF, ProtoMaskSeq); Out.push_back(std::make_unique( Name, SuffixStr, MangledName, MangledSuffixStr, IRNameMask, /*IsMask=*/true, HasMaskedOffOperand, HasVL, HasPolicy, HasNoMaskedOverloaded, HasAutoDef, ManualCodegenMask, MaskTypes.getValue(), IntrinsicTypes, RequiredFeatures, NF)); } } // end for Log2LMULList } // end for TypeRange } } void RVVEmitter::createRVVHeaders(raw_ostream &OS) { std::vector RVVHeaders = Records.getAllDerivedDefinitions("RVVHeader"); for (auto *R : RVVHeaders) { StringRef HeaderCodeStr = R->getValueAsString("HeaderCode"); OS << HeaderCodeStr.str(); } } Optional RVVEmitter::computeTypes(BasicType BT, int Log2LMUL, unsigned NF, ArrayRef PrototypeSeq) { // LMUL x NF must be less than or equal to 8. if ((Log2LMUL >= 1) && (1 << Log2LMUL) * NF > 8) return llvm::None; RVVTypes Types; for (const std::string &Proto : PrototypeSeq) { auto T = computeType(BT, Log2LMUL, Proto); if (!T.hasValue()) return llvm::None; // Record legal type index Types.push_back(T.getValue()); } return Types; } Optional RVVEmitter::computeType(BasicType BT, int Log2LMUL, StringRef Proto) { std::string Idx = Twine(Twine(BT) + Twine(Log2LMUL) + Proto).str(); // Search first auto It = LegalTypes.find(Idx); if (It != LegalTypes.end()) return &(It->second); if (IllegalTypes.count(Idx)) return llvm::None; // Compute type and record the result. RVVType T(BT, Log2LMUL, Proto); if (T.isValid()) { // Record legal type index and value. LegalTypes.insert({Idx, T}); return &(LegalTypes[Idx]); } // Record illegal type index. IllegalTypes.insert(Idx); return llvm::None; } void RVVEmitter::emitArchMacroAndBody( std::vector> &Defs, raw_ostream &OS, std::function PrintBody) { RISCVPredefinedMacroT PrevMacros = (*Defs.begin())->getRISCVPredefinedMacros(); bool NeedEndif = emitMacroRestrictionStr(PrevMacros, OS); for (auto &Def : Defs) { RISCVPredefinedMacroT CurMacros = Def->getRISCVPredefinedMacros(); if (CurMacros != PrevMacros) { if (NeedEndif) OS << "#endif\n\n"; NeedEndif = emitMacroRestrictionStr(CurMacros, OS); PrevMacros = CurMacros; } if (Def->hasAutoDef()) PrintBody(OS, *Def); } if (NeedEndif) OS << "#endif\n\n"; } bool RVVEmitter::emitMacroRestrictionStr(RISCVPredefinedMacroT PredefinedMacros, raw_ostream &OS) { if (PredefinedMacros == RISCVPredefinedMacro::Basic) return false; OS << "#if "; ListSeparator LS(" && "); if (PredefinedMacros & RISCVPredefinedMacro::V) OS << LS << "defined(__riscv_v)"; if (PredefinedMacros & RISCVPredefinedMacro::Zfh) OS << LS << "defined(__riscv_zfh)"; if (PredefinedMacros & RISCVPredefinedMacro::RV64) OS << LS << "(__riscv_xlen == 64)"; if (PredefinedMacros & RISCVPredefinedMacro::VectorMaxELen64) OS << LS << "(__riscv_v_elen >= 64)"; if (PredefinedMacros & RISCVPredefinedMacro::VectorMaxELenFp32) OS << LS << "(__riscv_v_elen_fp >= 32)"; if (PredefinedMacros & RISCVPredefinedMacro::VectorMaxELenFp64) OS << LS << "(__riscv_v_elen_fp >= 64)"; OS << "\n"; return true; } namespace clang { void EmitRVVHeader(RecordKeeper &Records, raw_ostream &OS) { RVVEmitter(Records).createHeader(OS); } void EmitRVVBuiltins(RecordKeeper &Records, raw_ostream &OS) { RVVEmitter(Records).createBuiltins(OS); } void EmitRVVBuiltinCG(RecordKeeper &Records, raw_ostream &OS) { RVVEmitter(Records).createCodeGen(OS); } } // End namespace clang