//===------------------------- MicrosoftDemangle.h --------------*- C++ -*-===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #ifndef LLVM_DEMANGLE_MICROSOFTDEMANGLE_H #define LLVM_DEMANGLE_MICROSOFTDEMANGLE_H #include "llvm/Demangle/Demangle.h" #include "llvm/Demangle/MicrosoftDemangleNodes.h" #include #include #include namespace llvm { namespace ms_demangle { // This memory allocator is extremely fast, but it doesn't call dtors // for allocated objects. That means you can't use STL containers // (such as std::vector) with this allocator. But it pays off -- // the demangler is 3x faster with this allocator compared to one with // STL containers. constexpr size_t AllocUnit = 4096; class ArenaAllocator { struct AllocatorNode { uint8_t *Buf = nullptr; size_t Used = 0; size_t Capacity = 0; AllocatorNode *Next = nullptr; }; void addNode(size_t Capacity) { AllocatorNode *NewHead = new AllocatorNode; NewHead->Buf = new uint8_t[Capacity]; NewHead->Next = Head; NewHead->Capacity = Capacity; Head = NewHead; NewHead->Used = 0; } public: ArenaAllocator() { addNode(AllocUnit); } ~ArenaAllocator() { while (Head) { assert(Head->Buf); delete[] Head->Buf; AllocatorNode *Next = Head->Next; delete Head; Head = Next; } } // Delete the copy constructor and the copy assignment operator. ArenaAllocator(const ArenaAllocator &) = delete; ArenaAllocator &operator=(const ArenaAllocator &) = delete; char *allocUnalignedBuffer(size_t Size) { assert(Head && Head->Buf); uint8_t *P = Head->Buf + Head->Used; Head->Used += Size; if (Head->Used <= Head->Capacity) return reinterpret_cast(P); addNode(std::max(AllocUnit, Size)); Head->Used = Size; return reinterpret_cast(Head->Buf); } template T *allocArray(size_t Count) { size_t Size = Count * sizeof(T); assert(Head && Head->Buf); size_t P = (size_t)Head->Buf + Head->Used; uintptr_t AlignedP = (((size_t)P + alignof(T) - 1) & ~(size_t)(alignof(T) - 1)); uint8_t *PP = (uint8_t *)AlignedP; size_t Adjustment = AlignedP - P; Head->Used += Size + Adjustment; if (Head->Used <= Head->Capacity) return new (PP) T[Count](); addNode(std::max(AllocUnit, Size)); Head->Used = Size; return new (Head->Buf) T[Count](); } template T *alloc(Args &&... ConstructorArgs) { constexpr size_t Size = sizeof(T); assert(Head && Head->Buf); size_t P = (size_t)Head->Buf + Head->Used; uintptr_t AlignedP = (((size_t)P + alignof(T) - 1) & ~(size_t)(alignof(T) - 1)); uint8_t *PP = (uint8_t *)AlignedP; size_t Adjustment = AlignedP - P; Head->Used += Size + Adjustment; if (Head->Used <= Head->Capacity) return new (PP) T(std::forward(ConstructorArgs)...); static_assert(Size < AllocUnit); addNode(AllocUnit); Head->Used = Size; return new (Head->Buf) T(std::forward(ConstructorArgs)...); } private: AllocatorNode *Head = nullptr; }; struct BackrefContext { static constexpr size_t Max = 10; TypeNode *FunctionParams[Max]; size_t FunctionParamCount = 0; // The first 10 BackReferences in a mangled name can be back-referenced by // special name @[0-9]. This is a storage for the first 10 BackReferences. NamedIdentifierNode *Names[Max]; size_t NamesCount = 0; }; enum class QualifierMangleMode { Drop, Mangle, Result }; enum NameBackrefBehavior : uint8_t { NBB_None = 0, // don't save any names as backrefs. NBB_Template = 1 << 0, // save template instanations. NBB_Simple = 1 << 1, // save simple names. }; enum class FunctionIdentifierCodeGroup { Basic, Under, DoubleUnder }; // Demangler class takes the main role in demangling symbols. // It has a set of functions to parse mangled symbols into Type instances. // It also has a set of functions to convert Type instances to strings. class Demangler { friend std::optional llvm::getArm64ECInsertionPointInMangledName(std::string_view MangledName); public: Demangler() = default; virtual ~Demangler() = default; // You are supposed to call parse() first and then check if error is true. If // it is false, call output() to write the formatted name to the given stream. SymbolNode *parse(std::string_view &MangledName); TagTypeNode *parseTagUniqueName(std::string_view &MangledName); // True if an error occurred. bool Error = false; void dumpBackReferences(); private: SymbolNode *demangleEncodedSymbol(std::string_view &MangledName, QualifiedNameNode *QN); SymbolNode *demangleDeclarator(std::string_view &MangledName); SymbolNode *demangleMD5Name(std::string_view &MangledName); SymbolNode *demangleTypeinfoName(std::string_view &MangledName); VariableSymbolNode *demangleVariableEncoding(std::string_view &MangledName, StorageClass SC); FunctionSymbolNode *demangleFunctionEncoding(std::string_view &MangledName); Qualifiers demanglePointerExtQualifiers(std::string_view &MangledName); // Parser functions. This is a recursive-descent parser. TypeNode *demangleType(std::string_view &MangledName, QualifierMangleMode QMM); PrimitiveTypeNode *demanglePrimitiveType(std::string_view &MangledName); CustomTypeNode *demangleCustomType(std::string_view &MangledName); TagTypeNode *demangleClassType(std::string_view &MangledName); PointerTypeNode *demanglePointerType(std::string_view &MangledName); PointerTypeNode *demangleMemberPointerType(std::string_view &MangledName); FunctionSignatureNode *demangleFunctionType(std::string_view &MangledName, bool HasThisQuals); ArrayTypeNode *demangleArrayType(std::string_view &MangledName); NodeArrayNode *demangleFunctionParameterList(std::string_view &MangledName, bool &IsVariadic); NodeArrayNode *demangleTemplateParameterList(std::string_view &MangledName); std::pair demangleNumber(std::string_view &MangledName); uint64_t demangleUnsigned(std::string_view &MangledName); int64_t demangleSigned(std::string_view &MangledName); void memorizeString(std::string_view s); void memorizeIdentifier(IdentifierNode *Identifier); /// Allocate a copy of \p Borrowed into memory that we own. std::string_view copyString(std::string_view Borrowed); QualifiedNameNode * demangleFullyQualifiedTypeName(std::string_view &MangledName); QualifiedNameNode * demangleFullyQualifiedSymbolName(std::string_view &MangledName); IdentifierNode *demangleUnqualifiedTypeName(std::string_view &MangledName, bool Memorize); IdentifierNode *demangleUnqualifiedSymbolName(std::string_view &MangledName, NameBackrefBehavior NBB); QualifiedNameNode *demangleNameScopeChain(std::string_view &MangledName, IdentifierNode *UnqualifiedName); IdentifierNode *demangleNameScopePiece(std::string_view &MangledName); NamedIdentifierNode *demangleBackRefName(std::string_view &MangledName); IdentifierNode * demangleTemplateInstantiationName(std::string_view &MangledName, NameBackrefBehavior NBB); IntrinsicFunctionKind translateIntrinsicFunctionCode(char CH, FunctionIdentifierCodeGroup Group); IdentifierNode *demangleFunctionIdentifierCode(std::string_view &MangledName); IdentifierNode * demangleFunctionIdentifierCode(std::string_view &MangledName, FunctionIdentifierCodeGroup Group); StructorIdentifierNode * demangleStructorIdentifier(std::string_view &MangledName, bool IsDestructor); ConversionOperatorIdentifierNode * demangleConversionOperatorIdentifier(std::string_view &MangledName); LiteralOperatorIdentifierNode * demangleLiteralOperatorIdentifier(std::string_view &MangledName); SymbolNode *demangleSpecialIntrinsic(std::string_view &MangledName); SpecialTableSymbolNode * demangleSpecialTableSymbolNode(std::string_view &MangledName, SpecialIntrinsicKind SIK); LocalStaticGuardVariableNode * demangleLocalStaticGuard(std::string_view &MangledName, bool IsThread); VariableSymbolNode *demangleUntypedVariable(ArenaAllocator &Arena, std::string_view &MangledName, std::string_view VariableName); VariableSymbolNode * demangleRttiBaseClassDescriptorNode(ArenaAllocator &Arena, std::string_view &MangledName); FunctionSymbolNode *demangleInitFiniStub(std::string_view &MangledName, bool IsDestructor); NamedIdentifierNode *demangleSimpleName(std::string_view &MangledName, bool Memorize); NamedIdentifierNode * demangleAnonymousNamespaceName(std::string_view &MangledName); NamedIdentifierNode * demangleLocallyScopedNamePiece(std::string_view &MangledName); EncodedStringLiteralNode * demangleStringLiteral(std::string_view &MangledName); FunctionSymbolNode *demangleVcallThunkNode(std::string_view &MangledName); std::string_view demangleSimpleString(std::string_view &MangledName, bool Memorize); FuncClass demangleFunctionClass(std::string_view &MangledName); CallingConv demangleCallingConvention(std::string_view &MangledName); StorageClass demangleVariableStorageClass(std::string_view &MangledName); bool demangleThrowSpecification(std::string_view &MangledName); wchar_t demangleWcharLiteral(std::string_view &MangledName); uint8_t demangleCharLiteral(std::string_view &MangledName); std::pair demangleQualifiers(std::string_view &MangledName); // Memory allocator. ArenaAllocator Arena; // A single type uses one global back-ref table for all function params. // This means back-refs can even go "into" other types. Examples: // // // Second int* is a back-ref to first. // void foo(int *, int*); // // // Second int* is not a back-ref to first (first is not a function param). // int* foo(int*); // // // Second int* is a back-ref to first (ALL function types share the same // // back-ref map. // using F = void(*)(int*); // F G(int *); BackrefContext Backrefs; }; } // namespace ms_demangle } // namespace llvm #endif // LLVM_DEMANGLE_MICROSOFTDEMANGLE_H