1 //===- MicrosoftDemangle.cpp ----------------------------------------------===//
3 // The LLVM Compiler Infrastructure
5 // This file is dual licensed under the MIT and the University of Illinois Open
6 // Source Licenses. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file defines a demangler for MSVC-style mangled symbols.
12 // This file has no dependencies on the rest of LLVM so that it can be
13 // easily reused in other programs such as libcxxabi.
15 //===----------------------------------------------------------------------===//
17 #include "llvm/Demangle/MicrosoftDemangle.h"
18 #include "llvm/Demangle/Demangle.h"
19 #include "llvm/Demangle/MicrosoftDemangleNodes.h"
21 #include "llvm/Demangle/Compiler.h"
22 #include "llvm/Demangle/StringView.h"
23 #include "llvm/Demangle/Utility.h"
31 using namespace ms_demangle;
33 static bool startsWithDigit(StringView S) {
34 return !S.empty() && std::isdigit(S.front());
40 NodeList *Next = nullptr;
43 static bool isMemberPointer(StringView MangledName, bool &Error) {
45 switch (MangledName.popFront()) {
47 // This is probably an rvalue reference (e.g. $$Q), and you cannot have an
48 // rvalue reference to a member.
51 // 'A' indicates a reference, and you cannot have a reference to a member
52 // function or member.
58 // These 4 values indicate some kind of pointer, but we still don't know
66 // If it starts with a number, then 6 indicates a non-member function
67 // pointer, and 8 indicates a member function pointer.
68 if (startsWithDigit(MangledName)) {
69 assert(MangledName[0] == '6' || MangledName[0] == '8');
70 return (MangledName[0] == '8');
73 // Remove ext qualifiers since those can appear on either type and are
74 // therefore not indicative.
75 MangledName.consumeFront('E'); // 64-bit
76 MangledName.consumeFront('I'); // restrict
77 MangledName.consumeFront('F'); // unaligned
79 assert(!MangledName.empty());
81 // The next value should be either ABCD (non-member) or QRST (member).
82 switch (MangledName.front()) {
99 static SpecialIntrinsicKind
100 consumeSpecialIntrinsicKind(StringView &MangledName) {
101 if (MangledName.consumeFront("?_7"))
102 return SpecialIntrinsicKind::Vftable;
103 if (MangledName.consumeFront("?_8"))
104 return SpecialIntrinsicKind::Vbtable;
105 if (MangledName.consumeFront("?_9"))
106 return SpecialIntrinsicKind::VcallThunk;
107 if (MangledName.consumeFront("?_A"))
108 return SpecialIntrinsicKind::Typeof;
109 if (MangledName.consumeFront("?_B"))
110 return SpecialIntrinsicKind::LocalStaticGuard;
111 if (MangledName.consumeFront("?_C"))
112 return SpecialIntrinsicKind::StringLiteralSymbol;
113 if (MangledName.consumeFront("?_P"))
114 return SpecialIntrinsicKind::UdtReturning;
115 if (MangledName.consumeFront("?_R0"))
116 return SpecialIntrinsicKind::RttiTypeDescriptor;
117 if (MangledName.consumeFront("?_R1"))
118 return SpecialIntrinsicKind::RttiBaseClassDescriptor;
119 if (MangledName.consumeFront("?_R2"))
120 return SpecialIntrinsicKind::RttiBaseClassArray;
121 if (MangledName.consumeFront("?_R3"))
122 return SpecialIntrinsicKind::RttiClassHierarchyDescriptor;
123 if (MangledName.consumeFront("?_R4"))
124 return SpecialIntrinsicKind::RttiCompleteObjLocator;
125 if (MangledName.consumeFront("?_S"))
126 return SpecialIntrinsicKind::LocalVftable;
127 if (MangledName.consumeFront("?__E"))
128 return SpecialIntrinsicKind::DynamicInitializer;
129 if (MangledName.consumeFront("?__F"))
130 return SpecialIntrinsicKind::DynamicAtexitDestructor;
131 if (MangledName.consumeFront("?__J"))
132 return SpecialIntrinsicKind::LocalStaticThreadGuard;
133 return SpecialIntrinsicKind::None;
136 static bool startsWithLocalScopePattern(StringView S) {
137 if (!S.consumeFront('?'))
142 size_t End = S.find('?');
143 if (End == StringView::npos)
145 StringView Candidate = S.substr(0, End);
146 if (Candidate.empty())
150 // ?@? is the discriminator 0.
151 if (Candidate.size() == 1)
152 return Candidate[0] == '@' || (Candidate[0] >= '0' && Candidate[0] <= '9');
154 // If it's not 0-9, then it's an encoded number terminated with an @
155 if (Candidate.back() != '@')
157 Candidate = Candidate.dropBack();
159 // An encoded number starts with B-P and all subsequent digits are in A-P.
160 // Note that the reason the first digit cannot be A is two fold. First, it
161 // would create an ambiguity with ?A which delimits the beginning of an
162 // anonymous namespace. Second, A represents 0, and you don't start a multi
163 // digit number with a leading 0. Presumably the anonymous namespace
164 // ambiguity is also why single digit encoded numbers use 0-9 rather than A-J.
165 if (Candidate[0] < 'B' || Candidate[0] > 'P')
167 Candidate = Candidate.dropFront();
168 while (!Candidate.empty()) {
169 if (Candidate[0] < 'A' || Candidate[0] > 'P')
171 Candidate = Candidate.dropFront();
177 static bool isTagType(StringView S) {
188 static bool isCustomType(StringView S) { return S[0] == '?'; }
190 static bool isPointerType(StringView S) {
191 if (S.startsWith("$$Q")) // foo &&
197 case 'Q': // foo *const
198 case 'R': // foo *volatile
199 case 'S': // foo *const volatile
205 static bool isArrayType(StringView S) { return S[0] == 'Y'; }
207 static bool isFunctionType(StringView S) {
208 return S.startsWith("$$A8@@") || S.startsWith("$$A6");
211 static FunctionRefQualifier
212 demangleFunctionRefQualifier(StringView &MangledName) {
213 if (MangledName.consumeFront('G'))
214 return FunctionRefQualifier::Reference;
215 else if (MangledName.consumeFront('H'))
216 return FunctionRefQualifier::RValueReference;
217 return FunctionRefQualifier::None;
220 static std::pair<Qualifiers, PointerAffinity>
221 demanglePointerCVQualifiers(StringView &MangledName) {
222 if (MangledName.consumeFront("$$Q"))
223 return std::make_pair(Q_None, PointerAffinity::RValueReference);
225 switch (MangledName.popFront()) {
227 return std::make_pair(Q_None, PointerAffinity::Reference);
229 return std::make_pair(Q_None, PointerAffinity::Pointer);
231 return std::make_pair(Q_Const, PointerAffinity::Pointer);
233 return std::make_pair(Q_Volatile, PointerAffinity::Pointer);
235 return std::make_pair(Qualifiers(Q_Const | Q_Volatile),
236 PointerAffinity::Pointer);
238 assert(false && "Ty is not a pointer type!");
240 return std::make_pair(Q_None, PointerAffinity::Pointer);
243 StringView Demangler::copyString(StringView Borrowed) {
244 char *Stable = Arena.allocUnalignedBuffer(Borrowed.size() + 1);
245 std::strcpy(Stable, Borrowed.begin());
247 return {Stable, Borrowed.size()};
250 SpecialTableSymbolNode *
251 Demangler::demangleSpecialTableSymbolNode(StringView &MangledName,
252 SpecialIntrinsicKind K) {
253 NamedIdentifierNode *NI = Arena.alloc<NamedIdentifierNode>();
255 case SpecialIntrinsicKind::Vftable:
256 NI->Name = "`vftable'";
258 case SpecialIntrinsicKind::Vbtable:
259 NI->Name = "`vbtable'";
261 case SpecialIntrinsicKind::LocalVftable:
262 NI->Name = "`local vftable'";
264 case SpecialIntrinsicKind::RttiCompleteObjLocator:
265 NI->Name = "`RTTI Complete Object Locator'";
268 LLVM_BUILTIN_UNREACHABLE;
270 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
271 SpecialTableSymbolNode *STSN = Arena.alloc<SpecialTableSymbolNode>();
273 bool IsMember = false;
274 char Front = MangledName.popFront();
275 if (Front != '6' && Front != '7') {
280 std::tie(STSN->Quals, IsMember) = demangleQualifiers(MangledName);
281 if (!MangledName.consumeFront('@'))
282 STSN->TargetName = demangleFullyQualifiedTypeName(MangledName);
286 LocalStaticGuardVariableNode *
287 Demangler::demangleLocalStaticGuard(StringView &MangledName) {
288 LocalStaticGuardIdentifierNode *LSGI =
289 Arena.alloc<LocalStaticGuardIdentifierNode>();
290 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, LSGI);
291 LocalStaticGuardVariableNode *LSGVN =
292 Arena.alloc<LocalStaticGuardVariableNode>();
295 if (MangledName.consumeFront("4IA"))
296 LSGVN->IsVisible = false;
297 else if (MangledName.consumeFront("5"))
298 LSGVN->IsVisible = true;
304 if (!MangledName.empty())
305 LSGI->ScopeIndex = demangleUnsigned(MangledName);
309 static NamedIdentifierNode *synthesizeNamedIdentifier(ArenaAllocator &Arena,
311 NamedIdentifierNode *Id = Arena.alloc<NamedIdentifierNode>();
316 static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
317 IdentifierNode *Identifier) {
318 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
319 QN->Components = Arena.alloc<NodeArrayNode>();
320 QN->Components->Count = 1;
321 QN->Components->Nodes = Arena.allocArray<Node *>(1);
322 QN->Components->Nodes[0] = Identifier;
326 static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
328 NamedIdentifierNode *Id = synthesizeNamedIdentifier(Arena, Name);
329 return synthesizeQualifiedName(Arena, Id);
332 static VariableSymbolNode *synthesizeVariable(ArenaAllocator &Arena,
334 StringView VariableName) {
335 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
337 VSN->Name = synthesizeQualifiedName(Arena, VariableName);
341 VariableSymbolNode *Demangler::demangleUntypedVariable(
342 ArenaAllocator &Arena, StringView &MangledName, StringView VariableName) {
343 NamedIdentifierNode *NI = synthesizeNamedIdentifier(Arena, VariableName);
344 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
345 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
347 if (MangledName.consumeFront("8"))
355 Demangler::demangleRttiBaseClassDescriptorNode(ArenaAllocator &Arena,
356 StringView &MangledName) {
357 RttiBaseClassDescriptorNode *RBCDN =
358 Arena.alloc<RttiBaseClassDescriptorNode>();
359 RBCDN->NVOffset = demangleUnsigned(MangledName);
360 RBCDN->VBPtrOffset = demangleSigned(MangledName);
361 RBCDN->VBTableOffset = demangleUnsigned(MangledName);
362 RBCDN->Flags = demangleUnsigned(MangledName);
366 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
367 VSN->Name = demangleNameScopeChain(MangledName, RBCDN);
368 MangledName.consumeFront('8');
372 FunctionSymbolNode *Demangler::demangleInitFiniStub(StringView &MangledName,
374 DynamicStructorIdentifierNode *DSIN =
375 Arena.alloc<DynamicStructorIdentifierNode>();
376 DSIN->IsDestructor = IsDestructor;
378 bool IsKnownStaticDataMember = false;
379 if (MangledName.consumeFront('?'))
380 IsKnownStaticDataMember = true;
382 QualifiedNameNode *QN = demangleFullyQualifiedSymbolName(MangledName);
384 SymbolNode *Symbol = demangleEncodedSymbol(MangledName, QN);
385 FunctionSymbolNode *FSN = nullptr;
388 if (Symbol->kind() == NodeKind::VariableSymbol) {
389 DSIN->Variable = static_cast<VariableSymbolNode *>(Symbol);
391 // Older versions of clang mangled this type of symbol incorrectly. They
392 // would omit the leading ? and they would only emit a single @ at the end.
393 // The correct mangling is a leading ? and 2 trailing @ signs. Handle
395 int AtCount = IsKnownStaticDataMember ? 2 : 1;
396 for (int I = 0; I < AtCount; ++I) {
397 if (MangledName.consumeFront('@'))
403 FSN = demangleFunctionEncoding(MangledName);
404 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
406 if (IsKnownStaticDataMember) {
407 // This was supposed to be a static data member, but we got a function.
412 FSN = static_cast<FunctionSymbolNode *>(Symbol);
413 DSIN->Name = Symbol->Name;
414 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
420 SymbolNode *Demangler::demangleSpecialIntrinsic(StringView &MangledName) {
421 SpecialIntrinsicKind SIK = consumeSpecialIntrinsicKind(MangledName);
422 if (SIK == SpecialIntrinsicKind::None)
426 case SpecialIntrinsicKind::StringLiteralSymbol:
427 return demangleStringLiteral(MangledName);
428 case SpecialIntrinsicKind::Vftable:
429 case SpecialIntrinsicKind::Vbtable:
430 case SpecialIntrinsicKind::LocalVftable:
431 case SpecialIntrinsicKind::RttiCompleteObjLocator:
432 return demangleSpecialTableSymbolNode(MangledName, SIK);
433 case SpecialIntrinsicKind::VcallThunk:
434 return demangleVcallThunkNode(MangledName);
435 case SpecialIntrinsicKind::LocalStaticGuard:
436 return demangleLocalStaticGuard(MangledName);
437 case SpecialIntrinsicKind::RttiTypeDescriptor: {
438 TypeNode *T = demangleType(MangledName, QualifierMangleMode::Result);
441 if (!MangledName.consumeFront("@8"))
443 if (!MangledName.empty())
445 return synthesizeVariable(Arena, T, "`RTTI Type Descriptor'");
447 case SpecialIntrinsicKind::RttiBaseClassArray:
448 return demangleUntypedVariable(Arena, MangledName,
449 "`RTTI Base Class Array'");
450 case SpecialIntrinsicKind::RttiClassHierarchyDescriptor:
451 return demangleUntypedVariable(Arena, MangledName,
452 "`RTTI Class Hierarchy Descriptor'");
453 case SpecialIntrinsicKind::RttiBaseClassDescriptor:
454 return demangleRttiBaseClassDescriptorNode(Arena, MangledName);
455 case SpecialIntrinsicKind::DynamicInitializer:
456 return demangleInitFiniStub(MangledName, false);
457 case SpecialIntrinsicKind::DynamicAtexitDestructor:
458 return demangleInitFiniStub(MangledName, true);
467 Demangler::demangleFunctionIdentifierCode(StringView &MangledName) {
468 assert(MangledName.startsWith('?'));
469 MangledName = MangledName.dropFront();
471 if (MangledName.consumeFront("__"))
472 return demangleFunctionIdentifierCode(
473 MangledName, FunctionIdentifierCodeGroup::DoubleUnder);
474 else if (MangledName.consumeFront("_"))
475 return demangleFunctionIdentifierCode(MangledName,
476 FunctionIdentifierCodeGroup::Under);
477 return demangleFunctionIdentifierCode(MangledName,
478 FunctionIdentifierCodeGroup::Basic);
481 StructorIdentifierNode *
482 Demangler::demangleStructorIdentifier(StringView &MangledName,
484 StructorIdentifierNode *N = Arena.alloc<StructorIdentifierNode>();
485 N->IsDestructor = IsDestructor;
489 ConversionOperatorIdentifierNode *
490 Demangler::demangleConversionOperatorIdentifier(StringView &MangledName) {
491 ConversionOperatorIdentifierNode *N =
492 Arena.alloc<ConversionOperatorIdentifierNode>();
496 LiteralOperatorIdentifierNode *
497 Demangler::demangleLiteralOperatorIdentifier(StringView &MangledName) {
498 LiteralOperatorIdentifierNode *N =
499 Arena.alloc<LiteralOperatorIdentifierNode>();
500 N->Name = demangleSimpleString(MangledName, false);
504 static IntrinsicFunctionKind
505 translateIntrinsicFunctionCode(char CH, FunctionIdentifierCodeGroup Group) {
506 // Not all ? identifiers are intrinsics *functions*. This function only maps
507 // operator codes for the special functions, all others are handled elsewhere,
508 // hence the IFK::None entries in the table.
509 using IFK = IntrinsicFunctionKind;
510 static IFK Basic[36] = {
511 IFK::None, // ?0 # Foo::Foo()
512 IFK::None, // ?1 # Foo::~Foo()
513 IFK::New, // ?2 # operator new
514 IFK::Delete, // ?3 # operator delete
515 IFK::Assign, // ?4 # operator=
516 IFK::RightShift, // ?5 # operator>>
517 IFK::LeftShift, // ?6 # operator<<
518 IFK::LogicalNot, // ?7 # operator!
519 IFK::Equals, // ?8 # operator==
520 IFK::NotEquals, // ?9 # operator!=
521 IFK::ArraySubscript, // ?A # operator[]
522 IFK::None, // ?B # Foo::operator <type>()
523 IFK::Pointer, // ?C # operator->
524 IFK::Dereference, // ?D # operator*
525 IFK::Increment, // ?E # operator++
526 IFK::Decrement, // ?F # operator--
527 IFK::Minus, // ?G # operator-
528 IFK::Plus, // ?H # operator+
529 IFK::BitwiseAnd, // ?I # operator&
530 IFK::MemberPointer, // ?J # operator->*
531 IFK::Divide, // ?K # operator/
532 IFK::Modulus, // ?L # operator%
533 IFK::LessThan, // ?M operator<
534 IFK::LessThanEqual, // ?N operator<=
535 IFK::GreaterThan, // ?O operator>
536 IFK::GreaterThanEqual, // ?P operator>=
537 IFK::Comma, // ?Q operator,
538 IFK::Parens, // ?R operator()
539 IFK::BitwiseNot, // ?S operator~
540 IFK::BitwiseXor, // ?T operator^
541 IFK::BitwiseOr, // ?U operator|
542 IFK::LogicalAnd, // ?V operator&&
543 IFK::LogicalOr, // ?W operator||
544 IFK::TimesEqual, // ?X operator*=
545 IFK::PlusEqual, // ?Y operator+=
546 IFK::MinusEqual, // ?Z operator-=
548 static IFK Under[36] = {
549 IFK::DivEqual, // ?_0 operator/=
550 IFK::ModEqual, // ?_1 operator%=
551 IFK::RshEqual, // ?_2 operator>>=
552 IFK::LshEqual, // ?_3 operator<<=
553 IFK::BitwiseAndEqual, // ?_4 operator&=
554 IFK::BitwiseOrEqual, // ?_5 operator|=
555 IFK::BitwiseXorEqual, // ?_6 operator^=
556 IFK::None, // ?_7 # vftable
557 IFK::None, // ?_8 # vbtable
558 IFK::None, // ?_9 # vcall
559 IFK::None, // ?_A # typeof
560 IFK::None, // ?_B # local static guard
561 IFK::None, // ?_C # string literal
562 IFK::VbaseDtor, // ?_D # vbase destructor
563 IFK::VecDelDtor, // ?_E # vector deleting destructor
564 IFK::DefaultCtorClosure, // ?_F # default constructor closure
565 IFK::ScalarDelDtor, // ?_G # scalar deleting destructor
566 IFK::VecCtorIter, // ?_H # vector constructor iterator
567 IFK::VecDtorIter, // ?_I # vector destructor iterator
568 IFK::VecVbaseCtorIter, // ?_J # vector vbase constructor iterator
569 IFK::VdispMap, // ?_K # virtual displacement map
570 IFK::EHVecCtorIter, // ?_L # eh vector constructor iterator
571 IFK::EHVecDtorIter, // ?_M # eh vector destructor iterator
572 IFK::EHVecVbaseCtorIter, // ?_N # eh vector vbase constructor iterator
573 IFK::CopyCtorClosure, // ?_O # copy constructor closure
574 IFK::None, // ?_P<name> # udt returning <name>
575 IFK::None, // ?_Q # <unknown>
576 IFK::None, // ?_R0 - ?_R4 # RTTI Codes
577 IFK::None, // ?_S # local vftable
578 IFK::LocalVftableCtorClosure, // ?_T # local vftable constructor closure
579 IFK::ArrayNew, // ?_U operator new[]
580 IFK::ArrayDelete, // ?_V operator delete[]
581 IFK::None, // ?_W <unused>
582 IFK::None, // ?_X <unused>
583 IFK::None, // ?_Y <unused>
584 IFK::None, // ?_Z <unused>
586 static IFK DoubleUnder[36] = {
587 IFK::None, // ?__0 <unused>
588 IFK::None, // ?__1 <unused>
589 IFK::None, // ?__2 <unused>
590 IFK::None, // ?__3 <unused>
591 IFK::None, // ?__4 <unused>
592 IFK::None, // ?__5 <unused>
593 IFK::None, // ?__6 <unused>
594 IFK::None, // ?__7 <unused>
595 IFK::None, // ?__8 <unused>
596 IFK::None, // ?__9 <unused>
597 IFK::ManVectorCtorIter, // ?__A managed vector ctor iterator
598 IFK::ManVectorDtorIter, // ?__B managed vector dtor iterator
599 IFK::EHVectorCopyCtorIter, // ?__C EH vector copy ctor iterator
600 IFK::EHVectorVbaseCopyCtorIter, // ?__D EH vector vbase copy ctor iter
601 IFK::None, // ?__E dynamic initializer for `T'
602 IFK::None, // ?__F dynamic atexit destructor for `T'
603 IFK::VectorCopyCtorIter, // ?__G vector copy constructor iter
604 IFK::VectorVbaseCopyCtorIter, // ?__H vector vbase copy ctor iter
605 IFK::ManVectorVbaseCopyCtorIter, // ?__I managed vector vbase copy ctor
607 IFK::None, // ?__J local static thread guard
608 IFK::None, // ?__K operator ""_name
609 IFK::CoAwait, // ?__L co_await
610 IFK::None, // ?__M <unused>
611 IFK::None, // ?__N <unused>
612 IFK::None, // ?__O <unused>
613 IFK::None, // ?__P <unused>
614 IFK::None, // ?__Q <unused>
615 IFK::None, // ?__R <unused>
616 IFK::None, // ?__S <unused>
617 IFK::None, // ?__T <unused>
618 IFK::None, // ?__U <unused>
619 IFK::None, // ?__V <unused>
620 IFK::None, // ?__W <unused>
621 IFK::None, // ?__X <unused>
622 IFK::None, // ?__Y <unused>
623 IFK::None, // ?__Z <unused>
626 int Index = (CH >= '0' && CH <= '9') ? (CH - '0') : (CH - 'A' + 10);
628 case FunctionIdentifierCodeGroup::Basic:
630 case FunctionIdentifierCodeGroup::Under:
632 case FunctionIdentifierCodeGroup::DoubleUnder:
633 return DoubleUnder[Index];
635 LLVM_BUILTIN_UNREACHABLE;
639 Demangler::demangleFunctionIdentifierCode(StringView &MangledName,
640 FunctionIdentifierCodeGroup Group) {
642 case FunctionIdentifierCodeGroup::Basic:
643 switch (char CH = MangledName.popFront()) {
646 return demangleStructorIdentifier(MangledName, CH == '1');
648 return demangleConversionOperatorIdentifier(MangledName);
650 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
651 translateIntrinsicFunctionCode(CH, Group));
654 case FunctionIdentifierCodeGroup::Under:
655 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
656 translateIntrinsicFunctionCode(MangledName.popFront(), Group));
657 case FunctionIdentifierCodeGroup::DoubleUnder:
658 switch (char CH = MangledName.popFront()) {
660 return demangleLiteralOperatorIdentifier(MangledName);
662 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
663 translateIntrinsicFunctionCode(CH, Group));
666 // No Mangling Yet: Spaceship, // operator<=>
671 SymbolNode *Demangler::demangleEncodedSymbol(StringView &MangledName,
672 QualifiedNameNode *Name) {
674 switch (MangledName.front()) {
680 StorageClass SC = demangleVariableStorageClass(MangledName);
681 return demangleVariableEncoding(MangledName, SC);
686 FunctionSymbolNode *FSN = demangleFunctionEncoding(MangledName);
688 IdentifierNode *UQN = Name->getUnqualifiedIdentifier();
689 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
690 ConversionOperatorIdentifierNode *COIN =
691 static_cast<ConversionOperatorIdentifierNode *>(UQN);
692 COIN->TargetType = FSN->Signature->ReturnType;
697 // Parser entry point.
698 SymbolNode *Demangler::parse(StringView &MangledName) {
699 // We can't demangle MD5 names, just output them as-is.
700 // Also, MSVC-style mangled symbols must start with '?'.
701 if (MangledName.startsWith("??@")) {
702 // This is an MD5 mangled name. We can't demangle it, just return the
704 SymbolNode *S = Arena.alloc<SymbolNode>(NodeKind::Md5Symbol);
705 S->Name = synthesizeQualifiedName(Arena, MangledName);
709 if (!MangledName.startsWith('?')) {
714 MangledName.consumeFront('?');
716 // ?$ is a template instantiation, but all other names that start with ? are
717 // operators / special names.
718 if (SymbolNode *SI = demangleSpecialIntrinsic(MangledName))
721 // What follows is a main symbol name. This may include namespaces or class
723 QualifiedNameNode *QN = demangleFullyQualifiedSymbolName(MangledName);
727 SymbolNode *Symbol = demangleEncodedSymbol(MangledName, QN);
738 TagTypeNode *Demangler::parseTagUniqueName(StringView &MangledName) {
739 if (!MangledName.consumeFront(".?A"))
741 MangledName.consumeFront(".?A");
742 if (MangledName.empty())
745 return demangleClassType(MangledName);
748 // <type-encoding> ::= <storage-class> <variable-type>
749 // <storage-class> ::= 0 # private static member
750 // ::= 1 # protected static member
751 // ::= 2 # public static member
753 // ::= 4 # static local
755 VariableSymbolNode *Demangler::demangleVariableEncoding(StringView &MangledName,
757 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
759 VSN->Type = demangleType(MangledName, QualifierMangleMode::Drop);
762 // <variable-type> ::= <type> <cvr-qualifiers>
763 // ::= <type> <pointee-cvr-qualifiers> # pointers, references
764 switch (VSN->Type->kind()) {
765 case NodeKind::PointerType: {
766 PointerTypeNode *PTN = static_cast<PointerTypeNode *>(VSN->Type);
768 Qualifiers ExtraChildQuals = Q_None;
769 PTN->Quals = Qualifiers(VSN->Type->Quals |
770 demanglePointerExtQualifiers(MangledName));
772 bool IsMember = false;
773 std::tie(ExtraChildQuals, IsMember) = demangleQualifiers(MangledName);
775 if (PTN->ClassParent) {
776 QualifiedNameNode *BackRefName =
777 demangleFullyQualifiedTypeName(MangledName);
780 PTN->Pointee->Quals = Qualifiers(PTN->Pointee->Quals | ExtraChildQuals);
785 VSN->Type->Quals = demangleQualifiers(MangledName).first;
792 // Sometimes numbers are encoded in mangled symbols. For example,
793 // "int (*x)[20]" is a valid C type (x is a pointer to an array of
794 // length 20), so we need some way to embed numbers as part of symbols.
795 // This function parses it.
797 // <number> ::= [?] <non-negative integer>
799 // <non-negative integer> ::= <decimal digit> # when 1 <= Number <= 10
800 // ::= <hex digit>+ @ # when Number == 0 or >= 10
802 // <hex-digit> ::= [A-P] # A = 0, B = 1, ...
803 std::pair<uint64_t, bool> Demangler::demangleNumber(StringView &MangledName) {
804 bool IsNegative = MangledName.consumeFront('?');
806 if (startsWithDigit(MangledName)) {
807 uint64_t Ret = MangledName[0] - '0' + 1;
808 MangledName = MangledName.dropFront(1);
809 return {Ret, IsNegative};
813 for (size_t i = 0; i < MangledName.size(); ++i) {
814 char C = MangledName[i];
816 MangledName = MangledName.dropFront(i + 1);
817 return {Ret, IsNegative};
819 if ('A' <= C && C <= 'P') {
820 Ret = (Ret << 4) + (C - 'A');
827 return {0ULL, false};
830 uint64_t Demangler::demangleUnsigned(StringView &MangledName) {
831 bool IsNegative = false;
833 std::tie(Number, IsNegative) = demangleNumber(MangledName);
839 int64_t Demangler::demangleSigned(StringView &MangledName) {
840 bool IsNegative = false;
842 std::tie(Number, IsNegative) = demangleNumber(MangledName);
843 if (Number > INT64_MAX)
845 int64_t I = static_cast<int64_t>(Number);
846 return IsNegative ? -I : I;
849 // First 10 strings can be referenced by special BackReferences ?0, ?1, ..., ?9.
851 void Demangler::memorizeString(StringView S) {
852 if (Backrefs.NamesCount >= BackrefContext::Max)
854 for (size_t i = 0; i < Backrefs.NamesCount; ++i)
855 if (S == Backrefs.Names[i]->Name)
857 NamedIdentifierNode *N = Arena.alloc<NamedIdentifierNode>();
859 Backrefs.Names[Backrefs.NamesCount++] = N;
862 NamedIdentifierNode *Demangler::demangleBackRefName(StringView &MangledName) {
863 assert(startsWithDigit(MangledName));
865 size_t I = MangledName[0] - '0';
866 if (I >= Backrefs.NamesCount) {
871 MangledName = MangledName.dropFront();
872 return Backrefs.Names[I];
875 void Demangler::memorizeIdentifier(IdentifierNode *Identifier) {
876 // Render this class template name into a string buffer so that we can
877 // memorize it for the purpose of back-referencing.
879 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
880 // FIXME: Propagate out-of-memory as an error?
882 Identifier->output(OS, OF_Default);
884 char *Name = OS.getBuffer();
886 StringView Owned = copyString(Name);
887 memorizeString(Owned);
892 Demangler::demangleTemplateInstantiationName(StringView &MangledName,
893 NameBackrefBehavior NBB) {
894 assert(MangledName.startsWith("?$"));
895 MangledName.consumeFront("?$");
897 BackrefContext OuterContext;
898 std::swap(OuterContext, Backrefs);
900 IdentifierNode *Identifier =
901 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
903 Identifier->TemplateParams = demangleTemplateParameterList(MangledName);
905 std::swap(OuterContext, Backrefs);
909 if (NBB & NBB_Template)
910 memorizeIdentifier(Identifier);
915 NamedIdentifierNode *Demangler::demangleSimpleName(StringView &MangledName,
917 StringView S = demangleSimpleString(MangledName, Memorize);
921 NamedIdentifierNode *Name = Arena.alloc<NamedIdentifierNode>();
// Returns true when C lies in the range 'A'..'P', the alphabet used for
// rebased hex digits.
static bool isRebasedHexDigit(char C) { return !(C < 'A' || C > 'P'); }

// Converts a rebased hex digit to its numeric value: 'A'..'J' give 0..9 and
// 'K'..'P' give 10..15. C must satisfy isRebasedHexDigit (asserted).
static uint8_t rebasedHexDigitToNumber(char C) {
  assert(isRebasedHexDigit(C));
  if (C > 'J')
    return 10 + C - 'K';
  return C - 'A';
}
933 uint8_t Demangler::demangleCharLiteral(StringView &MangledName) {
934 if (!MangledName.startsWith('?'))
935 return MangledName.popFront();
937 MangledName = MangledName.dropFront();
938 if (MangledName.empty())
939 goto CharLiteralError;
941 if (MangledName.consumeFront('$')) {
943 if (MangledName.size() < 2)
944 goto CharLiteralError;
945 StringView Nibbles = MangledName.substr(0, 2);
946 if (!isRebasedHexDigit(Nibbles[0]) || !isRebasedHexDigit(Nibbles[1]))
947 goto CharLiteralError;
948 // Don't append the null terminator.
949 uint8_t C1 = rebasedHexDigitToNumber(Nibbles[0]);
950 uint8_t C2 = rebasedHexDigitToNumber(Nibbles[1]);
951 MangledName = MangledName.dropFront(2);
952 return (C1 << 4) | C2;
955 if (startsWithDigit(MangledName)) {
956 const char *Lookup = ",/\\:. \n\t'-";
957 char C = Lookup[MangledName[0] - '0'];
958 MangledName = MangledName.dropFront();
962 if (MangledName[0] >= 'a' && MangledName[0] <= 'z') {
963 char Lookup[26] = {'\xE1', '\xE2', '\xE3', '\xE4', '\xE5', '\xE6', '\xE7',
964 '\xE8', '\xE9', '\xEA', '\xEB', '\xEC', '\xED', '\xEE',
965 '\xEF', '\xF0', '\xF1', '\xF2', '\xF3', '\xF4', '\xF5',
966 '\xF6', '\xF7', '\xF8', '\xF9', '\xFA'};
967 char C = Lookup[MangledName[0] - 'a'];
968 MangledName = MangledName.dropFront();
972 if (MangledName[0] >= 'A' && MangledName[0] <= 'Z') {
973 char Lookup[26] = {'\xC1', '\xC2', '\xC3', '\xC4', '\xC5', '\xC6', '\xC7',
974 '\xC8', '\xC9', '\xCA', '\xCB', '\xCC', '\xCD', '\xCE',
975 '\xCF', '\xD0', '\xD1', '\xD2', '\xD3', '\xD4', '\xD5',
976 '\xD6', '\xD7', '\xD8', '\xD9', '\xDA'};
977 char C = Lookup[MangledName[0] - 'A'];
978 MangledName = MangledName.dropFront();
987 wchar_t Demangler::demangleWcharLiteral(StringView &MangledName) {
990 C1 = demangleCharLiteral(MangledName);
992 goto WCharLiteralError;
993 C2 = demangleCharLiteral(MangledName);
995 goto WCharLiteralError;
997 return ((wchar_t)C1 << 8) | (wchar_t)C2;
// Stores the upper-case hexadecimal character for Digit (0..15, asserted)
// into *Buffer. Exactly one character is written.
static void writeHexDigit(char *Buffer, uint8_t Digit) {
  assert(Digit <= 15);
  if (Digit < 10)
    *Buffer = '0' + Digit;
  else
    *Buffer = 'A' + Digit - 10;
}
1009 static void outputHex(OutputStream &OS, unsigned C) {
1014 // It's easier to do the math if we can work from right to left, but we need
1015 // to print the numbers from left to right. So render this into a temporary
1016 // buffer first, then output the temporary buffer. Each byte is of the form
1017 // \xAB, which means that each byte needs 4 characters. Since there are at
1018 // most 4 bytes, we need a 4*4+1 = 17 character temporary buffer.
1019 char TempBuffer[17];
1021 ::memset(TempBuffer, 0, sizeof(TempBuffer));
1022 constexpr int MaxPos = 15;
1024 int Pos = MaxPos - 1;
1026 for (int I = 0; I < 2; ++I) {
1027 writeHexDigit(&TempBuffer[Pos--], C % 16);
1030 TempBuffer[Pos--] = 'x';
1031 TempBuffer[Pos--] = '\\';
1034 OS << StringView(&TempBuffer[Pos + 1]);
1037 static void outputEscapedChar(OutputStream &OS, unsigned C) {
1039 case '\'': // single quote
1042 case '\"': // double quote
1045 case '\\': // backslash
1051 case '\b': // backspace
1054 case '\f': // form feed
1057 case '\n': // new line
1060 case '\r': // carriage return
1066 case '\v': // vertical tab
1073 if (C > 0x1F && C < 0x7F) {
1074 // Standard ascii char.
1082 static unsigned countTrailingNullBytes(const uint8_t *StringBytes, int Length) {
1083 const uint8_t *End = StringBytes + Length - 1;
1085 while (Length > 0 && *End == 0) {
1093 static unsigned countEmbeddedNulls(const uint8_t *StringBytes,
1095 unsigned Result = 0;
1096 for (unsigned I = 0; I < Length; ++I) {
1097 if (*StringBytes++ == 0)
1103 static unsigned guessCharByteSize(const uint8_t *StringBytes, unsigned NumChars,
1104 unsigned NumBytes) {
1105 assert(NumBytes > 0);
1107 // If the number of bytes is odd, this is guaranteed to be a char string.
1108 if (NumBytes % 2 == 1)
1111 // All strings can encode at most 32 bytes of data. If it's less than that,
1112 // then we encoded the entire string. In this case we check for a 1-byte,
1113 // 2-byte, or 4-byte null terminator.
1114 if (NumBytes < 32) {
1115 unsigned TrailingNulls = countTrailingNullBytes(StringBytes, NumChars);
1116 if (TrailingNulls >= 4)
1118 if (TrailingNulls >= 2)
1123 // The whole string was not able to be encoded. Try to look at embedded null
1124 // terminators to guess. The heuristic is that we count all embedded null
1125 // terminators. If more than 2/3 are null, it's a char32. If more than 1/3
1126 // are null, it's a char16. Otherwise it's a char8. This obviously isn't
1127 // perfect and is biased towards languages that have ascii alphabets, but this
1128 // was always going to be best effort since the encoding is lossy.
1129 unsigned Nulls = countEmbeddedNulls(StringBytes, NumChars);
1130 if (Nulls >= 2 * NumChars / 3)
1132 if (Nulls >= NumChars / 3)
// Reads the character at index CharIndex from StringBytes, where every
// character occupies CharBytes bytes (1, 2 or 4, asserted), and returns its
// value. Bytes are combined least-significant byte first: byte I of the
// character lands in bits [8*I, 8*I + 7] of the result.
static unsigned decodeMultiByteChar(const uint8_t *StringBytes,
                                    unsigned CharIndex, unsigned CharBytes) {
  assert(CharBytes == 1 || CharBytes == 2 || CharBytes == 4);
  const uint8_t *CharStart = StringBytes + CharIndex * CharBytes;
  unsigned Result = 0;
  for (unsigned I = 0; I < CharBytes; ++I) {
    unsigned C = static_cast<unsigned>(CharStart[I]);
    Result |= C << (8 * I);
  }
  // The function is declared to return unsigned; hand back the assembled
  // value rather than falling off the end.
  return Result;
}
// Builds the FunctionSymbolNode for a vcall thunk.  The name is a scope chain
// whose unqualified piece is a VcallThunkIdentifierNode; after the name the
// mangling is expected to contain "$B", an unsigned vtable offset, 'A', and a
// calling-convention code.  Returns nullptr if Error is set once parsing is
// done, otherwise the populated node.
1150 FunctionSymbolNode *Demangler::demangleVcallThunkNode(StringView &MangledName) {
1151 FunctionSymbolNode *FSN = Arena.alloc<FunctionSymbolNode>();
1152 VcallThunkIdentifierNode *VTIN = Arena.alloc<VcallThunkIdentifierNode>();
// The thunk's signature is a ThunkSignatureNode flagged as having no
// parameter list.
1153 FSN->Signature = Arena.alloc<ThunkSignatureNode>();
1154 FSN->Signature->FunctionClass = FC_NoParameterList;
1156 FSN->Name = demangleNameScopeChain(MangledName, VTIN);
// A missing "$B" marker is recorded as an error.
1158 Error = !MangledName.consumeFront("$B");
1160 VTIN->OffsetInVTable = demangleUnsigned(MangledName);
// So is a missing 'A' after the offset.
1162 Error = !MangledName.consumeFront('A');
1164 FSN->Signature->CallConvention = demangleCallingConvention(MangledName);
1165 return (Error) ? nullptr : FSN;
// Decodes a mangled string literal into an EncodedStringLiteralNode.
//
// The layout consumed here is: the prefix "@_", one character selecting the
// character type, the literal's byte length (via demangleNumber), a CRC that
// runs up to the next '@', and then the encoded characters up to a closing
// '@'.  Malformed input jumps to the StringLiteralError label.  The decoded,
// escaped text is rendered into a temporary output stream and copied into
// Result->DecodedString.
1168 EncodedStringLiteralNode *
1169 Demangler::demangleStringLiteral(StringView &MangledName) {
1170 // This function uses goto, so declare all variables up front.
1173 uint64_t StringByteSize;
1174 bool IsWcharT = false;
1175 bool IsNegative = false;
1176 size_t CrcEndPos = 0;
1177 char *ResultBuffer = nullptr;
1179 EncodedStringLiteralNode *Result = Arena.alloc<EncodedStringLiteralNode>();
1181 // Prefix indicating the beginning of a string literal
1182 if (!MangledName.consumeFront("@_"))
1183 goto StringLiteralError;
1184 if (MangledName.empty())
1185 goto StringLiteralError;
1187 // Char Type (regular or wchar_t)
1188 switch (MangledName.popFront()) {
1195 goto StringLiteralError;
// Byte length of the literal; a negative length is rejected.
1199 std::tie(StringByteSize, IsNegative) = demangleNumber(MangledName);
1200 if (Error || IsNegative)
1201 goto StringLiteralError;
1203 // CRC 32 (always 8 characters plus a terminator)
1204 CrcEndPos = MangledName.find('@');
1205 if (CrcEndPos == StringView::npos)
1206 goto StringLiteralError;
1207 CRC = MangledName.substr(0, CrcEndPos);
// Skip the CRC together with its '@' terminator; something must follow it.
1208 MangledName = MangledName.dropFront(CrcEndPos + 1);
1209 if (MangledName.empty())
1210 goto StringLiteralError;
1212 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
1213 // FIXME: Propagate out-of-memory as an error?
// wchar_t literals: a recorded size above 64 bytes marks the literal as
// truncated.
1216 Result->Char = CharKind::Wchar;
1217 if (StringByteSize > 64)
1218 Result->IsTruncated = true;
1220 while (!MangledName.consumeFront('@')) {
1221 assert(StringByteSize >= 2);
1222 wchar_t W = demangleWcharLiteral(MangledName);
// The character is not printed when exactly 2 bytes remain and the literal is
// not truncated (presumably the null terminator -- confirm).
1223 if (StringByteSize != 2 || Result->IsTruncated)
1224 outputEscapedChar(OS, W);
1225 StringByteSize -= 2;
1227 goto StringLiteralError;
1230 // The max byte length is actually 32, but some compilers mangled strings
1231 // incorrectly, so we have to assume it can go higher.
1232 constexpr unsigned MaxStringByteLength = 32 * 4;
1233 uint8_t StringBytes[MaxStringByteLength];
1235 unsigned BytesDecoded = 0;
// NOTE(review): no check of BytesDecoded against MaxStringByteLength, nor of
// Error or an exhausted MangledName, is visible in this loop.  Input with more
// encoded characters than the buffer holds, or with no closing '@', looks able
// to write past the end of StringBytes -- confirm and add a bound.
1236 while (!MangledName.consumeFront('@')) {
1237 assert(StringByteSize >= 1);
1238 StringBytes[BytesDecoded++] = demangleCharLiteral(MangledName);
// Fewer decoded bytes than the recorded size means the literal was truncated.
1241 if (StringByteSize > BytesDecoded)
1242 Result->IsTruncated = true;
// The mangling does not record the character width, so it is guessed from the
// decoded bytes and the recorded byte size.
1244 unsigned CharBytes =
1245 guessCharByteSize(StringBytes, BytesDecoded, StringByteSize);
1246 assert(StringByteSize % CharBytes == 0);
1247 switch (CharBytes) {
1249 Result->Char = CharKind::Char;
1252 Result->Char = CharKind::Char16;
1255 Result->Char = CharKind::Char32;
1258 LLVM_BUILTIN_UNREACHABLE;
1260 const unsigned NumChars = BytesDecoded / CharBytes;
1261 for (unsigned CharIndex = 0; CharIndex < NumChars; ++CharIndex) {
1263 decodeMultiByteChar(StringBytes, CharIndex, CharBytes);
// The final character is only printed for truncated literals.
1264 if (CharIndex + 1 < NumChars || Result->IsTruncated)
1265 outputEscapedChar(OS, NextChar);
// Copy the rendered text into the node, then release the stream's buffer.
1270 ResultBuffer = OS.getBuffer();
1271 Result->DecodedString = copyString(ResultBuffer);
1272 std::free(ResultBuffer);
// Reads a simple string terminated by '@': scans MangledName for the first
// '@', takes the text before it, and advances MangledName past the '@'.
1280 StringView Demangler::demangleSimpleString(StringView &MangledName,
1283 for (size_t i = 0; i < MangledName.size(); ++i) {
1284 if (MangledName[i] != '@')
1286 S = MangledName.substr(0, i);
1287 MangledName = MangledName.dropFront(i + 1);
// Demangles an anonymous-namespace scope piece, which starts with "?A" and
// runs up to the next '@'.  The resulting node is always named
// "`anonymous namespace'"; the text between "?A" and '@' is only memorized
// (memorizeString) and does not appear in the name.
1298 NamedIdentifierNode *
1299 Demangler::demangleAnonymousNamespaceName(StringView &MangledName) {
1300 assert(MangledName.startsWith("?A"));
1301 MangledName.consumeFront("?A");
1303 NamedIdentifierNode *Node = Arena.alloc<NamedIdentifierNode>();
1304 Node->Name = "`anonymous namespace'";
1305 size_t EndPos = MangledName.find('@');
1306 if (EndPos == StringView::npos) {
1310 StringView NamespaceKey = MangledName.substr(0, EndPos);
1311 memorizeString(NamespaceKey);
// Continue after the terminating '@'.
1312 MangledName = MangledName.substr(EndPos + 1);
// Demangles a locally scoped name piece: '?', a number, '?', and then a nested
// mangled symbol.  The identifier's name is the rendered parent symbol
// followed by "::`<number>'".
1316 NamedIdentifierNode *
1317 Demangler::demangleLocallyScopedNamePiece(StringView &MangledName) {
1318 assert(startsWithLocalScopePattern(MangledName));
1320 NamedIdentifierNode *Identifier = Arena.alloc<NamedIdentifierNode>();
1321 MangledName.consumeFront('?');
1322 auto Number = demangleNumber(MangledName);
// The number is expected to be non-negative.
1323 assert(!Number.second);
1325 // One ? to terminate the number
1326 MangledName.consumeFront('?');
// The enclosing symbol is itself a full mangled name, so parse it recursively.
1329 Node *Scope = parse(MangledName);
1333 // Render the parent symbol's name into a buffer.
1335 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
1336 // FIXME: Propagate out-of-memory as an error?
1339 Scope->output(OS, OF_Default);
1341 OS << "::`" << Number.first << "'";
// Copy the rendered text so the identifier does not point into the stream's
// buffer.
1343 char *Result = OS.getBuffer();
1344 Identifier->Name = copyString(Result);
1349 // Parses a type name in the form of A@B@C@@ which represents C::B::A.
// The leftmost component is read as an unqualified type name (with its second
// argument set to true); the remaining components are read as a scope chain.
1351 Demangler::demangleFullyQualifiedTypeName(StringView &MangledName) {
1352 IdentifierNode *Identifier = demangleUnqualifiedTypeName(MangledName, true);
1357 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
1364 // Parses a symbol name in the form of A@B@C@@ which represents C::B::A.
1365 // Symbol names have slightly different rules regarding what can appear
1366 // so we separate out the implementations for flexibility.
1368 Demangler::demangleFullyQualifiedSymbolName(StringView &MangledName) {
1369 // This is the final component of a symbol name (i.e. the leftmost component
1370 // of a mangled name. Since the only possible template instantiation that
1371 // can appear in this context is a function template, and since those are
1372 // not saved for the purposes of name backreferences, only backref simple
1374 IdentifierNode *Identifier =
1375 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
1379 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
// A structor identifier needs to know which class it belongs to: that is the
// second-to-last component of the qualified name.
// NOTE(review): the "at least two components" requirement is only enforced by
// the assert below; a mangled structor with no enclosing scope would index
// out of range in builds without asserts -- confirm.
1383 if (Identifier->kind() == NodeKind::StructorIdentifier) {
1384 StructorIdentifierNode *SIN =
1385 static_cast<StructorIdentifierNode *>(Identifier);
1386 assert(QN->Components->Count >= 2);
1387 Node *ClassNode = QN->Components->Nodes[QN->Components->Count - 2];
1388 SIN->Class = static_cast<IdentifierNode *>(ClassNode);
// Demangles the innermost component of a type name.  Dispatch order: a leading
// digit is a name back-reference, "?$" is a template instantiation, anything
// else is a simple name (Memorize is forwarded to demangleSimpleName).
1394 IdentifierNode *Demangler::demangleUnqualifiedTypeName(StringView &MangledName,
1396 // An inner-most name can be a back-reference, because a fully-qualified name
1397 // (e.g. Scope + Inner) can contain other fully qualified names inside of
1398 // them (for example template parameters), and these nested parameters can
1399 // refer to previously mangled types.
1400 if (startsWithDigit(MangledName))
1401 return demangleBackRefName(MangledName);
1403 if (MangledName.startsWith("?$"))
1404 return demangleTemplateInstantiationName(MangledName, NBB_Template);
1406 return demangleSimpleName(MangledName, Memorize);
// Demangles the innermost component of a symbol name.  Dispatch order: a
// leading digit is a name back-reference, "?$" is a template instantiation
// (NBB is forwarded), any other leading '?' is a function identifier code, and
// anything else is a simple name that is memorized only when NBB contains
// NBB_Simple.
1410 Demangler::demangleUnqualifiedSymbolName(StringView &MangledName,
1411 NameBackrefBehavior NBB) {
1412 if (startsWithDigit(MangledName))
1413 return demangleBackRefName(MangledName);
// "?$" must be tested before the plain '?' check below.
1414 if (MangledName.startsWith("?$"))
1415 return demangleTemplateInstantiationName(MangledName, NBB);
1416 if (MangledName.startsWith('?'))
1417 return demangleFunctionIdentifierCode(MangledName);
1418 return demangleSimpleName(MangledName, (NBB & NBB_Simple) != 0);
// Demangles one enclosing-scope component of a qualified name.  Tried in
// order: name back-reference (leading digit), template instantiation ("?$"),
// anonymous namespace ("?A"), locally scoped name, and finally a simple name,
// which is always memorized.
1421 IdentifierNode *Demangler::demangleNameScopePiece(StringView &MangledName) {
1422 if (startsWithDigit(MangledName))
1423 return demangleBackRefName(MangledName);
1425 if (MangledName.startsWith("?$"))
1426 return demangleTemplateInstantiationName(MangledName, NBB_Template);
1428 if (MangledName.startsWith("?A"))
1429 return demangleAnonymousNamespaceName(MangledName);
1431 if (startsWithLocalScopePattern(MangledName))
1432 return demangleLocallyScopedNamePiece(MangledName);
1434 return demangleSimpleName(MangledName, true);
// Converts a linked NodeList starting at Head into an arena-allocated
// NodeArrayNode with room for Count node pointers, filled in list order.
1437 static NodeArrayNode *nodeListToNodeArray(ArenaAllocator &Arena, NodeList *Head,
1439 NodeArrayNode *N = Arena.alloc<NodeArrayNode>();
1441 N->Nodes = Arena.allocArray<Node *>(Count);
1442 for (size_t I = 0; I < Count; ++I) {
1443 N->Nodes[I] = Head->N;
// Demangles the enclosing scopes that follow an already-parsed unqualified
// name, up to the terminating '@', and returns the combined QualifiedNameNode.
// Each newly read scope is linked in front of the current list head, so the
// list handed to nodeListToNodeArray starts with the most recently read scope.
1450 Demangler::demangleNameScopeChain(StringView &MangledName,
1451 IdentifierNode *UnqualifiedName) {
1452 NodeList *Head = Arena.alloc<NodeList>();
1454 Head->N = UnqualifiedName;
1457 while (!MangledName.consumeFront("@")) {
1459 NodeList *NewHead = Arena.alloc<NodeList>();
1460 NewHead->Next = Head;
// Input that ends before the terminating '@' is handled separately.
1463 if (MangledName.empty()) {
1469 IdentifierNode *Elem = demangleNameScopePiece(MangledName);
1476 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
1477 QN->Components = nodeListToNodeArray(Arena, Head, Count);
// Maps the function-class code at the front of MangledName to a FuncClass bit
// set (access level, static/virtual, this-adjust and far flags).  One
// character is popped and switched on; one branch additionally accepts an
// optional 'R' and a second code character for virtual this-adjusting thunks.
//
// NOTE(review): among the private entries below, two adjacent pairs are
// identical (FC_Private | FC_Static twice, FC_Private | FC_Virtual twice),
// whereas the corresponding protected and public pairs differ by FC_Far.  The
// second entry of each private pair looks like it is missing FC_Far --
// confirm.
1481 FuncClass Demangler::demangleFunctionClass(StringView &MangledName) {
1482 switch (MangledName.popFront()) {
1484 return FuncClass(FC_ExternC | FC_NoParameterList);
1488 return FuncClass(FC_Private | FC_Far);
1490 return FuncClass(FC_Private | FC_Static);
1492 return FuncClass(FC_Private | FC_Static);
1494 return FuncClass(FC_Private | FC_Virtual);
1496 return FuncClass(FC_Private | FC_Virtual);
1498 return FuncClass(FC_Private | FC_StaticThisAdjust);
1500 return FuncClass(FC_Private | FC_StaticThisAdjust | FC_Far);
1502 return FuncClass(FC_Protected);
1504 return FuncClass(FC_Protected | FC_Far);
1506 return FuncClass(FC_Protected | FC_Static);
1508 return FuncClass(FC_Protected | FC_Static | FC_Far);
1510 return FuncClass(FC_Protected | FC_Virtual);
1512 return FuncClass(FC_Protected | FC_Virtual | FC_Far);
1514 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust);
1516 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust | FC_Far);
1518 return FuncClass(FC_Public);
1520 return FuncClass(FC_Public | FC_Far);
1522 return FuncClass(FC_Public | FC_Static);
1524 return FuncClass(FC_Public | FC_Static | FC_Far);
1526 return FuncClass(FC_Public | FC_Virtual);
1528 return FuncClass(FC_Public | FC_Virtual | FC_Far);
1530 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust);
1532 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust | FC_Far);
1534 return FuncClass(FC_Global);
1536 return FuncClass(FC_Global | FC_Far);
// Virtual this-adjusting thunks: an optional 'R' adds FC_VirtualThisAdjustEx,
// then a second character selects the access level and far flag.
1538 FuncClass VFlag = FC_VirtualThisAdjust;
1539 if (MangledName.consumeFront('R'))
1540 VFlag = FuncClass(VFlag | FC_VirtualThisAdjustEx);
1542 switch (MangledName.popFront()) {
1544 return FuncClass(FC_Private | FC_Virtual | VFlag);
1546 return FuncClass(FC_Private | FC_Virtual | VFlag | FC_Far);
1548 return FuncClass(FC_Protected | FC_Virtual | VFlag);
1550 return FuncClass(FC_Protected | FC_Virtual | VFlag | FC_Far);
1552 return FuncClass(FC_Public | FC_Virtual | VFlag);
1554 return FuncClass(FC_Public | FC_Virtual | VFlag | FC_Far);
// Pops one character from MangledName and maps it to a CallingConv value.
// CallingConv::None is the last result listed.
1563 CallingConv Demangler::demangleCallingConvention(StringView &MangledName) {
1564 switch (MangledName.popFront()) {
1567 return CallingConv::Cdecl;
1570 return CallingConv::Pascal;
1573 return CallingConv::Thiscall;
1576 return CallingConv::Stdcall;
1579 return CallingConv::Fastcall;
1582 return CallingConv::Clrcall;
1585 return CallingConv::Eabi;
1587 return CallingConv::Vectorcall;
1590 return CallingConv::None;
// Pops the storage-class code of a variable and maps it to a StorageClass
// value.  The caller must ensure the next character is a digit (asserted).
// StorageClass::None is the last result listed.
1593 StorageClass Demangler::demangleVariableStorageClass(StringView &MangledName) {
1594 assert(std::isdigit(MangledName.front()));
1596 switch (MangledName.popFront()) {
1598 return StorageClass::PrivateStatic;
1600 return StorageClass::ProtectedStatic;
1602 return StorageClass::PublicStatic;
1604 return StorageClass::Global;
1606 return StorageClass::FunctionLocalStatic;
1609 return StorageClass::None;
// Pops one qualifier code and returns the decoded cv-qualifiers together with
// a flag that is true for the member variants and false for the non-member
// variants.  The last return listed yields (Q_None, false).
1612 std::pair<Qualifiers, bool>
1613 Demangler::demangleQualifiers(StringView &MangledName) {
1615 switch (MangledName.popFront()) {
1616 // Member qualifiers
1618 return std::make_pair(Q_None, true);
1620 return std::make_pair(Q_Const, true);
1622 return std::make_pair(Q_Volatile, true);
1624 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), true);
1625 // Non-Member qualifiers
1627 return std::make_pair(Q_None, false);
1629 return std::make_pair(Q_Const, false);
1631 return std::make_pair(Q_Volatile, false);
1633 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), false);
1636 return std::make_pair(Q_None, false);
1639 // <variable-type> ::= <type> <cvr-qualifiers>
1640 // ::= <type> <pointee-cvr-qualifiers> # pointers, references
// Demangles a type.  QMM controls the leading qualifiers: in Mangle mode they
// are always read, in Result mode only when introduced by '?', and otherwise
// none are read here.  The type itself is then dispatched on its prefix (tag
// type, pointer or member pointer, array, function, custom, primitive) and the
// qualifiers read up front are OR-ed into the resulting node.
1641 TypeNode *Demangler::demangleType(StringView &MangledName,
1642 QualifierMangleMode QMM) {
1643 Qualifiers Quals = Q_None;
1644 bool IsMember = false;
1645 if (QMM == QualifierMangleMode::Mangle) {
1646 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
1647 } else if (QMM == QualifierMangleMode::Result) {
1648 if (MangledName.consumeFront('?'))
1649 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
1652 TypeNode *Ty = nullptr;
1653 if (isTagType(MangledName))
1654 Ty = demangleClassType(MangledName);
1655 else if (isPointerType(MangledName)) {
// isMemberPointer can report a problem through Error.
1656 if (isMemberPointer(MangledName, Error))
1657 Ty = demangleMemberPointerType(MangledName);
1659 Ty = demanglePointerType(MangledName);
1662 } else if (isArrayType(MangledName))
1663 Ty = demangleArrayType(MangledName);
1664 else if (isFunctionType(MangledName)) {
// "$$A8@@" selects a function type that carries this-qualifiers; otherwise the
// prefix is expected to be "$$A6".
1665 if (MangledName.consumeFront("$$A8@@"))
1666 Ty = demangleFunctionType(MangledName, true);
1668 assert(MangledName.startsWith("$$A6"));
1669 MangledName.consumeFront("$$A6");
1670 Ty = demangleFunctionType(MangledName, false);
1672 } else if (isCustomType(MangledName)) {
1673 Ty = demangleCustomType(MangledName);
1675 Ty = demanglePrimitiveType(MangledName);
// Merge the leading qualifiers with whatever the sub-parser already set.
1680 Ty->Quals = Qualifiers(Ty->Quals | Quals);
// Consumes a function's throw specification, which is either "_E" or 'Z'.  The
// result is stored by callers as the signature's IsNoexcept flag.
1684 bool Demangler::demangleThrowSpecification(StringView &MangledName) {
1685 if (MangledName.consumeFront("_E"))
1687 if (MangledName.consumeFront('Z'))
// Demangles a function signature: pointer-ext qualifiers, ref-qualifier and cv
// qualifiers (these belong to member functions, see HasThisQuals), the calling
// convention, the return type (absent for structors, which encode '@'
// instead), the parameter list, and the throw specification.
1694 FunctionSignatureNode *Demangler::demangleFunctionType(StringView &MangledName,
1695 bool HasThisQuals) {
1696 FunctionSignatureNode *FTy = Arena.alloc<FunctionSignatureNode>();
1699 FTy->Quals = demanglePointerExtQualifiers(MangledName);
1700 FTy->RefQualifier = demangleFunctionRefQualifier(MangledName);
// Only the qualifier bits are kept; the member flag of the pair is dropped.
1701 FTy->Quals = Qualifiers(FTy->Quals | demangleQualifiers(MangledName).first);
1704 // Fields that appear on both member and non-member functions.
1705 FTy->CallConvention = demangleCallingConvention(MangledName);
1707 // <return-type> ::= <type>
1708 // ::= @ # structors (they have no declared return type)
1709 bool IsStructor = MangledName.consumeFront('@');
1711 FTy->ReturnType = demangleType(MangledName, QualifierMangleMode::Result);
1713 FTy->Params = demangleFunctionParameterList(MangledName);
1715 FTy->IsNoexcept = demangleThrowSpecification(MangledName);
// Demangles a complete function encoding into a FunctionSymbolNode: an
// optional "$$J0" prefix (adds FC_ExternC), the function class, any thunk
// this-adjust offsets implied by that class, and then the signature.
1720 FunctionSymbolNode *
1721 Demangler::demangleFunctionEncoding(StringView &MangledName) {
1722 FuncClass ExtraFlags = FC_None;
1723 if (MangledName.consumeFront("$$J0"))
1724 ExtraFlags = FC_ExternC;
1726 FuncClass FC = demangleFunctionClass(MangledName);
1727 FC = FuncClass(ExtraFlags | FC);
1729 FunctionSignatureNode *FSN = nullptr;
1730 ThunkSignatureNode *TTN = nullptr;
// Thunks carry adjustment offsets ahead of the signature: a static adjust has
// one offset; a virtual adjust has two, preceded by two more for the Ex form.
1731 if (FC & FC_StaticThisAdjust) {
1732 TTN = Arena.alloc<ThunkSignatureNode>();
1733 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
1734 } else if (FC & FC_VirtualThisAdjust) {
1735 TTN = Arena.alloc<ThunkSignatureNode>();
1736 if (FC & FC_VirtualThisAdjustEx) {
1737 TTN->ThisAdjust.VBPtrOffset = demangleSigned(MangledName);
1738 TTN->ThisAdjust.VBOffsetOffset = demangleSigned(MangledName);
1740 TTN->ThisAdjust.VtordispOffset = demangleSigned(MangledName);
1741 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
1744 if (FC & FC_NoParameterList) {
1745 // This is an extern "C" function whose full signature hasn't been mangled.
1746 // This happens when we need to mangle a local symbol inside of an extern
1748 FSN = Arena.alloc<FunctionSignatureNode>();
// Global and static functions have no this-qualifiers.
1750 bool HasThisQuals = !(FC & (FC_Global | FC_Static));
1751 FSN = demangleFunctionType(MangledName, HasThisQuals);
// Copy the parsed signature into the FunctionSignatureNode base of the thunk
// node.
1754 *static_cast<FunctionSignatureNode *>(TTN) = *FSN;
1757 FSN->FunctionClass = FC;
1759 FunctionSymbolNode *Symbol = Arena.alloc<FunctionSymbolNode>();
1760 Symbol->Signature = FSN;
// Demangles a custom type: a leading '?', an unqualified type name (with its
// second argument set to true), and a terminating '@'.
1764 CustomTypeNode *Demangler::demangleCustomType(StringView &MangledName) {
1765 assert(MangledName.startsWith('?'));
1766 MangledName.popFront();
1768 CustomTypeNode *CTN = Arena.alloc<CustomTypeNode>();
1769 CTN->Identifier = demangleUnqualifiedTypeName(MangledName, true);
// The identifier must be followed by '@'.
1770 if (!MangledName.consumeFront('@'))
1777 // Reads a primitive type.
// "$$T" denotes nullptr_t.  Otherwise one character is popped to select the
// type; one branch pops a second character (after checking that the input is
// not exhausted) to select among bool, the 64-bit integers, wchar_t, char16_t
// and char32_t.
1778 PrimitiveTypeNode *Demangler::demanglePrimitiveType(StringView &MangledName) {
1779 if (MangledName.consumeFront("$$T"))
1780 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Nullptr);
1782 switch (MangledName.popFront()) {
1784 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Void);
1786 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char);
1788 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Schar);
1790 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uchar);
1792 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Short);
1794 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ushort);
1796 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int);
1798 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint);
1800 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Long);
1802 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ulong);
1804 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Float);
1806 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Double);
1808 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ldouble);
// Two-character codes: make sure a second character exists before popping it.
1810 if (MangledName.empty()) {
1814 switch (MangledName.popFront()) {
1816 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Bool);
1818 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int64);
1820 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint64);
1822 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Wchar);
1824 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char16);
1826 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char32);
// Demangles a tag type: one character selects union, struct, class or enum
// (the enum code must be followed by '4'), and a fully qualified type name
// follows.
1835 TagTypeNode *Demangler::demangleClassType(StringView &MangledName) {
1836 TagTypeNode *TT = nullptr;
1838 switch (MangledName.popFront()) {
1840 TT = Arena.alloc<TagTypeNode>(TagKind::Union);
1843 TT = Arena.alloc<TagTypeNode>(TagKind::Struct);
1846 TT = Arena.alloc<TagTypeNode>(TagKind::Class);
// Enums use a two-character code whose second character must be '4'.
1849 if (MangledName.popFront() != '4') {
1853 TT = Arena.alloc<TagTypeNode>(TagKind::Enum);
1859 TT->QualifiedName = demangleFullyQualifiedTypeName(MangledName);
1863 // <pointer-type> ::= E? <pointer-cvr-qualifiers> <ext-qualifiers> <type>
1864 // # the E is required for 64-bit non-static pointers
// Demangles a non-member pointer or reference.  After the pointer's own cv
// qualifiers and affinity, a '6' introduces a function pointee (parsed without
// this-qualifiers); otherwise the ext qualifiers are merged into the pointer
// and the pointee is parsed as a type with its qualifiers mangled.
1865 PointerTypeNode *Demangler::demanglePointerType(StringView &MangledName) {
1866 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
1868 std::tie(Pointer->Quals, Pointer->Affinity) =
1869 demanglePointerCVQualifiers(MangledName);
1871 if (MangledName.consumeFront("6")) {
1872 Pointer->Pointee = demangleFunctionType(MangledName, false);
1876 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
1877 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
1879 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Mangle);
// Demangles a pointer to member.  After the pointer's cv and ext qualifiers,
// an '8' introduces a member function pointer (class name, then a function
// type with this-qualifiers); otherwise it is a data member pointer (pointee
// qualifiers, class name, then the pointee type).
1883 PointerTypeNode *Demangler::demangleMemberPointerType(StringView &MangledName) {
1884 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
1886 std::tie(Pointer->Quals, Pointer->Affinity) =
1887 demanglePointerCVQualifiers(MangledName);
// Member pointers are expected to have pointer affinity.
1888 assert(Pointer->Affinity == PointerAffinity::Pointer);
1890 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
1891 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
1893 if (MangledName.consumeFront("8")) {
1894 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
1895 Pointer->Pointee = demangleFunctionType(MangledName, true);
1897 Qualifiers PointeeQuals = Q_None;
1898 bool IsMember = false;
1899 std::tie(PointeeQuals, IsMember) = demangleQualifiers(MangledName);
1901 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
// The pointee's qualifiers were read before the class name, so the pointee is
// parsed without qualifiers and they are attached afterwards.
// NOTE(review): Pointee is dereferenced right after demangleType with no
// visible null check; if demangleType can fail with nullptr this needs a
// guard -- confirm.
1903 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Drop);
1904 Pointer->Pointee->Quals = PointeeQuals;
// Consumes the optional extended pointer qualifiers, in this fixed order:
// 'E' (Q_Pointer64), 'I' (Q_Restrict), 'F' (Q_Unaligned).  Each one found is
// OR-ed into the accumulated set.
1910 Qualifiers Demangler::demanglePointerExtQualifiers(StringView &MangledName) {
1911 Qualifiers Quals = Q_None;
1912 if (MangledName.consumeFront('E'))
1913 Quals = Qualifiers(Quals | Q_Pointer64);
1914 if (MangledName.consumeFront('I'))
1915 Quals = Qualifiers(Quals | Q_Restrict);
1916 if (MangledName.consumeFront('F'))
1917 Quals = Qualifiers(Quals | Q_Unaligned);
// Demangles an array type: 'Y', the rank, one number per dimension, an
// optional "$$C" followed by element qualifiers, and the element type.  A
// negative or zero rank is handled as a special case before any dimension is
// read.
1922 ArrayTypeNode *Demangler::demangleArrayType(StringView &MangledName) {
1923 assert(MangledName.front() == 'Y');
1924 MangledName.popFront();
1927 bool IsNegative = false;
1928 std::tie(Rank, IsNegative) = demangleNumber(MangledName);
1929 if (IsNegative || Rank == 0) {
1934 ArrayTypeNode *ATy = Arena.alloc<ArrayTypeNode>();
// The dimensions are collected in a linked list and converted to an array
// once all Rank of them have been read.
1935 NodeList *Head = Arena.alloc<NodeList>();
1936 NodeList *Tail = Head;
1938 for (uint64_t I = 0; I < Rank; ++I) {
1940 std::tie(D, IsNegative) = demangleNumber(MangledName);
1945 Tail->N = Arena.alloc<IntegerLiteralNode>(D, IsNegative);
1947 Tail->Next = Arena.alloc<NodeList>();
1951 ATy->Dimensions = nodeListToNodeArray(Arena, Head, Rank);
// "$$C" introduces qualifiers that apply to the array.
1953 if (MangledName.consumeFront("$$C")) {
1954 bool IsMember = false;
1955 std::tie(ATy->Quals, IsMember) = demangleQualifiers(MangledName);
1962 ATy->ElementType = demangleType(MangledName, QualifierMangleMode::Drop);
1966 // Reads a function or a template parameters.
// Parses a function's parameter types until '@' or 'Z'.  A single digit is a
// back-reference into Backrefs.FunctionParams; any other parameter is parsed
// as a type and, if it took more than one character, remembered for later
// back-references.
1968 Demangler::demangleFunctionParameterList(StringView &MangledName) {
1969 // Empty parameter list.
1970 if (MangledName.consumeFront('X'))
1973 NodeList *Head = Arena.alloc<NodeList>();
1974 NodeList **Current = &Head;
1976 while (!Error && !MangledName.startsWith('@') &&
1977 !MangledName.startsWith('Z')) {
1980 if (startsWithDigit(MangledName)) {
// Back-reference: the digit is an index into the remembered parameter types
// and must refer to an entry that already exists.
1981 size_t N = MangledName[0] - '0';
1982 if (N >= Backrefs.FunctionParamCount) {
1986 MangledName = MangledName.dropFront();
1988 *Current = Arena.alloc<NodeList>();
1989 (*Current)->N = Backrefs.FunctionParams[N];
1990 Current = &(*Current)->Next;
// Remember the input length so the number of consumed characters can be
// computed after the type has been parsed.
1994 size_t OldSize = MangledName.size();
1996 *Current = Arena.alloc<NodeList>();
1997 TypeNode *TN = demangleType(MangledName, QualifierMangleMode::Drop);
2003 size_t CharsConsumed = OldSize - MangledName.size();
2004 assert(CharsConsumed != 0);
2006 // Single-letter types are ignored for backreferences because memorizing
2007 // them doesn't save anything.
// A type is only recorded while FunctionParamCount is at most 9.
2008 if (Backrefs.FunctionParamCount <= 9 && CharsConsumed > 1)
2009 Backrefs.FunctionParams[Backrefs.FunctionParamCount++] = TN;
2011 Current = &(*Current)->Next;
2017 NodeArrayNode *NA = nodeListToNodeArray(Arena, Head, Count);
2018 // A non-empty parameter list is terminated by either 'Z' (variadic) parameter
2019 // list or '@' (non variadic). Careful not to consume "@Z", as in that case
2020 // the following Z could be a throw specifier.
2021 if (MangledName.consumeFront('@'))
2024 if (MangledName.consumeFront('Z')) {
2025 // This is a variadic parameter list. We probably need a variadic node to
2026 // append to the end.
// Parses a template argument list up to the terminating '@'.  Each argument is
// classified by its prefix: pack separators ("$S", "$$V", "$$$V", "$$Z"), a
// fully qualified type name ("$$Y"), a type without ("$$B") or with ("$$C")
// qualifiers, a pointer to member ("$1", "$H", "$I", "$J"), a reference to a
// symbol ("$E?"), a data member pointer ("$F", "$G"), an integral constant
// ("$0"), or otherwise a plain type.
2035 Demangler::demangleTemplateParameterList(StringView &MangledName) {
2037 NodeList **Current = &Head;
2040 while (!Error && !MangledName.startsWith('@')) {
2041 if (MangledName.consumeFront("$S") || MangledName.consumeFront("$$V") ||
2042 MangledName.consumeFront("$$$V") || MangledName.consumeFront("$$Z")) {
2043 // parameter pack separator
2049 // Template parameter lists don't participate in back-referencing.
2050 *Current = Arena.alloc<NodeList>();
2052 NodeList &TP = **Current;
2054 TemplateParameterReferenceNode *TPRN = nullptr;
2055 if (MangledName.consumeFront("$$Y")) {
2057 TP.N = demangleFullyQualifiedTypeName(MangledName);
2058 } else if (MangledName.consumeFront("$$B")) {
2060 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
2061 } else if (MangledName.consumeFront("$$C")) {
2062 // Type has qualifiers.
2063 TP.N = demangleType(MangledName, QualifierMangleMode::Mangle);
2064 } else if (MangledName.startsWith("$1") || MangledName.startsWith("$H") ||
2065 MangledName.startsWith("$I") || MangledName.startsWith("$J")) {
2066 // Pointer to member
2067 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2068 TPRN->IsMemberPointer = true;
// Drop the '$'; the character after it is the inheritance specifier.
2070 MangledName = MangledName.dropFront();
2071 // 1 - single inheritance <name>
2072 // H - multiple inheritance <name> <number>
2073 // I - virtual inheritance <name> <number> <number> <number>
2074 // J - unspecified inheritance <name> <number> <number> <number>
2075 char InheritanceSpecifier = MangledName.popFront();
2076 SymbolNode *S = nullptr;
2077 if (MangledName.startsWith('?')) {
// NOTE(review): the result of parse() is dereferenced on the next line with no
// visible check of Error or of S / S->Name being null -- confirm that parse
// cannot fail here, or add a guard.
2078 S = parse(MangledName);
2079 memorizeIdentifier(S->Name->getUnqualifiedIdentifier());
// The inheritance model determines how many thunk offsets follow.
2082 switch (InheritanceSpecifier) {
2084 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2085 demangleSigned(MangledName);
2088 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2089 demangleSigned(MangledName);
2092 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2093 demangleSigned(MangledName);
2101 TPRN->Affinity = PointerAffinity::Pointer;
2103 } else if (MangledName.startsWith("$E?")) {
// Only "$E" is consumed; the '?' is the start of the referenced symbol.
2104 MangledName.consumeFront("$E");
2105 // Reference to symbol
2106 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2107 TPRN->Symbol = parse(MangledName);
2108 TPRN->Affinity = PointerAffinity::Reference;
2109 } else if (MangledName.startsWith("$F") || MangledName.startsWith("$G")) {
2110 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2112 // Data member pointer.
2113 MangledName = MangledName.dropFront();
2114 char InheritanceSpecifier = MangledName.popFront();
2116 switch (InheritanceSpecifier) {
2118 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2119 demangleSigned(MangledName);
2122 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2123 demangleSigned(MangledName);
2124 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2125 demangleSigned(MangledName);
2133 TPRN->IsMemberPointer = true;
2135 } else if (MangledName.consumeFront("$0")) {
2136 // Integral non-type template parameter
2137 bool IsNegative = false;
2139 std::tie(Value, IsNegative) = demangleNumber(MangledName);
2141 TP.N = Arena.alloc<IntegerLiteralNode>(Value, IsNegative);
// Anything else is an ordinary type argument.
2143 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
2154 // Template parameter lists cannot be variadic, so it can only be terminated
2156 if (MangledName.consumeFront('@'))
2157 return nodeListToNodeArray(Arena, Head, Count);
// Debugging aid: prints the recorded function-parameter back-references
// (rendered through a temporary output stream) followed by the recorded name
// back-references, using std::printf.
2162 void Demangler::dumpBackReferences() {
2163 std::printf("%d function parameter backreferences\n",
2164 (int)Backrefs.FunctionParamCount);
2166 // Create an output stream so we can render each type.
2168 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
2170 for (size_t I = 0; I < Backrefs.FunctionParamCount; ++I) {
// Rewind the stream so each type is rendered from the start of the buffer.
2171 OS.setCurrentPosition(0);
2173 TypeNode *T = Backrefs.FunctionParams[I];
2174 T->output(OS, OF_Default);
// "%.*s" prints exactly the number of characters written to the stream.
2176 std::printf(" [%d] - %.*s\n", (int)I, (int)OS.getCurrentPosition(),
2179 std::free(OS.getBuffer());
2181 if (Backrefs.FunctionParamCount > 0)
2183 std::printf("%d name backreferences\n", (int)Backrefs.NamesCount);
2184 for (size_t I = 0; I < Backrefs.NamesCount; ++I) {
2185 std::printf(" [%d] - %.*s\n", (int)I, (int)Backrefs.Names[I]->Name.size(),
2186 Backrefs.Names[I]->Name.begin());
2188 if (Backrefs.NamesCount > 0)
// Public entry point: demangles the MSVC-mangled name MangledName.
//
// Buf and N are handed to initializeOutputStream as the initial output buffer
// and its size; on success the rendered text's buffer is returned and *N
// receives the stream's final position.  *Status is set to demangle_success,
// demangle_invalid_mangled_name or demangle_memory_alloc_failure.  Returns
// nullptr on any failure.  MSDF_DumpBackrefs in Flags additionally prints the
// back-reference tables after parsing.
2192 char *llvm::microsoftDemangle(const char *MangledName, char *Buf, size_t *N,
2193 int *Status, MSDemangleFlags Flags) {
2194 int InternalStatus = demangle_success;
2198 StringView Name{MangledName};
2199 SymbolNode *AST = D.parse(Name);
2201 if (Flags & MSDF_DumpBackrefs)
2202 D.dumpBackReferences();
2205 InternalStatus = demangle_invalid_mangled_name;
2206 else if (!initializeOutputStream(Buf, N, S, 1024))
2207 InternalStatus = demangle_memory_alloc_failure;
2209 AST->output(S, OF_Default);
2212 *N = S.getCurrentPosition();
// The stream may have a different buffer than the one passed in, so report
// the stream's buffer.
2213 Buf = S.getBuffer();
2217 *Status = InternalStatus;
2218 return InternalStatus == demangle_success ? Buf : nullptr;