blob: e596f0cea1c8e659a78083b9c0cbcbb21a4e245f [file] [log] [blame]
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001//===- MicrosoftDemangle.cpp ----------------------------------------------===//
2//
Chandler Carruth57b08b02019-01-19 10:56:40 +00003// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
Zachary Turnerf435a7e2018-07-20 17:27:48 +00006//
7//===----------------------------------------------------------------------===//
8//
9// This file defines a demangler for MSVC-style mangled symbols.
10//
11// This file has no dependencies on the rest of LLVM so that it can be
12// easily reused in other programs such as libcxxabi.
13//
14//===----------------------------------------------------------------------===//
15
Zachary Turner7ba90562018-11-01 15:07:32 +000016#include "llvm/Demangle/MicrosoftDemangle.h"
Zachary Turnerf435a7e2018-07-20 17:27:48 +000017#include "llvm/Demangle/Demangle.h"
Zachary Turner7ba90562018-11-01 15:07:32 +000018#include "llvm/Demangle/MicrosoftDemangleNodes.h"
Zachary Turnerf435a7e2018-07-20 17:27:48 +000019
Erik Pilkington5094e5e2019-01-17 20:37:51 +000020#include "llvm/Demangle/DemangleConfig.h"
Richard Smith8a57f2e2018-08-20 19:44:01 +000021#include "llvm/Demangle/StringView.h"
22#include "llvm/Demangle/Utility.h"
Zachary Turnerf435a7e2018-07-20 17:27:48 +000023
Zachary Turner66555a72018-08-20 19:15:35 +000024#include <array>
Zachary Turnerf435a7e2018-07-20 17:27:48 +000025#include <cctype>
Zachary Turner5ae08b82018-08-01 18:44:12 +000026#include <cstdio>
Zachary Turnerd742d642018-07-26 19:56:09 +000027#include <tuple>
Zachary Turnerf435a7e2018-07-20 17:27:48 +000028
Zachary Turner03312862018-08-27 03:48:03 +000029using namespace llvm;
30using namespace ms_demangle;
Zachary Turnerf435a7e2018-07-20 17:27:48 +000031
32static bool startsWithDigit(StringView S) {
33 return !S.empty() && std::isdigit(S.front());
34}
35
Zachary Turnerd742d642018-07-26 19:56:09 +000036
Zachary Turner03312862018-08-27 03:48:03 +000037struct NodeList {
38 Node *N = nullptr;
39 NodeList *Next = nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +000040};
41
Zachary Turner8fb9a712018-12-14 18:10:13 +000042static bool isMemberPointer(StringView MangledName, bool &Error) {
43 Error = false;
Zachary Turnerd742d642018-07-26 19:56:09 +000044 switch (MangledName.popFront()) {
Zachary Turner931e8792018-07-30 23:02:10 +000045 case '$':
46 // This is probably an rvalue reference (e.g. $$Q), and you cannot have an
47 // rvalue reference to a member.
48 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +000049 case 'A':
50 // 'A' indicates a reference, and you cannot have a reference to a member
Zachary Turner931e8792018-07-30 23:02:10 +000051 // function or member.
Zachary Turnerd742d642018-07-26 19:56:09 +000052 return false;
53 case 'P':
54 case 'Q':
55 case 'R':
56 case 'S':
57 // These 4 values indicate some kind of pointer, but we still don't know
58 // what.
59 break;
60 default:
Zachary Turner8fb9a712018-12-14 18:10:13 +000061 Error = true;
62 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +000063 }
64
65 // If it starts with a number, then 6 indicates a non-member function
66 // pointer, and 8 indicates a member function pointer.
67 if (startsWithDigit(MangledName)) {
Nico Weber63b97d22019-04-08 19:46:53 +000068 if (MangledName[0] != '6' && MangledName[0] != '8') {
69 Error = true;
70 return false;
71 }
Zachary Turnerd742d642018-07-26 19:56:09 +000072 return (MangledName[0] == '8');
73 }
74
75 // Remove ext qualifiers since those can appear on either type and are
76 // therefore not indicative.
77 MangledName.consumeFront('E'); // 64-bit
78 MangledName.consumeFront('I'); // restrict
79 MangledName.consumeFront('F'); // unaligned
80
Nico Weber63b97d22019-04-08 19:46:53 +000081 if (MangledName.empty()) {
82 Error = true;
83 return false;
84 }
Zachary Turnerd742d642018-07-26 19:56:09 +000085
86 // The next value should be either ABCD (non-member) or QRST (member).
87 switch (MangledName.front()) {
88 case 'A':
89 case 'B':
90 case 'C':
91 case 'D':
92 return false;
93 case 'Q':
94 case 'R':
95 case 'S':
96 case 'T':
97 return true;
98 default:
Zachary Turner8fb9a712018-12-14 18:10:13 +000099 Error = true;
100 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +0000101 }
Zachary Turnerd742d642018-07-26 19:56:09 +0000102}
103
Zachary Turner03312862018-08-27 03:48:03 +0000104static SpecialIntrinsicKind
105consumeSpecialIntrinsicKind(StringView &MangledName) {
106 if (MangledName.consumeFront("?_7"))
107 return SpecialIntrinsicKind::Vftable;
108 if (MangledName.consumeFront("?_8"))
109 return SpecialIntrinsicKind::Vbtable;
110 if (MangledName.consumeFront("?_9"))
111 return SpecialIntrinsicKind::VcallThunk;
112 if (MangledName.consumeFront("?_A"))
113 return SpecialIntrinsicKind::Typeof;
114 if (MangledName.consumeFront("?_B"))
115 return SpecialIntrinsicKind::LocalStaticGuard;
116 if (MangledName.consumeFront("?_C"))
117 return SpecialIntrinsicKind::StringLiteralSymbol;
118 if (MangledName.consumeFront("?_P"))
119 return SpecialIntrinsicKind::UdtReturning;
120 if (MangledName.consumeFront("?_R0"))
121 return SpecialIntrinsicKind::RttiTypeDescriptor;
122 if (MangledName.consumeFront("?_R1"))
123 return SpecialIntrinsicKind::RttiBaseClassDescriptor;
124 if (MangledName.consumeFront("?_R2"))
125 return SpecialIntrinsicKind::RttiBaseClassArray;
126 if (MangledName.consumeFront("?_R3"))
127 return SpecialIntrinsicKind::RttiClassHierarchyDescriptor;
128 if (MangledName.consumeFront("?_R4"))
129 return SpecialIntrinsicKind::RttiCompleteObjLocator;
130 if (MangledName.consumeFront("?_S"))
131 return SpecialIntrinsicKind::LocalVftable;
132 if (MangledName.consumeFront("?__E"))
133 return SpecialIntrinsicKind::DynamicInitializer;
134 if (MangledName.consumeFront("?__F"))
135 return SpecialIntrinsicKind::DynamicAtexitDestructor;
136 if (MangledName.consumeFront("?__J"))
137 return SpecialIntrinsicKind::LocalStaticThreadGuard;
138 return SpecialIntrinsicKind::None;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000139}
140
Zachary Turner71c91f92018-07-30 03:12:34 +0000141static bool startsWithLocalScopePattern(StringView S) {
142 if (!S.consumeFront('?'))
143 return false;
144 if (S.size() < 2)
145 return false;
146
147 size_t End = S.find('?');
148 if (End == StringView::npos)
149 return false;
150 StringView Candidate = S.substr(0, End);
151 if (Candidate.empty())
152 return false;
153
154 // \?[0-9]\?
155 // ?@? is the discriminator 0.
156 if (Candidate.size() == 1)
157 return Candidate[0] == '@' || (Candidate[0] >= '0' && Candidate[0] <= '9');
158
159 // If it's not 0-9, then it's an encoded number terminated with an @
160 if (Candidate.back() != '@')
161 return false;
162 Candidate = Candidate.dropBack();
163
164 // An encoded number starts with B-P and all subsequent digits are in A-P.
165 // Note that the reason the first digit cannot be A is two fold. First, it
166 // would create an ambiguity with ?A which delimits the beginning of an
167 // anonymous namespace. Second, A represents 0, and you don't start a multi
168 // digit number with a leading 0. Presumably the anonymous namespace
169 // ambiguity is also why single digit encoded numbers use 0-9 rather than A-J.
170 if (Candidate[0] < 'B' || Candidate[0] > 'P')
171 return false;
172 Candidate = Candidate.dropFront();
173 while (!Candidate.empty()) {
174 if (Candidate[0] < 'A' || Candidate[0] > 'P')
175 return false;
176 Candidate = Candidate.dropFront();
177 }
178
179 return true;
180}
181
Zachary Turner03312862018-08-27 03:48:03 +0000182static bool isTagType(StringView S) {
183 switch (S.front()) {
184 case 'T': // union
185 case 'U': // struct
186 case 'V': // class
187 case 'W': // enum
188 return true;
Zachary Turner38b78a72018-07-26 20:20:10 +0000189 }
Zachary Turner03312862018-08-27 03:48:03 +0000190 return false;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000191}
192
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000193static bool isCustomType(StringView S) { return S[0] == '?'; }
194
Zachary Turner03312862018-08-27 03:48:03 +0000195static bool isPointerType(StringView S) {
196 if (S.startsWith("$$Q")) // foo &&
197 return true;
198
199 switch (S.front()) {
200 case 'A': // foo &
201 case 'P': // foo *
202 case 'Q': // foo *const
203 case 'R': // foo *volatile
204 case 'S': // foo *const volatile
205 return true;
206 }
207 return false;
208}
209
210static bool isArrayType(StringView S) { return S[0] == 'Y'; }
211
212static bool isFunctionType(StringView S) {
213 return S.startsWith("$$A8@@") || S.startsWith("$$A6");
214}
215
216static FunctionRefQualifier
217demangleFunctionRefQualifier(StringView &MangledName) {
218 if (MangledName.consumeFront('G'))
219 return FunctionRefQualifier::Reference;
220 else if (MangledName.consumeFront('H'))
221 return FunctionRefQualifier::RValueReference;
222 return FunctionRefQualifier::None;
223}
224
225static std::pair<Qualifiers, PointerAffinity>
226demanglePointerCVQualifiers(StringView &MangledName) {
227 if (MangledName.consumeFront("$$Q"))
228 return std::make_pair(Q_None, PointerAffinity::RValueReference);
229
230 switch (MangledName.popFront()) {
231 case 'A':
232 return std::make_pair(Q_None, PointerAffinity::Reference);
233 case 'P':
234 return std::make_pair(Q_None, PointerAffinity::Pointer);
235 case 'Q':
236 return std::make_pair(Q_Const, PointerAffinity::Pointer);
237 case 'R':
238 return std::make_pair(Q_Volatile, PointerAffinity::Pointer);
239 case 'S':
240 return std::make_pair(Qualifiers(Q_Const | Q_Volatile),
241 PointerAffinity::Pointer);
Zachary Turner970fdc32018-08-16 16:17:36 +0000242 default:
Zachary Turner03312862018-08-27 03:48:03 +0000243 assert(false && "Ty is not a pointer type!");
Zachary Turner970fdc32018-08-16 16:17:36 +0000244 }
Zachary Turner03312862018-08-27 03:48:03 +0000245 return std::make_pair(Q_None, PointerAffinity::Pointer);
Zachary Turner970fdc32018-08-16 16:17:36 +0000246}
247
Zachary Turner71c91f92018-07-30 03:12:34 +0000248StringView Demangler::copyString(StringView Borrowed) {
249 char *Stable = Arena.allocUnalignedBuffer(Borrowed.size() + 1);
250 std::strcpy(Stable, Borrowed.begin());
251
252 return {Stable, Borrowed.size()};
253}
254
Zachary Turner03312862018-08-27 03:48:03 +0000255SpecialTableSymbolNode *
256Demangler::demangleSpecialTableSymbolNode(StringView &MangledName,
257 SpecialIntrinsicKind K) {
258 NamedIdentifierNode *NI = Arena.alloc<NamedIdentifierNode>();
259 switch (K) {
260 case SpecialIntrinsicKind::Vftable:
261 NI->Name = "`vftable'";
262 break;
263 case SpecialIntrinsicKind::Vbtable:
264 NI->Name = "`vbtable'";
265 break;
266 case SpecialIntrinsicKind::LocalVftable:
267 NI->Name = "`local vftable'";
268 break;
269 case SpecialIntrinsicKind::RttiCompleteObjLocator:
270 NI->Name = "`RTTI Complete Object Locator'";
271 break;
272 default:
Erik Pilkington5094e5e2019-01-17 20:37:51 +0000273 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000274 }
275 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
276 SpecialTableSymbolNode *STSN = Arena.alloc<SpecialTableSymbolNode>();
277 STSN->Name = QN;
Zachary Turner469f0762018-08-17 21:18:05 +0000278 bool IsMember = false;
Nico Weberae050d22019-04-14 23:32:37 +0000279 if (MangledName.empty()) {
280 Error = true;
281 return nullptr;
282 }
Zachary Turner03312862018-08-27 03:48:03 +0000283 char Front = MangledName.popFront();
284 if (Front != '6' && Front != '7') {
285 Error = true;
286 return nullptr;
287 }
288
289 std::tie(STSN->Quals, IsMember) = demangleQualifiers(MangledName);
290 if (!MangledName.consumeFront('@'))
291 STSN->TargetName = demangleFullyQualifiedTypeName(MangledName);
292 return STSN;
293}
294
295LocalStaticGuardVariableNode *
296Demangler::demangleLocalStaticGuard(StringView &MangledName) {
297 LocalStaticGuardIdentifierNode *LSGI =
298 Arena.alloc<LocalStaticGuardIdentifierNode>();
299 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, LSGI);
300 LocalStaticGuardVariableNode *LSGVN =
301 Arena.alloc<LocalStaticGuardVariableNode>();
302 LSGVN->Name = QN;
303
304 if (MangledName.consumeFront("4IA"))
305 LSGVN->IsVisible = false;
306 else if (MangledName.consumeFront("5"))
307 LSGVN->IsVisible = true;
308 else {
309 Error = true;
310 return nullptr;
311 }
312
313 if (!MangledName.empty())
314 LSGI->ScopeIndex = demangleUnsigned(MangledName);
315 return LSGVN;
316}
317
318static NamedIdentifierNode *synthesizeNamedIdentifier(ArenaAllocator &Arena,
319 StringView Name) {
320 NamedIdentifierNode *Id = Arena.alloc<NamedIdentifierNode>();
321 Id->Name = Name;
322 return Id;
323}
324
325static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
326 IdentifierNode *Identifier) {
327 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
328 QN->Components = Arena.alloc<NodeArrayNode>();
329 QN->Components->Count = 1;
330 QN->Components->Nodes = Arena.allocArray<Node *>(1);
331 QN->Components->Nodes[0] = Identifier;
332 return QN;
333}
334
335static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
336 StringView Name) {
337 NamedIdentifierNode *Id = synthesizeNamedIdentifier(Arena, Name);
338 return synthesizeQualifiedName(Arena, Id);
339}
340
341static VariableSymbolNode *synthesizeVariable(ArenaAllocator &Arena,
342 TypeNode *Type,
343 StringView VariableName) {
344 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
345 VSN->Type = Type;
346 VSN->Name = synthesizeQualifiedName(Arena, VariableName);
347 return VSN;
348}
349
350VariableSymbolNode *Demangler::demangleUntypedVariable(
351 ArenaAllocator &Arena, StringView &MangledName, StringView VariableName) {
352 NamedIdentifierNode *NI = synthesizeNamedIdentifier(Arena, VariableName);
353 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
354 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
355 VSN->Name = QN;
356 if (MangledName.consumeFront("8"))
357 return VSN;
358
359 Error = true;
360 return nullptr;
361}
362
363VariableSymbolNode *
364Demangler::demangleRttiBaseClassDescriptorNode(ArenaAllocator &Arena,
365 StringView &MangledName) {
366 RttiBaseClassDescriptorNode *RBCDN =
367 Arena.alloc<RttiBaseClassDescriptorNode>();
368 RBCDN->NVOffset = demangleUnsigned(MangledName);
369 RBCDN->VBPtrOffset = demangleSigned(MangledName);
370 RBCDN->VBTableOffset = demangleUnsigned(MangledName);
371 RBCDN->Flags = demangleUnsigned(MangledName);
372 if (Error)
373 return nullptr;
374
375 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
376 VSN->Name = demangleNameScopeChain(MangledName, RBCDN);
377 MangledName.consumeFront('8');
378 return VSN;
379}
380
Zachary Turner32a8a202018-08-29 23:56:09 +0000381FunctionSymbolNode *Demangler::demangleInitFiniStub(StringView &MangledName,
382 bool IsDestructor) {
Zachary Turner03312862018-08-27 03:48:03 +0000383 DynamicStructorIdentifierNode *DSIN =
384 Arena.alloc<DynamicStructorIdentifierNode>();
385 DSIN->IsDestructor = IsDestructor;
Zachary Turner32a8a202018-08-29 23:56:09 +0000386
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000387 bool IsKnownStaticDataMember = false;
388 if (MangledName.consumeFront('?'))
389 IsKnownStaticDataMember = true;
390
Nico Weber63b97d22019-04-08 19:46:53 +0000391 SymbolNode *Symbol = demangleDeclarator(MangledName);
392 if (Error)
393 return nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +0000394
Zachary Turner32a8a202018-08-29 23:56:09 +0000395 FunctionSymbolNode *FSN = nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +0000396
397 if (Symbol->kind() == NodeKind::VariableSymbol) {
398 DSIN->Variable = static_cast<VariableSymbolNode *>(Symbol);
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000399
400 // Older versions of clang mangled this type of symbol incorrectly. They
401 // would omit the leading ? and they would only emit a single @ at the end.
402 // The correct mangling is a leading ? and 2 trailing @ signs. Handle
403 // both cases.
404 int AtCount = IsKnownStaticDataMember ? 2 : 1;
405 for (int I = 0; I < AtCount; ++I) {
406 if (MangledName.consumeFront('@'))
407 continue;
Zachary Turner32a8a202018-08-29 23:56:09 +0000408 Error = true;
409 return nullptr;
410 }
411
412 FSN = demangleFunctionEncoding(MangledName);
Nico Weber63b97d22019-04-08 19:46:53 +0000413 if (FSN)
414 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
Zachary Turner32a8a202018-08-29 23:56:09 +0000415 } else {
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000416 if (IsKnownStaticDataMember) {
417 // This was supposed to be a static data member, but we got a function.
418 Error = true;
419 return nullptr;
420 }
421
Zachary Turner32a8a202018-08-29 23:56:09 +0000422 FSN = static_cast<FunctionSymbolNode *>(Symbol);
423 DSIN->Name = Symbol->Name;
424 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
425 }
426
Zachary Turner03312862018-08-27 03:48:03 +0000427 return FSN;
428}
429
430SymbolNode *Demangler::demangleSpecialIntrinsic(StringView &MangledName) {
431 SpecialIntrinsicKind SIK = consumeSpecialIntrinsicKind(MangledName);
432 if (SIK == SpecialIntrinsicKind::None)
433 return nullptr;
434
435 switch (SIK) {
436 case SpecialIntrinsicKind::StringLiteralSymbol:
437 return demangleStringLiteral(MangledName);
438 case SpecialIntrinsicKind::Vftable:
439 case SpecialIntrinsicKind::Vbtable:
440 case SpecialIntrinsicKind::LocalVftable:
441 case SpecialIntrinsicKind::RttiCompleteObjLocator:
442 return demangleSpecialTableSymbolNode(MangledName, SIK);
443 case SpecialIntrinsicKind::VcallThunk:
444 return demangleVcallThunkNode(MangledName);
445 case SpecialIntrinsicKind::LocalStaticGuard:
446 return demangleLocalStaticGuard(MangledName);
447 case SpecialIntrinsicKind::RttiTypeDescriptor: {
448 TypeNode *T = demangleType(MangledName, QualifierMangleMode::Result);
Zachary Turner469f0762018-08-17 21:18:05 +0000449 if (Error)
450 break;
451 if (!MangledName.consumeFront("@8"))
Zachary Turner03312862018-08-27 03:48:03 +0000452 break;
Zachary Turner469f0762018-08-17 21:18:05 +0000453 if (!MangledName.empty())
Zachary Turner03312862018-08-27 03:48:03 +0000454 break;
455 return synthesizeVariable(Arena, T, "`RTTI Type Descriptor'");
456 }
457 case SpecialIntrinsicKind::RttiBaseClassArray:
458 return demangleUntypedVariable(Arena, MangledName,
459 "`RTTI Base Class Array'");
460 case SpecialIntrinsicKind::RttiClassHierarchyDescriptor:
461 return demangleUntypedVariable(Arena, MangledName,
462 "`RTTI Class Hierarchy Descriptor'");
463 case SpecialIntrinsicKind::RttiBaseClassDescriptor:
464 return demangleRttiBaseClassDescriptorNode(Arena, MangledName);
465 case SpecialIntrinsicKind::DynamicInitializer:
Zachary Turner32a8a202018-08-29 23:56:09 +0000466 return demangleInitFiniStub(MangledName, false);
Zachary Turner03312862018-08-27 03:48:03 +0000467 case SpecialIntrinsicKind::DynamicAtexitDestructor:
Zachary Turner32a8a202018-08-29 23:56:09 +0000468 return demangleInitFiniStub(MangledName, true);
Zachary Turner469f0762018-08-17 21:18:05 +0000469 default:
Zachary Turner469f0762018-08-17 21:18:05 +0000470 break;
471 }
Zachary Turner03312862018-08-27 03:48:03 +0000472 Error = true;
473 return nullptr;
Zachary Turner469f0762018-08-17 21:18:05 +0000474}
475
Zachary Turner03312862018-08-27 03:48:03 +0000476IdentifierNode *
477Demangler::demangleFunctionIdentifierCode(StringView &MangledName) {
478 assert(MangledName.startsWith('?'));
479 MangledName = MangledName.dropFront();
Nico Weber321de482019-04-03 23:19:39 +0000480 if (MangledName.empty()) {
481 Error = true;
482 return nullptr;
483 }
Zachary Turner03312862018-08-27 03:48:03 +0000484
485 if (MangledName.consumeFront("__"))
486 return demangleFunctionIdentifierCode(
487 MangledName, FunctionIdentifierCodeGroup::DoubleUnder);
Nico Weberb4f33bb2019-04-11 22:47:18 +0000488 if (MangledName.consumeFront("_"))
Zachary Turner03312862018-08-27 03:48:03 +0000489 return demangleFunctionIdentifierCode(MangledName,
490 FunctionIdentifierCodeGroup::Under);
491 return demangleFunctionIdentifierCode(MangledName,
492 FunctionIdentifierCodeGroup::Basic);
493}
494
495StructorIdentifierNode *
496Demangler::demangleStructorIdentifier(StringView &MangledName,
497 bool IsDestructor) {
498 StructorIdentifierNode *N = Arena.alloc<StructorIdentifierNode>();
499 N->IsDestructor = IsDestructor;
500 return N;
501}
502
503ConversionOperatorIdentifierNode *
504Demangler::demangleConversionOperatorIdentifier(StringView &MangledName) {
505 ConversionOperatorIdentifierNode *N =
506 Arena.alloc<ConversionOperatorIdentifierNode>();
507 return N;
508}
509
510LiteralOperatorIdentifierNode *
511Demangler::demangleLiteralOperatorIdentifier(StringView &MangledName) {
512 LiteralOperatorIdentifierNode *N =
513 Arena.alloc<LiteralOperatorIdentifierNode>();
Nico Weberaf2ee7d2019-04-11 23:20:18 +0000514 N->Name = demangleSimpleString(MangledName, /*Memorize=*/false);
Zachary Turner03312862018-08-27 03:48:03 +0000515 return N;
516}
517
Nico Weber03db6252019-04-11 23:11:33 +0000518IntrinsicFunctionKind
519Demangler::translateIntrinsicFunctionCode(char CH,
520 FunctionIdentifierCodeGroup Group) {
521 using IFK = IntrinsicFunctionKind;
522 if (!(CH >= '0' && CH <= '9') && !(CH >= 'A' && CH <= 'Z')) {
523 Error = true;
524 return IFK::None;
525 }
526
Zachary Turner03312862018-08-27 03:48:03 +0000527 // Not all ? identifiers are intrinsics *functions*. This function only maps
528 // operator codes for the special functions, all others are handled elsewhere,
529 // hence the IFK::None entries in the table.
Zachary Turner03312862018-08-27 03:48:03 +0000530 static IFK Basic[36] = {
531 IFK::None, // ?0 # Foo::Foo()
532 IFK::None, // ?1 # Foo::~Foo()
533 IFK::New, // ?2 # operator new
534 IFK::Delete, // ?3 # operator delete
535 IFK::Assign, // ?4 # operator=
536 IFK::RightShift, // ?5 # operator>>
537 IFK::LeftShift, // ?6 # operator<<
538 IFK::LogicalNot, // ?7 # operator!
539 IFK::Equals, // ?8 # operator==
540 IFK::NotEquals, // ?9 # operator!=
541 IFK::ArraySubscript, // ?A # operator[]
542 IFK::None, // ?B # Foo::operator <type>()
543 IFK::Pointer, // ?C # operator->
544 IFK::Dereference, // ?D # operator*
545 IFK::Increment, // ?E # operator++
546 IFK::Decrement, // ?F # operator--
547 IFK::Minus, // ?G # operator-
548 IFK::Plus, // ?H # operator+
549 IFK::BitwiseAnd, // ?I # operator&
550 IFK::MemberPointer, // ?J # operator->*
551 IFK::Divide, // ?K # operator/
552 IFK::Modulus, // ?L # operator%
553 IFK::LessThan, // ?M operator<
554 IFK::LessThanEqual, // ?N operator<=
555 IFK::GreaterThan, // ?O operator>
556 IFK::GreaterThanEqual, // ?P operator>=
557 IFK::Comma, // ?Q operator,
558 IFK::Parens, // ?R operator()
559 IFK::BitwiseNot, // ?S operator~
560 IFK::BitwiseXor, // ?T operator^
561 IFK::BitwiseOr, // ?U operator|
562 IFK::LogicalAnd, // ?V operator&&
563 IFK::LogicalOr, // ?W operator||
564 IFK::TimesEqual, // ?X operator*=
565 IFK::PlusEqual, // ?Y operator+=
566 IFK::MinusEqual, // ?Z operator-=
567 };
568 static IFK Under[36] = {
569 IFK::DivEqual, // ?_0 operator/=
570 IFK::ModEqual, // ?_1 operator%=
571 IFK::RshEqual, // ?_2 operator>>=
572 IFK::LshEqual, // ?_3 operator<<=
573 IFK::BitwiseAndEqual, // ?_4 operator&=
574 IFK::BitwiseOrEqual, // ?_5 operator|=
575 IFK::BitwiseXorEqual, // ?_6 operator^=
576 IFK::None, // ?_7 # vftable
577 IFK::None, // ?_8 # vbtable
578 IFK::None, // ?_9 # vcall
579 IFK::None, // ?_A # typeof
580 IFK::None, // ?_B # local static guard
581 IFK::None, // ?_C # string literal
582 IFK::VbaseDtor, // ?_D # vbase destructor
583 IFK::VecDelDtor, // ?_E # vector deleting destructor
584 IFK::DefaultCtorClosure, // ?_F # default constructor closure
585 IFK::ScalarDelDtor, // ?_G # scalar deleting destructor
586 IFK::VecCtorIter, // ?_H # vector constructor iterator
587 IFK::VecDtorIter, // ?_I # vector destructor iterator
588 IFK::VecVbaseCtorIter, // ?_J # vector vbase constructor iterator
589 IFK::VdispMap, // ?_K # virtual displacement map
590 IFK::EHVecCtorIter, // ?_L # eh vector constructor iterator
591 IFK::EHVecDtorIter, // ?_M # eh vector destructor iterator
592 IFK::EHVecVbaseCtorIter, // ?_N # eh vector vbase constructor iterator
593 IFK::CopyCtorClosure, // ?_O # copy constructor closure
594 IFK::None, // ?_P<name> # udt returning <name>
595 IFK::None, // ?_Q # <unknown>
596 IFK::None, // ?_R0 - ?_R4 # RTTI Codes
597 IFK::None, // ?_S # local vftable
598 IFK::LocalVftableCtorClosure, // ?_T # local vftable constructor closure
599 IFK::ArrayNew, // ?_U operator new[]
600 IFK::ArrayDelete, // ?_V operator delete[]
601 IFK::None, // ?_W <unused>
602 IFK::None, // ?_X <unused>
603 IFK::None, // ?_Y <unused>
604 IFK::None, // ?_Z <unused>
605 };
606 static IFK DoubleUnder[36] = {
607 IFK::None, // ?__0 <unused>
608 IFK::None, // ?__1 <unused>
609 IFK::None, // ?__2 <unused>
610 IFK::None, // ?__3 <unused>
611 IFK::None, // ?__4 <unused>
612 IFK::None, // ?__5 <unused>
613 IFK::None, // ?__6 <unused>
614 IFK::None, // ?__7 <unused>
615 IFK::None, // ?__8 <unused>
616 IFK::None, // ?__9 <unused>
617 IFK::ManVectorCtorIter, // ?__A managed vector ctor iterator
618 IFK::ManVectorDtorIter, // ?__B managed vector dtor iterator
619 IFK::EHVectorCopyCtorIter, // ?__C EH vector copy ctor iterator
620 IFK::EHVectorVbaseCopyCtorIter, // ?__D EH vector vbase copy ctor iter
621 IFK::None, // ?__E dynamic initializer for `T'
622 IFK::None, // ?__F dynamic atexit destructor for `T'
623 IFK::VectorCopyCtorIter, // ?__G vector copy constructor iter
624 IFK::VectorVbaseCopyCtorIter, // ?__H vector vbase copy ctor iter
625 IFK::ManVectorVbaseCopyCtorIter, // ?__I managed vector vbase copy ctor
626 // iter
627 IFK::None, // ?__J local static thread guard
628 IFK::None, // ?__K operator ""_name
Nico Webere8f21b12019-04-23 16:20:27 +0000629 IFK::CoAwait, // ?__L operator co_await
630 IFK::Spaceship, // ?__M operator<=>
Zachary Turner03312862018-08-27 03:48:03 +0000631 IFK::None, // ?__N <unused>
632 IFK::None, // ?__O <unused>
633 IFK::None, // ?__P <unused>
634 IFK::None, // ?__Q <unused>
635 IFK::None, // ?__R <unused>
636 IFK::None, // ?__S <unused>
637 IFK::None, // ?__T <unused>
638 IFK::None, // ?__U <unused>
639 IFK::None, // ?__V <unused>
640 IFK::None, // ?__W <unused>
641 IFK::None, // ?__X <unused>
642 IFK::None, // ?__Y <unused>
643 IFK::None, // ?__Z <unused>
644 };
645
646 int Index = (CH >= '0' && CH <= '9') ? (CH - '0') : (CH - 'A' + 10);
647 switch (Group) {
648 case FunctionIdentifierCodeGroup::Basic:
649 return Basic[Index];
650 case FunctionIdentifierCodeGroup::Under:
651 return Under[Index];
652 case FunctionIdentifierCodeGroup::DoubleUnder:
653 return DoubleUnder[Index];
654 }
Erik Pilkington5094e5e2019-01-17 20:37:51 +0000655 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000656}
657
658IdentifierNode *
659Demangler::demangleFunctionIdentifierCode(StringView &MangledName,
660 FunctionIdentifierCodeGroup Group) {
Nico Weber63fe2592019-04-14 23:08:12 +0000661 if (MangledName.empty()) {
662 Error = true;
663 return nullptr;
664 }
Zachary Turner03312862018-08-27 03:48:03 +0000665 switch (Group) {
666 case FunctionIdentifierCodeGroup::Basic:
667 switch (char CH = MangledName.popFront()) {
668 case '0':
669 case '1':
670 return demangleStructorIdentifier(MangledName, CH == '1');
671 case 'B':
672 return demangleConversionOperatorIdentifier(MangledName);
673 default:
674 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
675 translateIntrinsicFunctionCode(CH, Group));
676 }
Zachary Turner03312862018-08-27 03:48:03 +0000677 case FunctionIdentifierCodeGroup::Under:
678 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
679 translateIntrinsicFunctionCode(MangledName.popFront(), Group));
680 case FunctionIdentifierCodeGroup::DoubleUnder:
681 switch (char CH = MangledName.popFront()) {
682 case 'K':
683 return demangleLiteralOperatorIdentifier(MangledName);
684 default:
685 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
686 translateIntrinsicFunctionCode(CH, Group));
687 }
688 }
Zachary Turner03312862018-08-27 03:48:03 +0000689
Nico Weberef035182019-04-11 23:23:00 +0000690 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000691}
692
693SymbolNode *Demangler::demangleEncodedSymbol(StringView &MangledName,
694 QualifiedNameNode *Name) {
Nico Weber63b97d22019-04-08 19:46:53 +0000695 if (MangledName.empty()) {
696 Error = true;
697 return nullptr;
698 }
699
Zachary Turner469f0762018-08-17 21:18:05 +0000700 // Read a variable.
701 switch (MangledName.front()) {
702 case '0':
703 case '1':
704 case '2':
705 case '3':
Zachary Turner03312862018-08-27 03:48:03 +0000706 case '4': {
707 StorageClass SC = demangleVariableStorageClass(MangledName);
708 return demangleVariableEncoding(MangledName, SC);
Zachary Turner469f0762018-08-17 21:18:05 +0000709 }
Zachary Turner03312862018-08-27 03:48:03 +0000710 }
711 FunctionSymbolNode *FSN = demangleFunctionEncoding(MangledName);
712
713 IdentifierNode *UQN = Name->getUnqualifiedIdentifier();
714 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
715 ConversionOperatorIdentifierNode *COIN =
716 static_cast<ConversionOperatorIdentifierNode *>(UQN);
Nico Weber63b97d22019-04-08 19:46:53 +0000717 if (FSN)
718 COIN->TargetType = FSN->Signature->ReturnType;
Zachary Turner03312862018-08-27 03:48:03 +0000719 }
720 return FSN;
Zachary Turner469f0762018-08-17 21:18:05 +0000721}
722
Nico Weber63b97d22019-04-08 19:46:53 +0000723SymbolNode *Demangler::demangleDeclarator(StringView &MangledName) {
724 // What follows is a main symbol name. This may include namespaces or class
725 // back references.
726 QualifiedNameNode *QN = demangleFullyQualifiedSymbolName(MangledName);
727 if (Error)
728 return nullptr;
729
730 SymbolNode *Symbol = demangleEncodedSymbol(MangledName, QN);
731 if (Error)
732 return nullptr;
733 Symbol->Name = QN;
734
735 IdentifierNode *UQN = QN->getUnqualifiedIdentifier();
736 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
737 ConversionOperatorIdentifierNode *COIN =
738 static_cast<ConversionOperatorIdentifierNode *>(UQN);
739 if (!COIN->TargetType) {
740 Error = true;
741 return nullptr;
742 }
743 }
744 return Symbol;
745}
746
Nico Weber82dc06c2019-05-27 23:10:42 +0000747SymbolNode *Demangler::demangleMD5Name(StringView &MangledName) {
748 assert(MangledName.startsWith("??@"));
749 // This is an MD5 mangled name. We can't demangle it, just return the
750 // mangled name.
751 // An MD5 mangled name is ??@ followed by 32 characters and a terminating @.
752 size_t MD5Last = MangledName.find('@', strlen("??@"));
753 if (MD5Last == StringView::npos) {
754 Error = true;
755 return nullptr;
756 }
757 const char *Start = MangledName.begin();
758 MangledName = MangledName.dropFront(MD5Last + 1);
759
760 // There are two additional special cases for MD5 names:
761 // 1. For complete object locators where the object name is long enough
762 // for the object to have an MD5 name, the complete object locator is
763 // called ??@...@??_R4@ (with a trailing "??_R4@" instead of the usual
764 // leading "??_R4". This is handled here.
765 // 2. For catchable types, in versions of MSVC before 2015 (<1900) or after
766 // 2017.2 (>= 1914), the catchable type mangling is _CT??@...@??@...@8
767 // instead of_CT??@...@8 with just one MD5 name. Since we don't yet
768 // demangle catchable types anywhere, this isn't handled for MD5 names
769 // either.
770 MangledName.consumeFront("??_R4@");
771
772 StringView MD5(Start, MangledName.begin());
773 SymbolNode *S = Arena.alloc<SymbolNode>(NodeKind::Md5Symbol);
774 S->Name = synthesizeQualifiedName(Arena, MD5);
775
776 return S;
777}
778
Zachary Turner469f0762018-08-17 21:18:05 +0000779// Parser entry point.
Zachary Turner03312862018-08-27 03:48:03 +0000780SymbolNode *Demangler::parse(StringView &MangledName) {
Nico Weber82dc06c2019-05-27 23:10:42 +0000781 if (MangledName.startsWith("??@"))
782 return demangleMD5Name(MangledName);
Zachary Turner83313f82018-08-16 16:17:17 +0000783
Nico Webercfe08bc2019-05-27 00:48:59 +0000784 // MSVC-style mangled symbols must start with '?'.
Zachary Turner03312862018-08-27 03:48:03 +0000785 if (!MangledName.startsWith('?')) {
786 Error = true;
787 return nullptr;
788 }
789
Zachary Turner469f0762018-08-17 21:18:05 +0000790 MangledName.consumeFront('?');
Zachary Turner970fdc32018-08-16 16:17:36 +0000791
Zachary Turner469f0762018-08-17 21:18:05 +0000792 // ?$ is a template instantiation, but all other names that start with ? are
793 // operators / special names.
Zachary Turner03312862018-08-27 03:48:03 +0000794 if (SymbolNode *SI = demangleSpecialIntrinsic(MangledName))
795 return SI;
Zachary Turner469f0762018-08-17 21:18:05 +0000796
Nico Weber63b97d22019-04-08 19:46:53 +0000797 return demangleDeclarator(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000798}
799
Zachary Turner7ba90562018-11-01 15:07:32 +0000800TagTypeNode *Demangler::parseTagUniqueName(StringView &MangledName) {
801 if (!MangledName.consumeFront(".?A"))
802 return nullptr;
803 MangledName.consumeFront(".?A");
804 if (MangledName.empty())
805 return nullptr;
806
807 return demangleClassType(MangledName);
808}
809
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000810// <type-encoding> ::= <storage-class> <variable-type>
811// <storage-class> ::= 0 # private static member
812// ::= 1 # protected static member
813// ::= 2 # public static member
814// ::= 3 # global
815// ::= 4 # static local
816
Zachary Turner03312862018-08-27 03:48:03 +0000817VariableSymbolNode *Demangler::demangleVariableEncoding(StringView &MangledName,
818 StorageClass SC) {
819 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000820
Zachary Turner03312862018-08-27 03:48:03 +0000821 VSN->Type = demangleType(MangledName, QualifierMangleMode::Drop);
822 VSN->SC = SC;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000823
Nico Weber63b97d22019-04-08 19:46:53 +0000824 if (Error)
825 return nullptr;
826
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000827 // <variable-type> ::= <type> <cvr-qualifiers>
828 // ::= <type> <pointee-cvr-qualifiers> # pointers, references
Zachary Turner03312862018-08-27 03:48:03 +0000829 switch (VSN->Type->kind()) {
830 case NodeKind::PointerType: {
831 PointerTypeNode *PTN = static_cast<PointerTypeNode *>(VSN->Type);
832
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000833 Qualifiers ExtraChildQuals = Q_None;
Zachary Turner03312862018-08-27 03:48:03 +0000834 PTN->Quals = Qualifiers(VSN->Type->Quals |
835 demanglePointerExtQualifiers(MangledName));
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000836
Zachary Turnerd742d642018-07-26 19:56:09 +0000837 bool IsMember = false;
Zachary Turner316109b2018-07-29 16:38:02 +0000838 std::tie(ExtraChildQuals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000839
Zachary Turner03312862018-08-27 03:48:03 +0000840 if (PTN->ClassParent) {
841 QualifiedNameNode *BackRefName =
842 demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000843 (void)BackRefName;
844 }
Zachary Turner03312862018-08-27 03:48:03 +0000845 PTN->Pointee->Quals = Qualifiers(PTN->Pointee->Quals | ExtraChildQuals);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000846
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000847 break;
848 }
849 default:
Zachary Turner03312862018-08-27 03:48:03 +0000850 VSN->Type->Quals = demangleQualifiers(MangledName).first;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000851 break;
852 }
853
Zachary Turner03312862018-08-27 03:48:03 +0000854 return VSN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000855}
856
857// Sometimes numbers are encoded in mangled symbols. For example,
858// "int (*x)[20]" is a valid C type (x is a pointer to an array of
859// length 20), so we need some way to embed numbers as part of symbols.
860// This function parses it.
861//
862// <number> ::= [?] <non-negative integer>
863//
864// <non-negative integer> ::= <decimal digit> # when 1 <= Number <= 10
Nico Weber502cf4b2019-04-18 19:30:21 +0000865// ::= <hex digit>+ @ # when Number == 0 or >= 10
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000866//
867// <hex-digit> ::= [A-P] # A = 0, B = 1, ...
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000868std::pair<uint64_t, bool> Demangler::demangleNumber(StringView &MangledName) {
869 bool IsNegative = MangledName.consumeFront('?');
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000870
871 if (startsWithDigit(MangledName)) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000872 uint64_t Ret = MangledName[0] - '0' + 1;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000873 MangledName = MangledName.dropFront(1);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000874 return {Ret, IsNegative};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000875 }
876
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000877 uint64_t Ret = 0;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000878 for (size_t i = 0; i < MangledName.size(); ++i) {
879 char C = MangledName[i];
880 if (C == '@') {
881 MangledName = MangledName.dropFront(i + 1);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000882 return {Ret, IsNegative};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000883 }
884 if ('A' <= C && C <= 'P') {
885 Ret = (Ret << 4) + (C - 'A');
886 continue;
887 }
888 break;
889 }
890
891 Error = true;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000892 return {0ULL, false};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000893}
894
Zachary Turner469f0762018-08-17 21:18:05 +0000895uint64_t Demangler::demangleUnsigned(StringView &MangledName) {
896 bool IsNegative = false;
897 uint64_t Number = 0;
898 std::tie(Number, IsNegative) = demangleNumber(MangledName);
899 if (IsNegative)
900 Error = true;
901 return Number;
902}
903
904int64_t Demangler::demangleSigned(StringView &MangledName) {
905 bool IsNegative = false;
906 uint64_t Number = 0;
907 std::tie(Number, IsNegative) = demangleNumber(MangledName);
908 if (Number > INT64_MAX)
909 Error = true;
910 int64_t I = static_cast<int64_t>(Number);
911 return IsNegative ? -I : I;
912}
913
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000914// First 10 strings can be referenced by special BackReferences ?0, ?1, ..., ?9.
915// Memorize it.
916void Demangler::memorizeString(StringView S) {
Zachary Turnerd346cba2018-08-08 17:17:04 +0000917 if (Backrefs.NamesCount >= BackrefContext::Max)
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000918 return;
Zachary Turnerd346cba2018-08-08 17:17:04 +0000919 for (size_t i = 0; i < Backrefs.NamesCount; ++i)
Zachary Turner03312862018-08-27 03:48:03 +0000920 if (S == Backrefs.Names[i]->Name)
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000921 return;
Zachary Turner03312862018-08-27 03:48:03 +0000922 NamedIdentifierNode *N = Arena.alloc<NamedIdentifierNode>();
923 N->Name = S;
924 Backrefs.Names[Backrefs.NamesCount++] = N;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000925}
926
Zachary Turner03312862018-08-27 03:48:03 +0000927NamedIdentifierNode *Demangler::demangleBackRefName(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +0000928 assert(startsWithDigit(MangledName));
Zachary Turnerd9e925f2018-08-18 18:49:48 +0000929
930 size_t I = MangledName[0] - '0';
931 if (I >= Backrefs.NamesCount) {
932 Error = true;
933 return nullptr;
934 }
935
Zachary Turner172aea12018-08-02 17:08:03 +0000936 MangledName = MangledName.dropFront();
Zachary Turner03312862018-08-27 03:48:03 +0000937 return Backrefs.Names[I];
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000938}
939
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000940void Demangler::memorizeIdentifier(IdentifierNode *Identifier) {
941 // Render this class template name into a string buffer so that we can
942 // memorize it for the purpose of back-referencing.
Nico Weber1359d652018-09-15 18:24:20 +0000943 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +0000944 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +0000945 // FIXME: Propagate out-of-memory as an error?
946 std::terminate();
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000947 Identifier->output(OS, OF_Default);
948 OS << '\0';
949 char *Name = OS.getBuffer();
950
951 StringView Owned = copyString(Name);
952 memorizeString(Owned);
953 std::free(Name);
954}
955
Zachary Turner03312862018-08-27 03:48:03 +0000956IdentifierNode *
957Demangler::demangleTemplateInstantiationName(StringView &MangledName,
958 NameBackrefBehavior NBB) {
Zachary Turnera7dffb12018-07-28 22:10:42 +0000959 assert(MangledName.startsWith("?$"));
960 MangledName.consumeFront("?$");
961
Zachary Turnerd346cba2018-08-08 17:17:04 +0000962 BackrefContext OuterContext;
963 std::swap(OuterContext, Backrefs);
Zachary Turner54d4ffe2018-08-01 18:32:28 +0000964
Zachary Turner03312862018-08-27 03:48:03 +0000965 IdentifierNode *Identifier =
966 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
Zachary Turnerd346cba2018-08-08 17:17:04 +0000967 if (!Error)
Zachary Turner03312862018-08-27 03:48:03 +0000968 Identifier->TemplateParams = demangleTemplateParameterList(MangledName);
Zachary Turnerd346cba2018-08-08 17:17:04 +0000969
970 std::swap(OuterContext, Backrefs);
Zachary Turner54d4ffe2018-08-01 18:32:28 +0000971 if (Error)
972 return nullptr;
Zachary Turner71c91f92018-07-30 03:12:34 +0000973
Nico Weber64041d72019-04-15 16:42:44 +0000974 if (NBB & NBB_Template) {
975 // NBB_Template is only set for types and non-leaf names ("a::" in "a::b").
Nico Weberc035c242019-04-16 14:10:34 +0000976 // Structors and conversion operators only makes sense in a leaf name, so
977 // reject them in NBB_Template contexts.
978 if (Identifier->kind() == NodeKind::ConversionOperatorIdentifier ||
979 Identifier->kind() == NodeKind::StructorIdentifier) {
Nico Weber64041d72019-04-15 16:42:44 +0000980 Error = true;
981 return nullptr;
982 }
983
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000984 memorizeIdentifier(Identifier);
Nico Weber64041d72019-04-15 16:42:44 +0000985 }
Zachary Turner71c91f92018-07-30 03:12:34 +0000986
Zachary Turner03312862018-08-27 03:48:03 +0000987 return Identifier;
Zachary Turnera7dffb12018-07-28 22:10:42 +0000988}
989
Zachary Turner03312862018-08-27 03:48:03 +0000990NamedIdentifierNode *Demangler::demangleSimpleName(StringView &MangledName,
991 bool Memorize) {
Zachary Turner931e8792018-07-30 23:02:10 +0000992 StringView S = demangleSimpleString(MangledName, Memorize);
993 if (Error)
994 return nullptr;
995
Zachary Turner03312862018-08-27 03:48:03 +0000996 NamedIdentifierNode *Name = Arena.alloc<NamedIdentifierNode>();
997 Name->Name = S;
998 return Name;
Zachary Turner931e8792018-07-30 23:02:10 +0000999}
1000
// Returns true if C is one of the letters 'A'..'P', which encode the hex
// digits 0..15 in mangled names.
static bool isRebasedHexDigit(char C) { return !(C < 'A' || C > 'P'); }
1002
1003static uint8_t rebasedHexDigitToNumber(char C) {
1004 assert(isRebasedHexDigit(C));
1005 return (C <= 'J') ? (C - 'A') : (10 + C - 'K');
1006}
1007
1008uint8_t Demangler::demangleCharLiteral(StringView &MangledName) {
Nico Webera0ac65c2019-04-18 19:52:32 +00001009 assert(!MangledName.empty());
Zachary Turner970fdc32018-08-16 16:17:36 +00001010 if (!MangledName.startsWith('?'))
1011 return MangledName.popFront();
1012
1013 MangledName = MangledName.dropFront();
1014 if (MangledName.empty())
1015 goto CharLiteralError;
1016
1017 if (MangledName.consumeFront('$')) {
1018 // Two hex digits
1019 if (MangledName.size() < 2)
1020 goto CharLiteralError;
1021 StringView Nibbles = MangledName.substr(0, 2);
1022 if (!isRebasedHexDigit(Nibbles[0]) || !isRebasedHexDigit(Nibbles[1]))
1023 goto CharLiteralError;
1024 // Don't append the null terminator.
1025 uint8_t C1 = rebasedHexDigitToNumber(Nibbles[0]);
1026 uint8_t C2 = rebasedHexDigitToNumber(Nibbles[1]);
1027 MangledName = MangledName.dropFront(2);
1028 return (C1 << 4) | C2;
1029 }
1030
1031 if (startsWithDigit(MangledName)) {
1032 const char *Lookup = ",/\\:. \n\t'-";
1033 char C = Lookup[MangledName[0] - '0'];
1034 MangledName = MangledName.dropFront();
1035 return C;
1036 }
1037
1038 if (MangledName[0] >= 'a' && MangledName[0] <= 'z') {
1039 char Lookup[26] = {'\xE1', '\xE2', '\xE3', '\xE4', '\xE5', '\xE6', '\xE7',
1040 '\xE8', '\xE9', '\xEA', '\xEB', '\xEC', '\xED', '\xEE',
1041 '\xEF', '\xF0', '\xF1', '\xF2', '\xF3', '\xF4', '\xF5',
1042 '\xF6', '\xF7', '\xF8', '\xF9', '\xFA'};
1043 char C = Lookup[MangledName[0] - 'a'];
1044 MangledName = MangledName.dropFront();
1045 return C;
1046 }
1047
1048 if (MangledName[0] >= 'A' && MangledName[0] <= 'Z') {
1049 char Lookup[26] = {'\xC1', '\xC2', '\xC3', '\xC4', '\xC5', '\xC6', '\xC7',
1050 '\xC8', '\xC9', '\xCA', '\xCB', '\xCC', '\xCD', '\xCE',
1051 '\xCF', '\xD0', '\xD1', '\xD2', '\xD3', '\xD4', '\xD5',
1052 '\xD6', '\xD7', '\xD8', '\xD9', '\xDA'};
1053 char C = Lookup[MangledName[0] - 'A'];
1054 MangledName = MangledName.dropFront();
1055 return C;
1056 }
1057
1058CharLiteralError:
1059 Error = true;
1060 return '\0';
1061}
1062
1063wchar_t Demangler::demangleWcharLiteral(StringView &MangledName) {
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001064 uint8_t C1, C2;
1065
1066 C1 = demangleCharLiteral(MangledName);
Nico Weberf5c7f3a2019-04-22 15:05:18 +00001067 if (Error || MangledName.empty())
Zachary Turner970fdc32018-08-16 16:17:36 +00001068 goto WCharLiteralError;
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001069 C2 = demangleCharLiteral(MangledName);
Zachary Turner970fdc32018-08-16 16:17:36 +00001070 if (Error)
1071 goto WCharLiteralError;
1072
1073 return ((wchar_t)C1 << 8) | (wchar_t)C2;
1074
1075WCharLiteralError:
1076 Error = true;
1077 return L'\0';
1078}
1079
// Stores the upper-case hexadecimal character for Digit (0..15) in *Buffer.
static void writeHexDigit(char *Buffer, uint8_t Digit) {
  assert(Digit <= 15);
  if (Digit < 10)
    *Buffer = '0' + Digit;
  else
    *Buffer = 'A' + Digit - 10;
}
1084
1085static void outputHex(OutputStream &OS, unsigned C) {
1086 if (C == 0) {
1087 OS << "\\x00";
1088 return;
1089 }
1090 // It's easier to do the math if we can work from right to left, but we need
1091 // to print the numbers from left to right. So render this into a temporary
1092 // buffer first, then output the temporary buffer. Each byte is of the form
1093 // \xAB, which means that each byte needs 4 characters. Since there are at
1094 // most 4 bytes, we need a 4*4+1 = 17 character temporary buffer.
1095 char TempBuffer[17];
1096
1097 ::memset(TempBuffer, 0, sizeof(TempBuffer));
Nico Weber8fc99022019-04-21 16:58:25 +00001098 constexpr int MaxPos = sizeof(TempBuffer) - 1;
Zachary Turner970fdc32018-08-16 16:17:36 +00001099
Nico Weber8fc99022019-04-21 16:58:25 +00001100 int Pos = MaxPos - 1; // TempBuffer[MaxPos] is the terminating \0.
Zachary Turner970fdc32018-08-16 16:17:36 +00001101 while (C != 0) {
1102 for (int I = 0; I < 2; ++I) {
1103 writeHexDigit(&TempBuffer[Pos--], C % 16);
1104 C /= 16;
1105 }
Zachary Turner970fdc32018-08-16 16:17:36 +00001106 }
Nico Weberce67a412019-04-21 17:19:27 +00001107 TempBuffer[Pos--] = 'x';
1108 assert(Pos >= 0);
1109 TempBuffer[Pos--] = '\\';
Zachary Turner970fdc32018-08-16 16:17:36 +00001110 OS << StringView(&TempBuffer[Pos + 1]);
1111}
1112
1113static void outputEscapedChar(OutputStream &OS, unsigned C) {
1114 switch (C) {
Nico Weber8eeaf512019-04-20 23:59:06 +00001115 case '\0': // nul
1116 OS << "\\0";
1117 return;
Zachary Turner970fdc32018-08-16 16:17:36 +00001118 case '\'': // single quote
1119 OS << "\\\'";
1120 return;
1121 case '\"': // double quote
1122 OS << "\\\"";
1123 return;
1124 case '\\': // backslash
1125 OS << "\\\\";
1126 return;
1127 case '\a': // bell
1128 OS << "\\a";
1129 return;
1130 case '\b': // backspace
1131 OS << "\\b";
1132 return;
1133 case '\f': // form feed
1134 OS << "\\f";
1135 return;
1136 case '\n': // new line
1137 OS << "\\n";
1138 return;
1139 case '\r': // carriage return
1140 OS << "\\r";
1141 return;
1142 case '\t': // tab
1143 OS << "\\t";
1144 return;
1145 case '\v': // vertical tab
1146 OS << "\\v";
1147 return;
1148 default:
1149 break;
1150 }
1151
1152 if (C > 0x1F && C < 0x7F) {
1153 // Standard ascii char.
1154 OS << (char)C;
1155 return;
1156 }
1157
1158 outputHex(OS, C);
1159}
1160
// Returns the number of consecutive zero bytes at the end of the first Length
// bytes of StringBytes. A Length of zero or less yields 0.
static unsigned countTrailingNullBytes(const uint8_t *StringBytes, int Length) {
  unsigned Count = 0;
  // Index from the back rather than walking a pointer: this never forms a
  // pointer before the start of the buffer, neither for an empty input nor
  // when every byte is zero.
  while (Length > 0 && StringBytes[Length - 1] == 0) {
    --Length;
    ++Count;
  }
  return Count;
}
1171
// Returns how many of the first Length bytes of StringBytes are zero.
static unsigned countEmbeddedNulls(const uint8_t *StringBytes,
                                   unsigned Length) {
  unsigned Nulls = 0;
  for (const uint8_t *Cur = StringBytes, *End = StringBytes + Length;
       Cur != End; ++Cur)
    Nulls += (*Cur == 0) ? 1u : 0u;
  return Nulls;
}
1181
Nico Weber8d05eb82019-04-24 16:09:38 +00001182// A mangled (non-wide) string literal stores the total length of the string it
1183// refers to (passed in NumBytes), and it contains up to 32 bytes of actual text
1184// (passed in StringBytes, NumChars).
Benjamin Kramerc55e9972018-10-13 22:18:22 +00001185static unsigned guessCharByteSize(const uint8_t *StringBytes, unsigned NumChars,
Nico Weber8d05eb82019-04-24 16:09:38 +00001186 uint64_t NumBytes) {
Zachary Turner970fdc32018-08-16 16:17:36 +00001187 assert(NumBytes > 0);
1188
1189 // If the number of bytes is odd, this is guaranteed to be a char string.
1190 if (NumBytes % 2 == 1)
1191 return 1;
1192
1193 // All strings can encode at most 32 bytes of data. If it's less than that,
1194 // then we encoded the entire string. In this case we check for a 1-byte,
1195 // 2-byte, or 4-byte null terminator.
1196 if (NumBytes < 32) {
1197 unsigned TrailingNulls = countTrailingNullBytes(StringBytes, NumChars);
Nico Weber8eeaf512019-04-20 23:59:06 +00001198 if (TrailingNulls >= 4 && NumBytes % 4 == 0)
Zachary Turner970fdc32018-08-16 16:17:36 +00001199 return 4;
1200 if (TrailingNulls >= 2)
1201 return 2;
1202 return 1;
1203 }
1204
1205 // The whole string was not able to be encoded. Try to look at embedded null
1206 // terminators to guess. The heuristic is that we count all embedded null
1207 // terminators. If more than 2/3 are null, it's a char32. If more than 1/3
1208 // are null, it's a char16. Otherwise it's a char8. This obviously isn't
1209 // perfect and is biased towards languages that have ascii alphabets, but this
1210 // was always going to be best effort since the encoding is lossy.
1211 unsigned Nulls = countEmbeddedNulls(StringBytes, NumChars);
Nico Weber8eeaf512019-04-20 23:59:06 +00001212 if (Nulls >= 2 * NumChars / 3 && NumBytes % 4 == 0)
Zachary Turner970fdc32018-08-16 16:17:36 +00001213 return 4;
1214 if (Nulls >= NumChars / 3)
1215 return 2;
1216 return 1;
1217}
1218
// Reads the CharIndex-th character of width CharBytes (1, 2 or 4) from
// StringBytes and returns its value. Bytes are combined least-significant
// byte first.
static unsigned decodeMultiByteChar(const uint8_t *StringBytes,
                                    unsigned CharIndex, unsigned CharBytes) {
  assert(CharBytes == 1 || CharBytes == 2 || CharBytes == 4);
  const uint8_t *Char = StringBytes + CharIndex * CharBytes;

  // Fold from the most significant (last) byte down to the first one.
  unsigned Value = 0;
  for (unsigned Remaining = CharBytes; Remaining-- > 0;)
    Value = (Value << 8) | static_cast<unsigned>(Char[Remaining]);
  return Value;
}
1231
Zachary Turner03312862018-08-27 03:48:03 +00001232FunctionSymbolNode *Demangler::demangleVcallThunkNode(StringView &MangledName) {
1233 FunctionSymbolNode *FSN = Arena.alloc<FunctionSymbolNode>();
1234 VcallThunkIdentifierNode *VTIN = Arena.alloc<VcallThunkIdentifierNode>();
1235 FSN->Signature = Arena.alloc<ThunkSignatureNode>();
1236 FSN->Signature->FunctionClass = FC_NoParameterList;
1237
1238 FSN->Name = demangleNameScopeChain(MangledName, VTIN);
1239 if (!Error)
1240 Error = !MangledName.consumeFront("$B");
1241 if (!Error)
1242 VTIN->OffsetInVTable = demangleUnsigned(MangledName);
1243 if (!Error)
1244 Error = !MangledName.consumeFront('A');
1245 if (!Error)
1246 FSN->Signature->CallConvention = demangleCallingConvention(MangledName);
1247 return (Error) ? nullptr : FSN;
1248}
1249
1250EncodedStringLiteralNode *
1251Demangler::demangleStringLiteral(StringView &MangledName) {
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001252 // This function uses goto, so declare all variables up front.
Zachary Turner970fdc32018-08-16 16:17:36 +00001253 OutputStream OS;
1254 StringView CRC;
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001255 uint64_t StringByteSize;
1256 bool IsWcharT = false;
1257 bool IsNegative = false;
1258 size_t CrcEndPos = 0;
1259 char *ResultBuffer = nullptr;
1260
Zachary Turner03312862018-08-27 03:48:03 +00001261 EncodedStringLiteralNode *Result = Arena.alloc<EncodedStringLiteralNode>();
Zachary Turner970fdc32018-08-16 16:17:36 +00001262
Nico Webere145a542019-04-19 14:13:11 +00001263 // Must happen before the first `goto StringLiteralError`.
1264 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
1265 // FIXME: Propagate out-of-memory as an error?
1266 std::terminate();
1267
Zachary Turner970fdc32018-08-16 16:17:36 +00001268 // Prefix indicating the beginning of a string literal
Zachary Turner3461bfa2018-08-17 16:14:05 +00001269 if (!MangledName.consumeFront("@_"))
1270 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001271 if (MangledName.empty())
1272 goto StringLiteralError;
1273
1274 // Char Type (regular or wchar_t)
Zachary Turner970fdc32018-08-16 16:17:36 +00001275 switch (MangledName.popFront()) {
1276 case '1':
1277 IsWcharT = true;
Erik Pilkington5094e5e2019-01-17 20:37:51 +00001278 DEMANGLE_FALLTHROUGH;
Zachary Turner970fdc32018-08-16 16:17:36 +00001279 case '0':
1280 break;
1281 default:
1282 goto StringLiteralError;
1283 }
1284
1285 // Encoded Length
Zachary Turner970fdc32018-08-16 16:17:36 +00001286 std::tie(StringByteSize, IsNegative) = demangleNumber(MangledName);
Nico Webera0ac65c2019-04-18 19:52:32 +00001287 if (Error || IsNegative || StringByteSize < (IsWcharT ? 2 : 1))
Zachary Turner970fdc32018-08-16 16:17:36 +00001288 goto StringLiteralError;
1289
1290 // CRC 32 (always 8 characters plus a terminator)
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001291 CrcEndPos = MangledName.find('@');
Zachary Turner970fdc32018-08-16 16:17:36 +00001292 if (CrcEndPos == StringView::npos)
1293 goto StringLiteralError;
1294 CRC = MangledName.substr(0, CrcEndPos);
1295 MangledName = MangledName.dropFront(CrcEndPos + 1);
1296 if (MangledName.empty())
1297 goto StringLiteralError;
1298
Zachary Turner970fdc32018-08-16 16:17:36 +00001299 if (IsWcharT) {
Zachary Turner03312862018-08-27 03:48:03 +00001300 Result->Char = CharKind::Wchar;
Zachary Turner970fdc32018-08-16 16:17:36 +00001301 if (StringByteSize > 64)
Zachary Turner3461bfa2018-08-17 16:14:05 +00001302 Result->IsTruncated = true;
Zachary Turner970fdc32018-08-16 16:17:36 +00001303
1304 while (!MangledName.consumeFront('@')) {
Nico Webera0ac65c2019-04-18 19:52:32 +00001305 if (MangledName.size() < 2)
Nico Weber502cf4b2019-04-18 19:30:21 +00001306 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001307 wchar_t W = demangleWcharLiteral(MangledName);
Zachary Turner3461bfa2018-08-17 16:14:05 +00001308 if (StringByteSize != 2 || Result->IsTruncated)
Zachary Turner970fdc32018-08-16 16:17:36 +00001309 outputEscapedChar(OS, W);
1310 StringByteSize -= 2;
1311 if (Error)
1312 goto StringLiteralError;
1313 }
1314 } else {
Zachary Turner32a8a202018-08-29 23:56:09 +00001315 // The max byte length is actually 32, but some compilers mangled strings
1316 // incorrectly, so we have to assume it can go higher.
1317 constexpr unsigned MaxStringByteLength = 32 * 4;
Zachary Turner970fdc32018-08-16 16:17:36 +00001318 uint8_t StringBytes[MaxStringByteLength];
1319
1320 unsigned BytesDecoded = 0;
1321 while (!MangledName.consumeFront('@')) {
Nico Weberaa162682019-04-21 14:25:07 +00001322 if (MangledName.size() < 1 || BytesDecoded >= MaxStringByteLength)
Nico Weber502cf4b2019-04-18 19:30:21 +00001323 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001324 StringBytes[BytesDecoded++] = demangleCharLiteral(MangledName);
1325 }
1326
Zachary Turner32a8a202018-08-29 23:56:09 +00001327 if (StringByteSize > BytesDecoded)
1328 Result->IsTruncated = true;
1329
Zachary Turner970fdc32018-08-16 16:17:36 +00001330 unsigned CharBytes =
1331 guessCharByteSize(StringBytes, BytesDecoded, StringByteSize);
1332 assert(StringByteSize % CharBytes == 0);
1333 switch (CharBytes) {
1334 case 1:
Zachary Turner03312862018-08-27 03:48:03 +00001335 Result->Char = CharKind::Char;
Zachary Turner970fdc32018-08-16 16:17:36 +00001336 break;
1337 case 2:
Zachary Turner03312862018-08-27 03:48:03 +00001338 Result->Char = CharKind::Char16;
Zachary Turner970fdc32018-08-16 16:17:36 +00001339 break;
1340 case 4:
Zachary Turner03312862018-08-27 03:48:03 +00001341 Result->Char = CharKind::Char32;
Zachary Turner970fdc32018-08-16 16:17:36 +00001342 break;
1343 default:
Erik Pilkington5094e5e2019-01-17 20:37:51 +00001344 DEMANGLE_UNREACHABLE;
Zachary Turner970fdc32018-08-16 16:17:36 +00001345 }
1346 const unsigned NumChars = BytesDecoded / CharBytes;
1347 for (unsigned CharIndex = 0; CharIndex < NumChars; ++CharIndex) {
1348 unsigned NextChar =
1349 decodeMultiByteChar(StringBytes, CharIndex, CharBytes);
Zachary Turner3461bfa2018-08-17 16:14:05 +00001350 if (CharIndex + 1 < NumChars || Result->IsTruncated)
Zachary Turner970fdc32018-08-16 16:17:36 +00001351 outputEscapedChar(OS, NextChar);
1352 }
1353 }
1354
1355 OS << '\0';
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001356 ResultBuffer = OS.getBuffer();
Zachary Turner03312862018-08-27 03:48:03 +00001357 Result->DecodedString = copyString(ResultBuffer);
Zachary Turneraf738f72018-08-16 17:48:32 +00001358 std::free(ResultBuffer);
Zachary Turner970fdc32018-08-16 16:17:36 +00001359 return Result;
1360
1361StringLiteralError:
1362 Error = true;
Nico Webere145a542019-04-19 14:13:11 +00001363 std::free(OS.getBuffer());
Zachary Turner970fdc32018-08-16 16:17:36 +00001364 return nullptr;
1365}
1366
Nico Weberc7444dd2019-04-03 23:15:56 +00001367// Returns MangledName's prefix before the first '@', or an error if
1368// MangledName contains no '@' or the prefix has length 0.
Zachary Turner931e8792018-07-30 23:02:10 +00001369StringView Demangler::demangleSimpleString(StringView &MangledName,
1370 bool Memorize) {
1371 StringView S;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001372 for (size_t i = 0; i < MangledName.size(); ++i) {
1373 if (MangledName[i] != '@')
1374 continue;
Nico Weberc7444dd2019-04-03 23:15:56 +00001375 if (i == 0)
1376 break;
Zachary Turner931e8792018-07-30 23:02:10 +00001377 S = MangledName.substr(0, i);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001378 MangledName = MangledName.dropFront(i + 1);
1379
1380 if (Memorize)
Zachary Turner931e8792018-07-30 23:02:10 +00001381 memorizeString(S);
1382 return S;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001383 }
1384
1385 Error = true;
Zachary Turner931e8792018-07-30 23:02:10 +00001386 return {};
Zachary Turnera7dffb12018-07-28 22:10:42 +00001387}
1388
Zachary Turner03312862018-08-27 03:48:03 +00001389NamedIdentifierNode *
1390Demangler::demangleAnonymousNamespaceName(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001391 assert(MangledName.startsWith("?A"));
1392 MangledName.consumeFront("?A");
1393
Zachary Turner03312862018-08-27 03:48:03 +00001394 NamedIdentifierNode *Node = Arena.alloc<NamedIdentifierNode>();
1395 Node->Name = "`anonymous namespace'";
Zachary Turner91c98a82018-08-20 23:58:35 +00001396 size_t EndPos = MangledName.find('@');
1397 if (EndPos == StringView::npos) {
1398 Error = true;
1399 return nullptr;
1400 }
Zachary Turner0002dd42018-08-20 23:58:58 +00001401 StringView NamespaceKey = MangledName.substr(0, EndPos);
1402 memorizeString(NamespaceKey);
Zachary Turner91c98a82018-08-20 23:58:35 +00001403 MangledName = MangledName.substr(EndPos + 1);
1404 return Node;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001405}
1406
Zachary Turner03312862018-08-27 03:48:03 +00001407NamedIdentifierNode *
1408Demangler::demangleLocallyScopedNamePiece(StringView &MangledName) {
Zachary Turner71c91f92018-07-30 03:12:34 +00001409 assert(startsWithLocalScopePattern(MangledName));
1410
Zachary Turner03312862018-08-27 03:48:03 +00001411 NamedIdentifierNode *Identifier = Arena.alloc<NamedIdentifierNode>();
Zachary Turner71c91f92018-07-30 03:12:34 +00001412 MangledName.consumeFront('?');
Nico Weberc5615c22019-04-03 23:29:05 +00001413 uint64_t Number = 0;
1414 bool IsNegative = false;
1415 std::tie(Number, IsNegative) = demangleNumber(MangledName);
1416 assert(!IsNegative);
Zachary Turner71c91f92018-07-30 03:12:34 +00001417
1418 // One ? to terminate the number
1419 MangledName.consumeFront('?');
1420
1421 assert(!Error);
Zachary Turner03312862018-08-27 03:48:03 +00001422 Node *Scope = parse(MangledName);
Zachary Turner71c91f92018-07-30 03:12:34 +00001423 if (Error)
1424 return nullptr;
1425
1426 // Render the parent symbol's name into a buffer.
Nico Weber1359d652018-09-15 18:24:20 +00001427 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +00001428 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00001429 // FIXME: Propagate out-of-memory as an error?
1430 std::terminate();
Zachary Turner71c91f92018-07-30 03:12:34 +00001431 OS << '`';
Zachary Turner38d2edd2018-08-29 03:59:17 +00001432 Scope->output(OS, OF_Default);
Zachary Turner71c91f92018-07-30 03:12:34 +00001433 OS << '\'';
Nico Weberc5615c22019-04-03 23:29:05 +00001434 OS << "::`" << Number << "'";
Zachary Turner71c91f92018-07-30 03:12:34 +00001435 OS << '\0';
1436 char *Result = OS.getBuffer();
Zachary Turner03312862018-08-27 03:48:03 +00001437 Identifier->Name = copyString(Result);
Zachary Turner71c91f92018-07-30 03:12:34 +00001438 std::free(Result);
Zachary Turner03312862018-08-27 03:48:03 +00001439 return Identifier;
Zachary Turner71c91f92018-07-30 03:12:34 +00001440}
1441
Zachary Turnera7dffb12018-07-28 22:10:42 +00001442// Parses a type name in the form of A@B@C@@ which represents C::B::A.
Zachary Turner03312862018-08-27 03:48:03 +00001443QualifiedNameNode *
1444Demangler::demangleFullyQualifiedTypeName(StringView &MangledName) {
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001445 IdentifierNode *Identifier =
1446 demangleUnqualifiedTypeName(MangledName, /*Memorize=*/true);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001447 if (Error)
1448 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001449 assert(Identifier);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001450
Zachary Turner03312862018-08-27 03:48:03 +00001451 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001452 if (Error)
1453 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001454 assert(QN);
1455 return QN;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001456}
1457
1458// Parses a symbol name in the form of A@B@C@@ which represents C::B::A.
1459// Symbol names have slightly different rules regarding what can appear
1460// so we separate out the implementations for flexibility.
Zachary Turner03312862018-08-27 03:48:03 +00001461QualifiedNameNode *
1462Demangler::demangleFullyQualifiedSymbolName(StringView &MangledName) {
Zachary Turner58d29cf2018-08-08 00:43:31 +00001463 // This is the final component of a symbol name (i.e. the leftmost component
1464 // of a mangled name. Since the only possible template instantiation that
1465 // can appear in this context is a function template, and since those are
1466 // not saved for the purposes of name backreferences, only backref simple
1467 // names.
Zachary Turner03312862018-08-27 03:48:03 +00001468 IdentifierNode *Identifier =
1469 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001470 if (Error)
1471 return nullptr;
Zachary Turner3461bfa2018-08-17 16:14:05 +00001472
Zachary Turner03312862018-08-27 03:48:03 +00001473 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001474 if (Error)
1475 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001476
1477 if (Identifier->kind() == NodeKind::StructorIdentifier) {
Nico Webera9886f82019-04-03 23:23:32 +00001478 if (QN->Components->Count < 2) {
1479 Error = true;
1480 return nullptr;
1481 }
Zachary Turner03312862018-08-27 03:48:03 +00001482 StructorIdentifierNode *SIN =
1483 static_cast<StructorIdentifierNode *>(Identifier);
Zachary Turner03312862018-08-27 03:48:03 +00001484 Node *ClassNode = QN->Components->Nodes[QN->Components->Count - 2];
1485 SIN->Class = static_cast<IdentifierNode *>(ClassNode);
1486 }
1487 assert(QN);
1488 return QN;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001489}
1490
Zachary Turner03312862018-08-27 03:48:03 +00001491IdentifierNode *Demangler::demangleUnqualifiedTypeName(StringView &MangledName,
1492 bool Memorize) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001493 // An inner-most name can be a back-reference, because a fully-qualified name
1494 // (e.g. Scope + Inner) can contain other fully qualified names inside of
1495 // them (for example template parameters), and these nested parameters can
1496 // refer to previously mangled types.
1497 if (startsWithDigit(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001498 return demangleBackRefName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001499
1500 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001501 return demangleTemplateInstantiationName(MangledName, NBB_Template);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001502
Zachary Turner44ebbc22018-08-01 18:32:47 +00001503 return demangleSimpleName(MangledName, Memorize);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001504}
1505
Zachary Turner03312862018-08-27 03:48:03 +00001506IdentifierNode *
1507Demangler::demangleUnqualifiedSymbolName(StringView &MangledName,
1508 NameBackrefBehavior NBB) {
Zachary Turner71c91f92018-07-30 03:12:34 +00001509 if (startsWithDigit(MangledName))
1510 return demangleBackRefName(MangledName);
1511 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001512 return demangleTemplateInstantiationName(MangledName, NBB);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001513 if (MangledName.startsWith('?'))
Zachary Turner03312862018-08-27 03:48:03 +00001514 return demangleFunctionIdentifierCode(MangledName);
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001515 return demangleSimpleName(MangledName, /*Memorize=*/(NBB & NBB_Simple) != 0);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001516}
1517
Zachary Turner03312862018-08-27 03:48:03 +00001518IdentifierNode *Demangler::demangleNameScopePiece(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001519 if (startsWithDigit(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001520 return demangleBackRefName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001521
1522 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001523 return demangleTemplateInstantiationName(MangledName, NBB_Template);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001524
1525 if (MangledName.startsWith("?A"))
Zachary Turner316109b2018-07-29 16:38:02 +00001526 return demangleAnonymousNamespaceName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001527
Zachary Turner71c91f92018-07-30 03:12:34 +00001528 if (startsWithLocalScopePattern(MangledName))
1529 return demangleLocallyScopedNamePiece(MangledName);
1530
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001531 return demangleSimpleName(MangledName, /*Memorize=*/true);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001532}
1533
Zachary Turner03312862018-08-27 03:48:03 +00001534static NodeArrayNode *nodeListToNodeArray(ArenaAllocator &Arena, NodeList *Head,
1535 size_t Count) {
1536 NodeArrayNode *N = Arena.alloc<NodeArrayNode>();
1537 N->Count = Count;
1538 N->Nodes = Arena.allocArray<Node *>(Count);
1539 for (size_t I = 0; I < Count; ++I) {
1540 N->Nodes[I] = Head->N;
1541 Head = Head->Next;
1542 }
1543 return N;
1544}
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001545
Zachary Turner03312862018-08-27 03:48:03 +00001546QualifiedNameNode *
1547Demangler::demangleNameScopeChain(StringView &MangledName,
1548 IdentifierNode *UnqualifiedName) {
1549 NodeList *Head = Arena.alloc<NodeList>();
1550
1551 Head->N = UnqualifiedName;
1552
1553 size_t Count = 1;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001554 while (!MangledName.consumeFront("@")) {
Zachary Turner03312862018-08-27 03:48:03 +00001555 ++Count;
1556 NodeList *NewHead = Arena.alloc<NodeList>();
1557 NewHead->Next = Head;
1558 Head = NewHead;
1559
Zachary Turnera7dffb12018-07-28 22:10:42 +00001560 if (MangledName.empty()) {
1561 Error = true;
1562 return nullptr;
1563 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001564
1565 assert(!Error);
Zachary Turner03312862018-08-27 03:48:03 +00001566 IdentifierNode *Elem = demangleNameScopePiece(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001567 if (Error)
1568 return nullptr;
1569
Zachary Turner03312862018-08-27 03:48:03 +00001570 Head->N = Elem;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001571 }
Zachary Turner03312862018-08-27 03:48:03 +00001572
1573 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
1574 QN->Components = nodeListToNodeArray(Arena, Head, Count);
1575 return QN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001576}
1577
Zachary Turner316109b2018-07-29 16:38:02 +00001578FuncClass Demangler::demangleFunctionClass(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001579 switch (MangledName.popFront()) {
Zachary Turner29ec67b2018-08-10 21:09:05 +00001580 case '9':
Zachary Turner03312862018-08-27 03:48:03 +00001581 return FuncClass(FC_ExternC | FC_NoParameterList);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001582 case 'A':
Zachary Turner03312862018-08-27 03:48:03 +00001583 return FC_Private;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001584 case 'B':
Zachary Turner03312862018-08-27 03:48:03 +00001585 return FuncClass(FC_Private | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001586 case 'C':
Zachary Turner03312862018-08-27 03:48:03 +00001587 return FuncClass(FC_Private | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001588 case 'D':
Zachary Turner03312862018-08-27 03:48:03 +00001589 return FuncClass(FC_Private | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001590 case 'E':
Zachary Turner03312862018-08-27 03:48:03 +00001591 return FuncClass(FC_Private | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001592 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00001593 return FuncClass(FC_Private | FC_Virtual);
Zachary Turner32a8a202018-08-29 23:56:09 +00001594 case 'G':
1595 return FuncClass(FC_Private | FC_StaticThisAdjust);
1596 case 'H':
1597 return FuncClass(FC_Private | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001598 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00001599 return FuncClass(FC_Protected);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001600 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001601 return FuncClass(FC_Protected | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001602 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001603 return FuncClass(FC_Protected | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001604 case 'L':
Zachary Turner03312862018-08-27 03:48:03 +00001605 return FuncClass(FC_Protected | FC_Static | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001606 case 'M':
Zachary Turner03312862018-08-27 03:48:03 +00001607 return FuncClass(FC_Protected | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001608 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001609 return FuncClass(FC_Protected | FC_Virtual | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001610 case 'O':
Zachary Turner03312862018-08-27 03:48:03 +00001611 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust);
Zachary Turner469f0762018-08-17 21:18:05 +00001612 case 'P':
Zachary Turner03312862018-08-27 03:48:03 +00001613 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001614 case 'Q':
Zachary Turner03312862018-08-27 03:48:03 +00001615 return FuncClass(FC_Public);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001616 case 'R':
Zachary Turner03312862018-08-27 03:48:03 +00001617 return FuncClass(FC_Public | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001618 case 'S':
Zachary Turner03312862018-08-27 03:48:03 +00001619 return FuncClass(FC_Public | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001620 case 'T':
Zachary Turner03312862018-08-27 03:48:03 +00001621 return FuncClass(FC_Public | FC_Static | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001622 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001623 return FuncClass(FC_Public | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001624 case 'V':
Zachary Turner03312862018-08-27 03:48:03 +00001625 return FuncClass(FC_Public | FC_Virtual | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001626 case 'W':
Zachary Turner03312862018-08-27 03:48:03 +00001627 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust);
Zachary Turner469f0762018-08-17 21:18:05 +00001628 case 'X':
Zachary Turner03312862018-08-27 03:48:03 +00001629 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001630 case 'Y':
Zachary Turner03312862018-08-27 03:48:03 +00001631 return FuncClass(FC_Global);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001632 case 'Z':
Zachary Turner03312862018-08-27 03:48:03 +00001633 return FuncClass(FC_Global | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001634 case '$': {
Zachary Turner03312862018-08-27 03:48:03 +00001635 FuncClass VFlag = FC_VirtualThisAdjust;
Zachary Turner469f0762018-08-17 21:18:05 +00001636 if (MangledName.consumeFront('R'))
Zachary Turner03312862018-08-27 03:48:03 +00001637 VFlag = FuncClass(VFlag | FC_VirtualThisAdjustEx);
Nico Weberb4f33bb2019-04-11 22:47:18 +00001638 if (MangledName.empty())
1639 break;
Zachary Turner469f0762018-08-17 21:18:05 +00001640 switch (MangledName.popFront()) {
1641 case '0':
Zachary Turner03312862018-08-27 03:48:03 +00001642 return FuncClass(FC_Private | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001643 case '1':
Zachary Turner03312862018-08-27 03:48:03 +00001644 return FuncClass(FC_Private | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001645 case '2':
Zachary Turner03312862018-08-27 03:48:03 +00001646 return FuncClass(FC_Protected | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001647 case '3':
Zachary Turner03312862018-08-27 03:48:03 +00001648 return FuncClass(FC_Protected | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001649 case '4':
Zachary Turner03312862018-08-27 03:48:03 +00001650 return FuncClass(FC_Public | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001651 case '5':
Zachary Turner03312862018-08-27 03:48:03 +00001652 return FuncClass(FC_Public | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001653 }
1654 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001655 }
1656
1657 Error = true;
Zachary Turner03312862018-08-27 03:48:03 +00001658 return FC_Public;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001659}
1660
Zachary Turner316109b2018-07-29 16:38:02 +00001661CallingConv Demangler::demangleCallingConvention(StringView &MangledName) {
Nico Weber63b97d22019-04-08 19:46:53 +00001662 if (MangledName.empty()) {
1663 Error = true;
1664 return CallingConv::None;
1665 }
1666
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001667 switch (MangledName.popFront()) {
1668 case 'A':
1669 case 'B':
1670 return CallingConv::Cdecl;
1671 case 'C':
1672 case 'D':
1673 return CallingConv::Pascal;
1674 case 'E':
1675 case 'F':
1676 return CallingConv::Thiscall;
1677 case 'G':
1678 case 'H':
1679 return CallingConv::Stdcall;
1680 case 'I':
1681 case 'J':
1682 return CallingConv::Fastcall;
1683 case 'M':
1684 case 'N':
1685 return CallingConv::Clrcall;
1686 case 'O':
1687 case 'P':
1688 return CallingConv::Eabi;
1689 case 'Q':
1690 return CallingConv::Vectorcall;
1691 }
1692
1693 return CallingConv::None;
Martin Storsjo0f2abd82018-07-20 18:43:42 +00001694}
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001695
Zachary Turner316109b2018-07-29 16:38:02 +00001696StorageClass Demangler::demangleVariableStorageClass(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001697 assert(std::isdigit(MangledName.front()));
1698
1699 switch (MangledName.popFront()) {
1700 case '0':
1701 return StorageClass::PrivateStatic;
1702 case '1':
1703 return StorageClass::ProtectedStatic;
1704 case '2':
1705 return StorageClass::PublicStatic;
1706 case '3':
1707 return StorageClass::Global;
1708 case '4':
1709 return StorageClass::FunctionLocalStatic;
1710 }
1711 Error = true;
1712 return StorageClass::None;
1713}
1714
Zachary Turner316109b2018-07-29 16:38:02 +00001715std::pair<Qualifiers, bool>
1716Demangler::demangleQualifiers(StringView &MangledName) {
Nico Weber63b97d22019-04-08 19:46:53 +00001717 if (MangledName.empty()) {
1718 Error = true;
1719 return std::make_pair(Q_None, false);
1720 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001721
1722 switch (MangledName.popFront()) {
Zachary Turnerd742d642018-07-26 19:56:09 +00001723 // Member qualifiers
1724 case 'Q':
1725 return std::make_pair(Q_None, true);
1726 case 'R':
1727 return std::make_pair(Q_Const, true);
1728 case 'S':
1729 return std::make_pair(Q_Volatile, true);
1730 case 'T':
1731 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), true);
1732 // Non-Member qualifiers
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001733 case 'A':
Zachary Turnerd742d642018-07-26 19:56:09 +00001734 return std::make_pair(Q_None, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001735 case 'B':
Zachary Turnerd742d642018-07-26 19:56:09 +00001736 return std::make_pair(Q_Const, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001737 case 'C':
Zachary Turnerd742d642018-07-26 19:56:09 +00001738 return std::make_pair(Q_Volatile, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001739 case 'D':
Zachary Turnerd742d642018-07-26 19:56:09 +00001740 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001741 }
1742 Error = true;
Zachary Turnerd742d642018-07-26 19:56:09 +00001743 return std::make_pair(Q_None, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001744}
1745
1746// <variable-type> ::= <type> <cvr-qualifiers>
1747// ::= <type> <pointee-cvr-qualifiers> # pointers, references
Zachary Turner03312862018-08-27 03:48:03 +00001748TypeNode *Demangler::demangleType(StringView &MangledName,
1749 QualifierMangleMode QMM) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001750 Qualifiers Quals = Q_None;
Zachary Turnerd742d642018-07-26 19:56:09 +00001751 bool IsMember = false;
Zachary Turnerd742d642018-07-26 19:56:09 +00001752 if (QMM == QualifierMangleMode::Mangle) {
Zachary Turner316109b2018-07-29 16:38:02 +00001753 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00001754 } else if (QMM == QualifierMangleMode::Result) {
Zachary Turnerdf4cd7c2018-08-21 21:23:49 +00001755 if (MangledName.consumeFront('?'))
Zachary Turner316109b2018-07-29 16:38:02 +00001756 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001757 }
1758
Nico Weber63b97d22019-04-08 19:46:53 +00001759 if (MangledName.empty()) {
1760 Error = true;
1761 return nullptr;
1762 }
1763
Zachary Turner03312862018-08-27 03:48:03 +00001764 TypeNode *Ty = nullptr;
Zachary Turner931e8792018-07-30 23:02:10 +00001765 if (isTagType(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001766 Ty = demangleClassType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001767 else if (isPointerType(MangledName)) {
Zachary Turner8fb9a712018-12-14 18:10:13 +00001768 if (isMemberPointer(MangledName, Error))
Zachary Turner316109b2018-07-29 16:38:02 +00001769 Ty = demangleMemberPointerType(MangledName);
Zachary Turner8fb9a712018-12-14 18:10:13 +00001770 else if (!Error)
Zachary Turner316109b2018-07-29 16:38:02 +00001771 Ty = demanglePointerType(MangledName);
Zachary Turner8fb9a712018-12-14 18:10:13 +00001772 else
1773 return nullptr;
Zachary Turner931e8792018-07-30 23:02:10 +00001774 } else if (isArrayType(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001775 Ty = demangleArrayType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001776 else if (isFunctionType(MangledName)) {
1777 if (MangledName.consumeFront("$$A8@@"))
Zachary Turner03312862018-08-27 03:48:03 +00001778 Ty = demangleFunctionType(MangledName, true);
Zachary Turner931e8792018-07-30 23:02:10 +00001779 else {
1780 assert(MangledName.startsWith("$$A6"));
1781 MangledName.consumeFront("$$A6");
Zachary Turner03312862018-08-27 03:48:03 +00001782 Ty = demangleFunctionType(MangledName, false);
Zachary Turner931e8792018-07-30 23:02:10 +00001783 }
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001784 } else if (isCustomType(MangledName)) {
1785 Ty = demangleCustomType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001786 } else {
Zachary Turner03312862018-08-27 03:48:03 +00001787 Ty = demanglePrimitiveType(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001788 }
Zachary Turner931e8792018-07-30 23:02:10 +00001789
Zachary Turner2cd32862018-12-14 17:43:56 +00001790 if (!Ty || Error)
1791 return Ty;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001792 Ty->Quals = Qualifiers(Ty->Quals | Quals);
1793 return Ty;
1794}
1795
Zachary Turner2fe49002019-01-08 21:05:51 +00001796bool Demangler::demangleThrowSpecification(StringView &MangledName) {
1797 if (MangledName.consumeFront("_E"))
1798 return true;
Zachary Turner38b78a72018-07-26 20:20:10 +00001799 if (MangledName.consumeFront('Z'))
Zachary Turner2fe49002019-01-08 21:05:51 +00001800 return false;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001801
Zachary Turner38b78a72018-07-26 20:20:10 +00001802 Error = true;
Zachary Turner2fe49002019-01-08 21:05:51 +00001803 return false;
Zachary Turner38b78a72018-07-26 20:20:10 +00001804}
1805
Zachary Turner03312862018-08-27 03:48:03 +00001806FunctionSignatureNode *Demangler::demangleFunctionType(StringView &MangledName,
1807 bool HasThisQuals) {
1808 FunctionSignatureNode *FTy = Arena.alloc<FunctionSignatureNode>();
Zachary Turner38b78a72018-07-26 20:20:10 +00001809
1810 if (HasThisQuals) {
Zachary Turner316109b2018-07-29 16:38:02 +00001811 FTy->Quals = demanglePointerExtQualifiers(MangledName);
Zachary Turner03312862018-08-27 03:48:03 +00001812 FTy->RefQualifier = demangleFunctionRefQualifier(MangledName);
Zachary Turner316109b2018-07-29 16:38:02 +00001813 FTy->Quals = Qualifiers(FTy->Quals | demangleQualifiers(MangledName).first);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001814 }
1815
1816 // Fields that appear on both member and non-member functions.
Zachary Turner316109b2018-07-29 16:38:02 +00001817 FTy->CallConvention = demangleCallingConvention(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001818
1819 // <return-type> ::= <type>
1820 // ::= @ # structors (they have no declared return type)
1821 bool IsStructor = MangledName.consumeFront('@');
1822 if (!IsStructor)
Zachary Turner316109b2018-07-29 16:38:02 +00001823 FTy->ReturnType = demangleType(MangledName, QualifierMangleMode::Result);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001824
Zachary Turner316109b2018-07-29 16:38:02 +00001825 FTy->Params = demangleFunctionParameterList(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001826
Zachary Turner2fe49002019-01-08 21:05:51 +00001827 FTy->IsNoexcept = demangleThrowSpecification(MangledName);
Zachary Turner38b78a72018-07-26 20:20:10 +00001828
1829 return FTy;
1830}
1831
Zachary Turner03312862018-08-27 03:48:03 +00001832FunctionSymbolNode *
1833Demangler::demangleFunctionEncoding(StringView &MangledName) {
1834 FuncClass ExtraFlags = FC_None;
Zachary Turner469f0762018-08-17 21:18:05 +00001835 if (MangledName.consumeFront("$$J0"))
Zachary Turner03312862018-08-27 03:48:03 +00001836 ExtraFlags = FC_ExternC;
Zachary Turner469f0762018-08-17 21:18:05 +00001837
Nico Weber63b97d22019-04-08 19:46:53 +00001838 if (MangledName.empty()) {
1839 Error = true;
1840 return nullptr;
1841 }
1842
Zachary Turner316109b2018-07-29 16:38:02 +00001843 FuncClass FC = demangleFunctionClass(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001844 FC = FuncClass(ExtraFlags | FC);
1845
Zachary Turner03312862018-08-27 03:48:03 +00001846 FunctionSignatureNode *FSN = nullptr;
1847 ThunkSignatureNode *TTN = nullptr;
1848 if (FC & FC_StaticThisAdjust) {
1849 TTN = Arena.alloc<ThunkSignatureNode>();
1850 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
1851 } else if (FC & FC_VirtualThisAdjust) {
1852 TTN = Arena.alloc<ThunkSignatureNode>();
1853 if (FC & FC_VirtualThisAdjustEx) {
1854 TTN->ThisAdjust.VBPtrOffset = demangleSigned(MangledName);
1855 TTN->ThisAdjust.VBOffsetOffset = demangleSigned(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001856 }
Zachary Turner03312862018-08-27 03:48:03 +00001857 TTN->ThisAdjust.VtordispOffset = demangleSigned(MangledName);
1858 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001859 }
1860
Zachary Turner03312862018-08-27 03:48:03 +00001861 if (FC & FC_NoParameterList) {
Zachary Turner29ec67b2018-08-10 21:09:05 +00001862 // This is an extern "C" function whose full signature hasn't been mangled.
1863 // This happens when we need to mangle a local symbol inside of an extern
1864 // "C" function.
Zachary Turner03312862018-08-27 03:48:03 +00001865 FSN = Arena.alloc<FunctionSignatureNode>();
Zachary Turner29ec67b2018-08-10 21:09:05 +00001866 } else {
Zachary Turner03312862018-08-27 03:48:03 +00001867 bool HasThisQuals = !(FC & (FC_Global | FC_Static));
1868 FSN = demangleFunctionType(MangledName, HasThisQuals);
Zachary Turner29ec67b2018-08-10 21:09:05 +00001869 }
Nico Weber63b97d22019-04-08 19:46:53 +00001870
1871 if (Error)
1872 return nullptr;
1873
Zachary Turner03312862018-08-27 03:48:03 +00001874 if (TTN) {
1875 *static_cast<FunctionSignatureNode *>(TTN) = *FSN;
1876 FSN = TTN;
1877 }
1878 FSN->FunctionClass = FC;
Zachary Turner38b78a72018-07-26 20:20:10 +00001879
Zachary Turner03312862018-08-27 03:48:03 +00001880 FunctionSymbolNode *Symbol = Arena.alloc<FunctionSymbolNode>();
1881 Symbol->Signature = FSN;
1882 return Symbol;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001883}
1884
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001885CustomTypeNode *Demangler::demangleCustomType(StringView &MangledName) {
1886 assert(MangledName.startsWith('?'));
1887 MangledName.popFront();
1888
1889 CustomTypeNode *CTN = Arena.alloc<CustomTypeNode>();
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001890 CTN->Identifier = demangleUnqualifiedTypeName(MangledName, /*Memorize=*/true);
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001891 if (!MangledName.consumeFront('@'))
1892 Error = true;
1893 if (Error)
1894 return nullptr;
1895 return CTN;
1896}
1897
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001898// Reads a primitive type.
Zachary Turner03312862018-08-27 03:48:03 +00001899PrimitiveTypeNode *Demangler::demanglePrimitiveType(StringView &MangledName) {
1900 if (MangledName.consumeFront("$$T"))
1901 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Nullptr);
Zachary Turner931e8792018-07-30 23:02:10 +00001902
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001903 switch (MangledName.popFront()) {
1904 case 'X':
Zachary Turner03312862018-08-27 03:48:03 +00001905 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Void);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001906 case 'D':
Zachary Turner03312862018-08-27 03:48:03 +00001907 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001908 case 'C':
Zachary Turner03312862018-08-27 03:48:03 +00001909 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Schar);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001910 case 'E':
Zachary Turner03312862018-08-27 03:48:03 +00001911 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uchar);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001912 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00001913 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Short);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001914 case 'G':
Zachary Turner03312862018-08-27 03:48:03 +00001915 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ushort);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001916 case 'H':
Zachary Turner03312862018-08-27 03:48:03 +00001917 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001918 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00001919 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001920 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001921 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Long);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001922 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001923 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ulong);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001924 case 'M':
Zachary Turner03312862018-08-27 03:48:03 +00001925 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Float);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001926 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001927 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Double);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001928 case 'O':
Zachary Turner03312862018-08-27 03:48:03 +00001929 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ldouble);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001930 case '_': {
Zachary Turner91ecedd2018-07-20 18:07:33 +00001931 if (MangledName.empty()) {
1932 Error = true;
1933 return nullptr;
1934 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001935 switch (MangledName.popFront()) {
1936 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001937 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Bool);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001938 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001939 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int64);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001940 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001941 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint64);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001942 case 'W':
Zachary Turner03312862018-08-27 03:48:03 +00001943 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Wchar);
Zachary Turner931e8792018-07-30 23:02:10 +00001944 case 'S':
Zachary Turner03312862018-08-27 03:48:03 +00001945 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char16);
Zachary Turner931e8792018-07-30 23:02:10 +00001946 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001947 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char32);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001948 }
1949 break;
1950 }
1951 }
Zachary Turner03312862018-08-27 03:48:03 +00001952 Error = true;
1953 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001954}
1955
Zachary Turner03312862018-08-27 03:48:03 +00001956TagTypeNode *Demangler::demangleClassType(StringView &MangledName) {
1957 TagTypeNode *TT = nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001958
1959 switch (MangledName.popFront()) {
1960 case 'T':
Zachary Turner03312862018-08-27 03:48:03 +00001961 TT = Arena.alloc<TagTypeNode>(TagKind::Union);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001962 break;
1963 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001964 TT = Arena.alloc<TagTypeNode>(TagKind::Struct);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001965 break;
1966 case 'V':
Zachary Turner03312862018-08-27 03:48:03 +00001967 TT = Arena.alloc<TagTypeNode>(TagKind::Class);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001968 break;
1969 case 'W':
Nico Webere5b62652019-04-11 22:59:25 +00001970 if (!MangledName.consumeFront('4')) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001971 Error = true;
1972 return nullptr;
1973 }
Zachary Turner03312862018-08-27 03:48:03 +00001974 TT = Arena.alloc<TagTypeNode>(TagKind::Enum);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001975 break;
1976 default:
1977 assert(false);
1978 }
1979
Zachary Turner03312862018-08-27 03:48:03 +00001980 TT->QualifiedName = demangleFullyQualifiedTypeName(MangledName);
1981 return TT;
Zachary Turnerd742d642018-07-26 19:56:09 +00001982}
1983
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001984// <pointer-type> ::= E? <pointer-cvr-qualifiers> <ext-qualifiers> <type>
1985// # the E is required for 64-bit non-static pointers
Zachary Turner03312862018-08-27 03:48:03 +00001986PointerTypeNode *Demangler::demanglePointerType(StringView &MangledName) {
1987 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001988
Zachary Turner931e8792018-07-30 23:02:10 +00001989 std::tie(Pointer->Quals, Pointer->Affinity) =
1990 demanglePointerCVQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001991
1992 if (MangledName.consumeFront("6")) {
Zachary Turner03312862018-08-27 03:48:03 +00001993 Pointer->Pointee = demangleFunctionType(MangledName, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001994 return Pointer;
1995 }
1996
Zachary Turner316109b2018-07-29 16:38:02 +00001997 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001998 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
1999
Zachary Turner316109b2018-07-29 16:38:02 +00002000 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Mangle);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002001 return Pointer;
2002}
2003
Zachary Turner03312862018-08-27 03:48:03 +00002004PointerTypeNode *Demangler::demangleMemberPointerType(StringView &MangledName) {
2005 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
Zachary Turnerd742d642018-07-26 19:56:09 +00002006
Zachary Turner03312862018-08-27 03:48:03 +00002007 std::tie(Pointer->Quals, Pointer->Affinity) =
2008 demanglePointerCVQualifiers(MangledName);
2009 assert(Pointer->Affinity == PointerAffinity::Pointer);
Zachary Turnerd742d642018-07-26 19:56:09 +00002010
Zachary Turner316109b2018-07-29 16:38:02 +00002011 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00002012 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
2013
Nico Weber63b97d22019-04-08 19:46:53 +00002014 // isMemberPointer() only returns true if there is at least one character
2015 // after the qualifiers.
Zachary Turner38b78a72018-07-26 20:20:10 +00002016 if (MangledName.consumeFront("8")) {
Zachary Turner32a8a202018-08-29 23:56:09 +00002017 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
Zachary Turner03312862018-08-27 03:48:03 +00002018 Pointer->Pointee = demangleFunctionType(MangledName, true);
Zachary Turner38b78a72018-07-26 20:20:10 +00002019 } else {
2020 Qualifiers PointeeQuals = Q_None;
2021 bool IsMember = false;
Zachary Turner316109b2018-07-29 16:38:02 +00002022 std::tie(PointeeQuals, IsMember) = demangleQualifiers(MangledName);
Nico Weber63b97d22019-04-08 19:46:53 +00002023 assert(IsMember || Error);
Zachary Turner32a8a202018-08-29 23:56:09 +00002024 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00002025
Zachary Turner316109b2018-07-29 16:38:02 +00002026 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Drop);
Nico Weber63b97d22019-04-08 19:46:53 +00002027 if (Pointer->Pointee)
2028 Pointer->Pointee->Quals = PointeeQuals;
Zachary Turner38b78a72018-07-26 20:20:10 +00002029 }
2030
Zachary Turnerd742d642018-07-26 19:56:09 +00002031 return Pointer;
2032}
2033
Zachary Turner316109b2018-07-29 16:38:02 +00002034Qualifiers Demangler::demanglePointerExtQualifiers(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002035 Qualifiers Quals = Q_None;
2036 if (MangledName.consumeFront('E'))
2037 Quals = Qualifiers(Quals | Q_Pointer64);
2038 if (MangledName.consumeFront('I'))
2039 Quals = Qualifiers(Quals | Q_Restrict);
2040 if (MangledName.consumeFront('F'))
2041 Quals = Qualifiers(Quals | Q_Unaligned);
2042
2043 return Quals;
2044}
2045
Zachary Turner03312862018-08-27 03:48:03 +00002046ArrayTypeNode *Demangler::demangleArrayType(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002047 assert(MangledName.front() == 'Y');
2048 MangledName.popFront();
2049
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002050 uint64_t Rank = 0;
2051 bool IsNegative = false;
2052 std::tie(Rank, IsNegative) = demangleNumber(MangledName);
2053 if (IsNegative || Rank == 0) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002054 Error = true;
2055 return nullptr;
2056 }
2057
Zachary Turner03312862018-08-27 03:48:03 +00002058 ArrayTypeNode *ATy = Arena.alloc<ArrayTypeNode>();
2059 NodeList *Head = Arena.alloc<NodeList>();
2060 NodeList *Tail = Head;
2061
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002062 for (uint64_t I = 0; I < Rank; ++I) {
Zachary Turner03312862018-08-27 03:48:03 +00002063 uint64_t D = 0;
2064 std::tie(D, IsNegative) = demangleNumber(MangledName);
Nico Weber16725812019-04-03 23:27:18 +00002065 if (Error || IsNegative) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002066 Error = true;
2067 return nullptr;
2068 }
Zachary Turner03312862018-08-27 03:48:03 +00002069 Tail->N = Arena.alloc<IntegerLiteralNode>(D, IsNegative);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002070 if (I + 1 < Rank) {
Zachary Turner03312862018-08-27 03:48:03 +00002071 Tail->Next = Arena.alloc<NodeList>();
2072 Tail = Tail->Next;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002073 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002074 }
Zachary Turner03312862018-08-27 03:48:03 +00002075 ATy->Dimensions = nodeListToNodeArray(Arena, Head, Rank);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002076
2077 if (MangledName.consumeFront("$$C")) {
Zachary Turner2bbb23b2018-08-14 18:54:28 +00002078 bool IsMember = false;
2079 std::tie(ATy->Quals, IsMember) = demangleQualifiers(MangledName);
2080 if (IsMember) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002081 Error = true;
Zachary Turner2bbb23b2018-08-14 18:54:28 +00002082 return nullptr;
2083 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002084 }
2085
Zachary Turner316109b2018-07-29 16:38:02 +00002086 ATy->ElementType = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002087 return ATy;
2088}
2089
2090// Reads a function or a template parameters.
Zachary Turner03312862018-08-27 03:48:03 +00002091NodeArrayNode *
Zachary Turnerd30700f2018-07-31 17:16:44 +00002092Demangler::demangleFunctionParameterList(StringView &MangledName) {
Zachary Turner38b78a72018-07-26 20:20:10 +00002093 // Empty parameter list.
Zachary Turner38b78a72018-07-26 20:20:10 +00002094 if (MangledName.consumeFront('X'))
Nico Weber930994c2019-04-16 14:24:42 +00002095 return nullptr;
Zachary Turner38b78a72018-07-26 20:20:10 +00002096
Zachary Turner03312862018-08-27 03:48:03 +00002097 NodeList *Head = Arena.alloc<NodeList>();
2098 NodeList **Current = &Head;
2099 size_t Count = 0;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002100 while (!Error && !MangledName.startsWith('@') &&
2101 !MangledName.startsWith('Z')) {
Zachary Turner03312862018-08-27 03:48:03 +00002102 ++Count;
Zachary Turner23df1312018-07-26 22:13:39 +00002103
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002104 if (startsWithDigit(MangledName)) {
Zachary Turner30375de2018-07-26 22:24:01 +00002105 size_t N = MangledName[0] - '0';
Zachary Turnerd346cba2018-08-08 17:17:04 +00002106 if (N >= Backrefs.FunctionParamCount) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002107 Error = true;
Nico Weber930994c2019-04-16 14:24:42 +00002108 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002109 }
2110 MangledName = MangledName.dropFront();
2111
Zachary Turner03312862018-08-27 03:48:03 +00002112 *Current = Arena.alloc<NodeList>();
2113 (*Current)->N = Backrefs.FunctionParams[N];
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002114 Current = &(*Current)->Next;
2115 continue;
2116 }
2117
Zachary Turner23df1312018-07-26 22:13:39 +00002118 size_t OldSize = MangledName.size();
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002119
Zachary Turner03312862018-08-27 03:48:03 +00002120 *Current = Arena.alloc<NodeList>();
2121 TypeNode *TN = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turner8fb9a712018-12-14 18:10:13 +00002122 if (!TN || Error)
2123 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00002124
2125 (*Current)->N = TN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002126
Zachary Turner23df1312018-07-26 22:13:39 +00002127 size_t CharsConsumed = OldSize - MangledName.size();
2128 assert(CharsConsumed != 0);
2129
2130 // Single-letter types are ignored for backreferences because memorizing
2131 // them doesn't save anything.
Zachary Turnerd346cba2018-08-08 17:17:04 +00002132 if (Backrefs.FunctionParamCount <= 9 && CharsConsumed > 1)
Zachary Turner03312862018-08-27 03:48:03 +00002133 Backrefs.FunctionParams[Backrefs.FunctionParamCount++] = TN;
Zachary Turner23df1312018-07-26 22:13:39 +00002134
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002135 Current = &(*Current)->Next;
2136 }
2137
Zachary Turner38b78a72018-07-26 20:20:10 +00002138 if (Error)
Nico Weber930994c2019-04-16 14:24:42 +00002139 return nullptr;
Zachary Turner38b78a72018-07-26 20:20:10 +00002140
Zachary Turner03312862018-08-27 03:48:03 +00002141 NodeArrayNode *NA = nodeListToNodeArray(Arena, Head, Count);
Zachary Turner38b78a72018-07-26 20:20:10 +00002142 // A non-empty parameter list is terminated by either 'Z' (variadic) parameter
2143 // list or '@' (non variadic). Careful not to consume "@Z", as in that case
2144 // the following Z could be a throw specifier.
2145 if (MangledName.consumeFront('@'))
Zachary Turner03312862018-08-27 03:48:03 +00002146 return NA;
Zachary Turner38b78a72018-07-26 20:20:10 +00002147
2148 if (MangledName.consumeFront('Z')) {
Zachary Turner03312862018-08-27 03:48:03 +00002149 // This is a variadic parameter list. We probably need a variadic node to
2150 // append to the end.
2151 return NA;
Zachary Turner38b78a72018-07-26 20:20:10 +00002152 }
2153
2154 Error = true;
Nico Weber930994c2019-04-16 14:24:42 +00002155 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002156}
2157
Zachary Turner03312862018-08-27 03:48:03 +00002158NodeArrayNode *
Zachary Turnerd30700f2018-07-31 17:16:44 +00002159Demangler::demangleTemplateParameterList(StringView &MangledName) {
Zachary Turner03312862018-08-27 03:48:03 +00002160 NodeList *Head;
2161 NodeList **Current = &Head;
2162 size_t Count = 0;
2163
Zachary Turner23df1312018-07-26 22:13:39 +00002164 while (!Error && !MangledName.startsWith('@')) {
Zachary Turner32a8a202018-08-29 23:56:09 +00002165 if (MangledName.consumeFront("$S") || MangledName.consumeFront("$$V") ||
Zachary Turner78ab3cb2018-08-30 20:53:29 +00002166 MangledName.consumeFront("$$$V") || MangledName.consumeFront("$$Z")) {
2167 // parameter pack separator
Zachary Turner32a8a202018-08-29 23:56:09 +00002168 continue;
2169 }
2170
Zachary Turner03312862018-08-27 03:48:03 +00002171 ++Count;
Zachary Turner32a8a202018-08-29 23:56:09 +00002172
Zachary Turner23df1312018-07-26 22:13:39 +00002173 // Template parameter lists don't participate in back-referencing.
Zachary Turner03312862018-08-27 03:48:03 +00002174 *Current = Arena.alloc<NodeList>();
Zachary Turner931e8792018-07-30 23:02:10 +00002175
Zachary Turner03312862018-08-27 03:48:03 +00002176 NodeList &TP = **Current;
Zachary Turner66555a72018-08-20 19:15:35 +00002177
Zachary Turner03312862018-08-27 03:48:03 +00002178 TemplateParameterReferenceNode *TPRN = nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +00002179 if (MangledName.consumeFront("$$Y")) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002180 // Template alias
Zachary Turner03312862018-08-27 03:48:03 +00002181 TP.N = demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002182 } else if (MangledName.consumeFront("$$B")) {
2183 // Array
Zachary Turner03312862018-08-27 03:48:03 +00002184 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turner073620b2018-08-10 19:57:36 +00002185 } else if (MangledName.consumeFront("$$C")) {
2186 // Type has qualifiers.
Zachary Turner03312862018-08-27 03:48:03 +00002187 TP.N = demangleType(MangledName, QualifierMangleMode::Mangle);
Zachary Turner66555a72018-08-20 19:15:35 +00002188 } else if (MangledName.startsWith("$1") || MangledName.startsWith("$H") ||
2189 MangledName.startsWith("$I") || MangledName.startsWith("$J")) {
Zachary Turner03312862018-08-27 03:48:03 +00002190 // Pointer to member
2191 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2192 TPRN->IsMemberPointer = true;
2193
Zachary Turner66555a72018-08-20 19:15:35 +00002194 MangledName = MangledName.dropFront();
2195 // 1 - single inheritance <name>
2196 // H - multiple inheritance <name> <number>
2197 // I - virtual inheritance <name> <number> <number> <number>
2198 // J - unspecified inheritance <name> <number> <number> <number>
2199 char InheritanceSpecifier = MangledName.popFront();
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00002200 SymbolNode *S = nullptr;
2201 if (MangledName.startsWith('?')) {
2202 S = parse(MangledName);
Nico Weber09fb2022019-05-22 15:53:23 +00002203 if (Error || !S->Name) {
2204 Error = true;
Nico Weberf2d8f092019-04-11 22:23:35 +00002205 return nullptr;
Nico Weber09fb2022019-05-22 15:53:23 +00002206 }
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00002207 memorizeIdentifier(S->Name->getUnqualifiedIdentifier());
2208 }
2209
Zachary Turner66555a72018-08-20 19:15:35 +00002210 switch (InheritanceSpecifier) {
2211 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00002212 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2213 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002214 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002215 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00002216 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2217 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002218 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002219 case 'H':
Zachary Turner03312862018-08-27 03:48:03 +00002220 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2221 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002222 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002223 case '1':
2224 break;
2225 default:
2226 Error = true;
2227 break;
2228 }
Zachary Turner03312862018-08-27 03:48:03 +00002229 TPRN->Affinity = PointerAffinity::Pointer;
2230 TPRN->Symbol = S;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002231 } else if (MangledName.startsWith("$E?")) {
2232 MangledName.consumeFront("$E");
2233 // Reference to symbol
Zachary Turner03312862018-08-27 03:48:03 +00002234 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2235 TPRN->Symbol = parse(MangledName);
2236 TPRN->Affinity = PointerAffinity::Reference;
Zachary Turner66555a72018-08-20 19:15:35 +00002237 } else if (MangledName.startsWith("$F") || MangledName.startsWith("$G")) {
Zachary Turner03312862018-08-27 03:48:03 +00002238 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2239
Zachary Turner66555a72018-08-20 19:15:35 +00002240 // Data member pointer.
2241 MangledName = MangledName.dropFront();
2242 char InheritanceSpecifier = MangledName.popFront();
2243
2244 switch (InheritanceSpecifier) {
2245 case 'G':
Zachary Turner03312862018-08-27 03:48:03 +00002246 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2247 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002248 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002249 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00002250 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2251 demangleSigned(MangledName);
2252 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2253 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002254 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002255 case '0':
2256 break;
2257 default:
2258 Error = true;
2259 break;
2260 }
Zachary Turner03312862018-08-27 03:48:03 +00002261 TPRN->IsMemberPointer = true;
Zachary Turner66555a72018-08-20 19:15:35 +00002262
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002263 } else if (MangledName.consumeFront("$0")) {
2264 // Integral non-type template parameter
2265 bool IsNegative = false;
2266 uint64_t Value = 0;
2267 std::tie(Value, IsNegative) = demangleNumber(MangledName);
2268
Zachary Turner03312862018-08-27 03:48:03 +00002269 TP.N = Arena.alloc<IntegerLiteralNode>(Value, IsNegative);
Zachary Turnerd30700f2018-07-31 17:16:44 +00002270 } else {
Zachary Turner03312862018-08-27 03:48:03 +00002271 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turnerd30700f2018-07-31 17:16:44 +00002272 }
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002273 if (Error)
2274 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002275
Zachary Turner66555a72018-08-20 19:15:35 +00002276 Current = &TP.Next;
Zachary Turner23df1312018-07-26 22:13:39 +00002277 }
2278
2279 if (Error)
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002280 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002281
2282 // Template parameter lists cannot be variadic, so it can only be terminated
2283 // by @.
2284 if (MangledName.consumeFront('@'))
Zachary Turner03312862018-08-27 03:48:03 +00002285 return nodeListToNodeArray(Arena, Head, Count);
Zachary Turner23df1312018-07-26 22:13:39 +00002286 Error = true;
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002287 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002288}
2289
Zachary Turner3a758e22018-08-01 18:33:04 +00002290void Demangler::dumpBackReferences() {
Zachary Turner5ae08b82018-08-01 18:44:12 +00002291 std::printf("%d function parameter backreferences\n",
Zachary Turnerd346cba2018-08-08 17:17:04 +00002292 (int)Backrefs.FunctionParamCount);
Zachary Turner3a758e22018-08-01 18:33:04 +00002293
2294 // Create an output stream so we can render each type.
Nico Weber1359d652018-09-15 18:24:20 +00002295 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +00002296 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00002297 std::terminate();
Zachary Turnerd346cba2018-08-08 17:17:04 +00002298 for (size_t I = 0; I < Backrefs.FunctionParamCount; ++I) {
Zachary Turner3a758e22018-08-01 18:33:04 +00002299 OS.setCurrentPosition(0);
2300
Zachary Turner03312862018-08-27 03:48:03 +00002301 TypeNode *T = Backrefs.FunctionParams[I];
Zachary Turner38d2edd2018-08-29 03:59:17 +00002302 T->output(OS, OF_Default);
Zachary Turner3a758e22018-08-01 18:33:04 +00002303
Zachary Turner7563ebe2018-08-02 17:08:24 +00002304 std::printf(" [%d] - %.*s\n", (int)I, (int)OS.getCurrentPosition(),
Zachary Turner5ae08b82018-08-01 18:44:12 +00002305 OS.getBuffer());
Zachary Turner3a758e22018-08-01 18:33:04 +00002306 }
2307 std::free(OS.getBuffer());
2308
Zachary Turnerd346cba2018-08-08 17:17:04 +00002309 if (Backrefs.FunctionParamCount > 0)
Zachary Turner5ae08b82018-08-01 18:44:12 +00002310 std::printf("\n");
Zachary Turnerd346cba2018-08-08 17:17:04 +00002311 std::printf("%d name backreferences\n", (int)Backrefs.NamesCount);
2312 for (size_t I = 0; I < Backrefs.NamesCount; ++I) {
Zachary Turner03312862018-08-27 03:48:03 +00002313 std::printf(" [%d] - %.*s\n", (int)I, (int)Backrefs.Names[I]->Name.size(),
2314 Backrefs.Names[I]->Name.begin());
Zachary Turner3a758e22018-08-01 18:33:04 +00002315 }
Zachary Turnerd346cba2018-08-08 17:17:04 +00002316 if (Backrefs.NamesCount > 0)
Zachary Turner5ae08b82018-08-01 18:44:12 +00002317 std::printf("\n");
Zachary Turner3a758e22018-08-01 18:33:04 +00002318}
2319
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002320char *llvm::microsoftDemangle(const char *MangledName, char *Buf, size_t *N,
Zachary Turner3a758e22018-08-01 18:33:04 +00002321 int *Status, MSDemangleFlags Flags) {
Nico Weber1359d652018-09-15 18:24:20 +00002322 int InternalStatus = demangle_success;
Zachary Turner316109b2018-07-29 16:38:02 +00002323 Demangler D;
Nico Weber1359d652018-09-15 18:24:20 +00002324 OutputStream S;
2325
Zachary Turner316109b2018-07-29 16:38:02 +00002326 StringView Name{MangledName};
Nico Weber1359d652018-09-15 18:24:20 +00002327 SymbolNode *AST = D.parse(Name);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002328
Zachary Turner3a758e22018-08-01 18:33:04 +00002329 if (Flags & MSDF_DumpBackrefs)
2330 D.dumpBackReferences();
Nico Weber1359d652018-09-15 18:24:20 +00002331
2332 if (D.Error)
2333 InternalStatus = demangle_invalid_mangled_name;
Nico Weber6808bc02018-11-11 10:04:00 +00002334 else if (!initializeOutputStream(Buf, N, S, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00002335 InternalStatus = demangle_memory_alloc_failure;
2336 else {
2337 AST->output(S, OF_Default);
2338 S += '\0';
2339 if (N != nullptr)
2340 *N = S.getCurrentPosition();
2341 Buf = S.getBuffer();
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002342 }
2343
Nico Weber1359d652018-09-15 18:24:20 +00002344 if (Status)
2345 *Status = InternalStatus;
2346 return InternalStatus == demangle_success ? Buf : nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002347}