blob: ed9052f40570abb7a094f383c07e9a1e60092617 [file] [log] [blame]
//===- MicrosoftDemangle.cpp ----------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file defines a demangler for MSVC-style mangled symbols.
//
// This file has no dependencies on the rest of LLVM so that it can be
// easily reused in other programs such as libcxxabi.
//
//===----------------------------------------------------------------------===//
15
#include "llvm/Demangle/MicrosoftDemangle.h"
#include "llvm/Demangle/Demangle.h"
#include "llvm/Demangle/MicrosoftDemangleNodes.h"

#include "llvm/Demangle/DemangleConfig.h"
#include "llvm/Demangle/StringView.h"
#include "llvm/Demangle/Utility.h"

#include <array>
#include <cctype>
#include <cstdio>
#include <cstring>
#include <tuple>
Zachary Turnerf435a7e2018-07-20 17:27:48 +000028
Zachary Turner03312862018-08-27 03:48:03 +000029using namespace llvm;
30using namespace ms_demangle;
Zachary Turnerf435a7e2018-07-20 17:27:48 +000031
32static bool startsWithDigit(StringView S) {
33 return !S.empty() && std::isdigit(S.front());
34}
35
Zachary Turnerd742d642018-07-26 19:56:09 +000036
Zachary Turner03312862018-08-27 03:48:03 +000037struct NodeList {
38 Node *N = nullptr;
39 NodeList *Next = nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +000040};
41
Zachary Turner8fb9a712018-12-14 18:10:13 +000042static bool isMemberPointer(StringView MangledName, bool &Error) {
43 Error = false;
Zachary Turnerd742d642018-07-26 19:56:09 +000044 switch (MangledName.popFront()) {
Zachary Turner931e8792018-07-30 23:02:10 +000045 case '$':
46 // This is probably an rvalue reference (e.g. $$Q), and you cannot have an
47 // rvalue reference to a member.
48 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +000049 case 'A':
50 // 'A' indicates a reference, and you cannot have a reference to a member
Zachary Turner931e8792018-07-30 23:02:10 +000051 // function or member.
Zachary Turnerd742d642018-07-26 19:56:09 +000052 return false;
53 case 'P':
54 case 'Q':
55 case 'R':
56 case 'S':
57 // These 4 values indicate some kind of pointer, but we still don't know
58 // what.
59 break;
60 default:
Zachary Turner8fb9a712018-12-14 18:10:13 +000061 Error = true;
62 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +000063 }
64
65 // If it starts with a number, then 6 indicates a non-member function
66 // pointer, and 8 indicates a member function pointer.
67 if (startsWithDigit(MangledName)) {
Nico Weber63b97d22019-04-08 19:46:53 +000068 if (MangledName[0] != '6' && MangledName[0] != '8') {
69 Error = true;
70 return false;
71 }
Zachary Turnerd742d642018-07-26 19:56:09 +000072 return (MangledName[0] == '8');
73 }
74
75 // Remove ext qualifiers since those can appear on either type and are
76 // therefore not indicative.
77 MangledName.consumeFront('E'); // 64-bit
78 MangledName.consumeFront('I'); // restrict
79 MangledName.consumeFront('F'); // unaligned
80
Nico Weber63b97d22019-04-08 19:46:53 +000081 if (MangledName.empty()) {
82 Error = true;
83 return false;
84 }
Zachary Turnerd742d642018-07-26 19:56:09 +000085
86 // The next value should be either ABCD (non-member) or QRST (member).
87 switch (MangledName.front()) {
88 case 'A':
89 case 'B':
90 case 'C':
91 case 'D':
92 return false;
93 case 'Q':
94 case 'R':
95 case 'S':
96 case 'T':
97 return true;
98 default:
Zachary Turner8fb9a712018-12-14 18:10:13 +000099 Error = true;
100 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +0000101 }
Zachary Turnerd742d642018-07-26 19:56:09 +0000102}
103
Zachary Turner03312862018-08-27 03:48:03 +0000104static SpecialIntrinsicKind
105consumeSpecialIntrinsicKind(StringView &MangledName) {
106 if (MangledName.consumeFront("?_7"))
107 return SpecialIntrinsicKind::Vftable;
108 if (MangledName.consumeFront("?_8"))
109 return SpecialIntrinsicKind::Vbtable;
110 if (MangledName.consumeFront("?_9"))
111 return SpecialIntrinsicKind::VcallThunk;
112 if (MangledName.consumeFront("?_A"))
113 return SpecialIntrinsicKind::Typeof;
114 if (MangledName.consumeFront("?_B"))
115 return SpecialIntrinsicKind::LocalStaticGuard;
116 if (MangledName.consumeFront("?_C"))
117 return SpecialIntrinsicKind::StringLiteralSymbol;
118 if (MangledName.consumeFront("?_P"))
119 return SpecialIntrinsicKind::UdtReturning;
120 if (MangledName.consumeFront("?_R0"))
121 return SpecialIntrinsicKind::RttiTypeDescriptor;
122 if (MangledName.consumeFront("?_R1"))
123 return SpecialIntrinsicKind::RttiBaseClassDescriptor;
124 if (MangledName.consumeFront("?_R2"))
125 return SpecialIntrinsicKind::RttiBaseClassArray;
126 if (MangledName.consumeFront("?_R3"))
127 return SpecialIntrinsicKind::RttiClassHierarchyDescriptor;
128 if (MangledName.consumeFront("?_R4"))
129 return SpecialIntrinsicKind::RttiCompleteObjLocator;
130 if (MangledName.consumeFront("?_S"))
131 return SpecialIntrinsicKind::LocalVftable;
132 if (MangledName.consumeFront("?__E"))
133 return SpecialIntrinsicKind::DynamicInitializer;
134 if (MangledName.consumeFront("?__F"))
135 return SpecialIntrinsicKind::DynamicAtexitDestructor;
136 if (MangledName.consumeFront("?__J"))
137 return SpecialIntrinsicKind::LocalStaticThreadGuard;
138 return SpecialIntrinsicKind::None;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000139}
140
Zachary Turner71c91f92018-07-30 03:12:34 +0000141static bool startsWithLocalScopePattern(StringView S) {
142 if (!S.consumeFront('?'))
143 return false;
144 if (S.size() < 2)
145 return false;
146
147 size_t End = S.find('?');
148 if (End == StringView::npos)
149 return false;
150 StringView Candidate = S.substr(0, End);
151 if (Candidate.empty())
152 return false;
153
154 // \?[0-9]\?
155 // ?@? is the discriminator 0.
156 if (Candidate.size() == 1)
157 return Candidate[0] == '@' || (Candidate[0] >= '0' && Candidate[0] <= '9');
158
159 // If it's not 0-9, then it's an encoded number terminated with an @
160 if (Candidate.back() != '@')
161 return false;
162 Candidate = Candidate.dropBack();
163
164 // An encoded number starts with B-P and all subsequent digits are in A-P.
165 // Note that the reason the first digit cannot be A is two fold. First, it
166 // would create an ambiguity with ?A which delimits the beginning of an
167 // anonymous namespace. Second, A represents 0, and you don't start a multi
168 // digit number with a leading 0. Presumably the anonymous namespace
169 // ambiguity is also why single digit encoded numbers use 0-9 rather than A-J.
170 if (Candidate[0] < 'B' || Candidate[0] > 'P')
171 return false;
172 Candidate = Candidate.dropFront();
173 while (!Candidate.empty()) {
174 if (Candidate[0] < 'A' || Candidate[0] > 'P')
175 return false;
176 Candidate = Candidate.dropFront();
177 }
178
179 return true;
180}
181
Zachary Turner03312862018-08-27 03:48:03 +0000182static bool isTagType(StringView S) {
183 switch (S.front()) {
184 case 'T': // union
185 case 'U': // struct
186 case 'V': // class
187 case 'W': // enum
188 return true;
Zachary Turner38b78a72018-07-26 20:20:10 +0000189 }
Zachary Turner03312862018-08-27 03:48:03 +0000190 return false;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000191}
192
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000193static bool isCustomType(StringView S) { return S[0] == '?'; }
194
Zachary Turner03312862018-08-27 03:48:03 +0000195static bool isPointerType(StringView S) {
196 if (S.startsWith("$$Q")) // foo &&
197 return true;
198
199 switch (S.front()) {
200 case 'A': // foo &
201 case 'P': // foo *
202 case 'Q': // foo *const
203 case 'R': // foo *volatile
204 case 'S': // foo *const volatile
205 return true;
206 }
207 return false;
208}
209
210static bool isArrayType(StringView S) { return S[0] == 'Y'; }
211
212static bool isFunctionType(StringView S) {
213 return S.startsWith("$$A8@@") || S.startsWith("$$A6");
214}
215
216static FunctionRefQualifier
217demangleFunctionRefQualifier(StringView &MangledName) {
218 if (MangledName.consumeFront('G'))
219 return FunctionRefQualifier::Reference;
220 else if (MangledName.consumeFront('H'))
221 return FunctionRefQualifier::RValueReference;
222 return FunctionRefQualifier::None;
223}
224
225static std::pair<Qualifiers, PointerAffinity>
226demanglePointerCVQualifiers(StringView &MangledName) {
227 if (MangledName.consumeFront("$$Q"))
228 return std::make_pair(Q_None, PointerAffinity::RValueReference);
229
230 switch (MangledName.popFront()) {
231 case 'A':
232 return std::make_pair(Q_None, PointerAffinity::Reference);
233 case 'P':
234 return std::make_pair(Q_None, PointerAffinity::Pointer);
235 case 'Q':
236 return std::make_pair(Q_Const, PointerAffinity::Pointer);
237 case 'R':
238 return std::make_pair(Q_Volatile, PointerAffinity::Pointer);
239 case 'S':
240 return std::make_pair(Qualifiers(Q_Const | Q_Volatile),
241 PointerAffinity::Pointer);
Zachary Turner970fdc32018-08-16 16:17:36 +0000242 default:
Zachary Turner03312862018-08-27 03:48:03 +0000243 assert(false && "Ty is not a pointer type!");
Zachary Turner970fdc32018-08-16 16:17:36 +0000244 }
Zachary Turner03312862018-08-27 03:48:03 +0000245 return std::make_pair(Q_None, PointerAffinity::Pointer);
Zachary Turner970fdc32018-08-16 16:17:36 +0000246}
247
Zachary Turner71c91f92018-07-30 03:12:34 +0000248StringView Demangler::copyString(StringView Borrowed) {
249 char *Stable = Arena.allocUnalignedBuffer(Borrowed.size() + 1);
250 std::strcpy(Stable, Borrowed.begin());
251
252 return {Stable, Borrowed.size()};
253}
254
Zachary Turner03312862018-08-27 03:48:03 +0000255SpecialTableSymbolNode *
256Demangler::demangleSpecialTableSymbolNode(StringView &MangledName,
257 SpecialIntrinsicKind K) {
258 NamedIdentifierNode *NI = Arena.alloc<NamedIdentifierNode>();
259 switch (K) {
260 case SpecialIntrinsicKind::Vftable:
261 NI->Name = "`vftable'";
262 break;
263 case SpecialIntrinsicKind::Vbtable:
264 NI->Name = "`vbtable'";
265 break;
266 case SpecialIntrinsicKind::LocalVftable:
267 NI->Name = "`local vftable'";
268 break;
269 case SpecialIntrinsicKind::RttiCompleteObjLocator:
270 NI->Name = "`RTTI Complete Object Locator'";
271 break;
272 default:
Erik Pilkington5094e5e2019-01-17 20:37:51 +0000273 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000274 }
275 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
276 SpecialTableSymbolNode *STSN = Arena.alloc<SpecialTableSymbolNode>();
277 STSN->Name = QN;
Zachary Turner469f0762018-08-17 21:18:05 +0000278 bool IsMember = false;
Nico Weberae050d22019-04-14 23:32:37 +0000279 if (MangledName.empty()) {
280 Error = true;
281 return nullptr;
282 }
Zachary Turner03312862018-08-27 03:48:03 +0000283 char Front = MangledName.popFront();
284 if (Front != '6' && Front != '7') {
285 Error = true;
286 return nullptr;
287 }
288
289 std::tie(STSN->Quals, IsMember) = demangleQualifiers(MangledName);
290 if (!MangledName.consumeFront('@'))
291 STSN->TargetName = demangleFullyQualifiedTypeName(MangledName);
292 return STSN;
293}
294
295LocalStaticGuardVariableNode *
Nico Weber88ab2812019-05-28 14:54:49 +0000296Demangler::demangleLocalStaticGuard(StringView &MangledName, bool IsThread) {
Zachary Turner03312862018-08-27 03:48:03 +0000297 LocalStaticGuardIdentifierNode *LSGI =
298 Arena.alloc<LocalStaticGuardIdentifierNode>();
Nico Weber88ab2812019-05-28 14:54:49 +0000299 LSGI->IsThread = IsThread;
Zachary Turner03312862018-08-27 03:48:03 +0000300 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, LSGI);
301 LocalStaticGuardVariableNode *LSGVN =
302 Arena.alloc<LocalStaticGuardVariableNode>();
303 LSGVN->Name = QN;
304
305 if (MangledName.consumeFront("4IA"))
306 LSGVN->IsVisible = false;
307 else if (MangledName.consumeFront("5"))
308 LSGVN->IsVisible = true;
309 else {
310 Error = true;
311 return nullptr;
312 }
313
314 if (!MangledName.empty())
315 LSGI->ScopeIndex = demangleUnsigned(MangledName);
316 return LSGVN;
317}
318
319static NamedIdentifierNode *synthesizeNamedIdentifier(ArenaAllocator &Arena,
320 StringView Name) {
321 NamedIdentifierNode *Id = Arena.alloc<NamedIdentifierNode>();
322 Id->Name = Name;
323 return Id;
324}
325
326static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
327 IdentifierNode *Identifier) {
328 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
329 QN->Components = Arena.alloc<NodeArrayNode>();
330 QN->Components->Count = 1;
331 QN->Components->Nodes = Arena.allocArray<Node *>(1);
332 QN->Components->Nodes[0] = Identifier;
333 return QN;
334}
335
336static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
337 StringView Name) {
338 NamedIdentifierNode *Id = synthesizeNamedIdentifier(Arena, Name);
339 return synthesizeQualifiedName(Arena, Id);
340}
341
342static VariableSymbolNode *synthesizeVariable(ArenaAllocator &Arena,
343 TypeNode *Type,
344 StringView VariableName) {
345 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
346 VSN->Type = Type;
347 VSN->Name = synthesizeQualifiedName(Arena, VariableName);
348 return VSN;
349}
350
351VariableSymbolNode *Demangler::demangleUntypedVariable(
352 ArenaAllocator &Arena, StringView &MangledName, StringView VariableName) {
353 NamedIdentifierNode *NI = synthesizeNamedIdentifier(Arena, VariableName);
354 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
355 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
356 VSN->Name = QN;
357 if (MangledName.consumeFront("8"))
358 return VSN;
359
360 Error = true;
361 return nullptr;
362}
363
364VariableSymbolNode *
365Demangler::demangleRttiBaseClassDescriptorNode(ArenaAllocator &Arena,
366 StringView &MangledName) {
367 RttiBaseClassDescriptorNode *RBCDN =
368 Arena.alloc<RttiBaseClassDescriptorNode>();
369 RBCDN->NVOffset = demangleUnsigned(MangledName);
370 RBCDN->VBPtrOffset = demangleSigned(MangledName);
371 RBCDN->VBTableOffset = demangleUnsigned(MangledName);
372 RBCDN->Flags = demangleUnsigned(MangledName);
373 if (Error)
374 return nullptr;
375
376 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
377 VSN->Name = demangleNameScopeChain(MangledName, RBCDN);
378 MangledName.consumeFront('8');
379 return VSN;
380}
381
Zachary Turner32a8a202018-08-29 23:56:09 +0000382FunctionSymbolNode *Demangler::demangleInitFiniStub(StringView &MangledName,
383 bool IsDestructor) {
Zachary Turner03312862018-08-27 03:48:03 +0000384 DynamicStructorIdentifierNode *DSIN =
385 Arena.alloc<DynamicStructorIdentifierNode>();
386 DSIN->IsDestructor = IsDestructor;
Zachary Turner32a8a202018-08-29 23:56:09 +0000387
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000388 bool IsKnownStaticDataMember = false;
389 if (MangledName.consumeFront('?'))
390 IsKnownStaticDataMember = true;
391
Nico Weber63b97d22019-04-08 19:46:53 +0000392 SymbolNode *Symbol = demangleDeclarator(MangledName);
393 if (Error)
394 return nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +0000395
Zachary Turner32a8a202018-08-29 23:56:09 +0000396 FunctionSymbolNode *FSN = nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +0000397
398 if (Symbol->kind() == NodeKind::VariableSymbol) {
399 DSIN->Variable = static_cast<VariableSymbolNode *>(Symbol);
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000400
401 // Older versions of clang mangled this type of symbol incorrectly. They
402 // would omit the leading ? and they would only emit a single @ at the end.
403 // The correct mangling is a leading ? and 2 trailing @ signs. Handle
404 // both cases.
405 int AtCount = IsKnownStaticDataMember ? 2 : 1;
406 for (int I = 0; I < AtCount; ++I) {
407 if (MangledName.consumeFront('@'))
408 continue;
Zachary Turner32a8a202018-08-29 23:56:09 +0000409 Error = true;
410 return nullptr;
411 }
412
413 FSN = demangleFunctionEncoding(MangledName);
Nico Weber63b97d22019-04-08 19:46:53 +0000414 if (FSN)
415 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
Zachary Turner32a8a202018-08-29 23:56:09 +0000416 } else {
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000417 if (IsKnownStaticDataMember) {
418 // This was supposed to be a static data member, but we got a function.
419 Error = true;
420 return nullptr;
421 }
422
Zachary Turner32a8a202018-08-29 23:56:09 +0000423 FSN = static_cast<FunctionSymbolNode *>(Symbol);
424 DSIN->Name = Symbol->Name;
425 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
426 }
427
Zachary Turner03312862018-08-27 03:48:03 +0000428 return FSN;
429}
430
431SymbolNode *Demangler::demangleSpecialIntrinsic(StringView &MangledName) {
432 SpecialIntrinsicKind SIK = consumeSpecialIntrinsicKind(MangledName);
433 if (SIK == SpecialIntrinsicKind::None)
434 return nullptr;
435
436 switch (SIK) {
437 case SpecialIntrinsicKind::StringLiteralSymbol:
438 return demangleStringLiteral(MangledName);
439 case SpecialIntrinsicKind::Vftable:
440 case SpecialIntrinsicKind::Vbtable:
441 case SpecialIntrinsicKind::LocalVftable:
442 case SpecialIntrinsicKind::RttiCompleteObjLocator:
443 return demangleSpecialTableSymbolNode(MangledName, SIK);
444 case SpecialIntrinsicKind::VcallThunk:
445 return demangleVcallThunkNode(MangledName);
446 case SpecialIntrinsicKind::LocalStaticGuard:
Nico Weber88ab2812019-05-28 14:54:49 +0000447 return demangleLocalStaticGuard(MangledName, /*IsThread=*/false);
448 case SpecialIntrinsicKind::LocalStaticThreadGuard:
449 return demangleLocalStaticGuard(MangledName, /*IsThread=*/true);
Zachary Turner03312862018-08-27 03:48:03 +0000450 case SpecialIntrinsicKind::RttiTypeDescriptor: {
451 TypeNode *T = demangleType(MangledName, QualifierMangleMode::Result);
Zachary Turner469f0762018-08-17 21:18:05 +0000452 if (Error)
453 break;
454 if (!MangledName.consumeFront("@8"))
Zachary Turner03312862018-08-27 03:48:03 +0000455 break;
Zachary Turner469f0762018-08-17 21:18:05 +0000456 if (!MangledName.empty())
Zachary Turner03312862018-08-27 03:48:03 +0000457 break;
458 return synthesizeVariable(Arena, T, "`RTTI Type Descriptor'");
459 }
460 case SpecialIntrinsicKind::RttiBaseClassArray:
461 return demangleUntypedVariable(Arena, MangledName,
462 "`RTTI Base Class Array'");
463 case SpecialIntrinsicKind::RttiClassHierarchyDescriptor:
464 return demangleUntypedVariable(Arena, MangledName,
465 "`RTTI Class Hierarchy Descriptor'");
466 case SpecialIntrinsicKind::RttiBaseClassDescriptor:
467 return demangleRttiBaseClassDescriptorNode(Arena, MangledName);
468 case SpecialIntrinsicKind::DynamicInitializer:
Zachary Turner32a8a202018-08-29 23:56:09 +0000469 return demangleInitFiniStub(MangledName, false);
Zachary Turner03312862018-08-27 03:48:03 +0000470 case SpecialIntrinsicKind::DynamicAtexitDestructor:
Zachary Turner32a8a202018-08-29 23:56:09 +0000471 return demangleInitFiniStub(MangledName, true);
Zachary Turner469f0762018-08-17 21:18:05 +0000472 default:
Zachary Turner469f0762018-08-17 21:18:05 +0000473 break;
474 }
Zachary Turner03312862018-08-27 03:48:03 +0000475 Error = true;
476 return nullptr;
Zachary Turner469f0762018-08-17 21:18:05 +0000477}
478
Zachary Turner03312862018-08-27 03:48:03 +0000479IdentifierNode *
480Demangler::demangleFunctionIdentifierCode(StringView &MangledName) {
481 assert(MangledName.startsWith('?'));
482 MangledName = MangledName.dropFront();
Nico Weber321de482019-04-03 23:19:39 +0000483 if (MangledName.empty()) {
484 Error = true;
485 return nullptr;
486 }
Zachary Turner03312862018-08-27 03:48:03 +0000487
488 if (MangledName.consumeFront("__"))
489 return demangleFunctionIdentifierCode(
490 MangledName, FunctionIdentifierCodeGroup::DoubleUnder);
Nico Weberb4f33bb2019-04-11 22:47:18 +0000491 if (MangledName.consumeFront("_"))
Zachary Turner03312862018-08-27 03:48:03 +0000492 return demangleFunctionIdentifierCode(MangledName,
493 FunctionIdentifierCodeGroup::Under);
494 return demangleFunctionIdentifierCode(MangledName,
495 FunctionIdentifierCodeGroup::Basic);
496}
497
498StructorIdentifierNode *
499Demangler::demangleStructorIdentifier(StringView &MangledName,
500 bool IsDestructor) {
501 StructorIdentifierNode *N = Arena.alloc<StructorIdentifierNode>();
502 N->IsDestructor = IsDestructor;
503 return N;
504}
505
506ConversionOperatorIdentifierNode *
507Demangler::demangleConversionOperatorIdentifier(StringView &MangledName) {
508 ConversionOperatorIdentifierNode *N =
509 Arena.alloc<ConversionOperatorIdentifierNode>();
510 return N;
511}
512
513LiteralOperatorIdentifierNode *
514Demangler::demangleLiteralOperatorIdentifier(StringView &MangledName) {
515 LiteralOperatorIdentifierNode *N =
516 Arena.alloc<LiteralOperatorIdentifierNode>();
Nico Weberaf2ee7d2019-04-11 23:20:18 +0000517 N->Name = demangleSimpleString(MangledName, /*Memorize=*/false);
Zachary Turner03312862018-08-27 03:48:03 +0000518 return N;
519}
520
Nico Weber03db6252019-04-11 23:11:33 +0000521IntrinsicFunctionKind
522Demangler::translateIntrinsicFunctionCode(char CH,
523 FunctionIdentifierCodeGroup Group) {
524 using IFK = IntrinsicFunctionKind;
525 if (!(CH >= '0' && CH <= '9') && !(CH >= 'A' && CH <= 'Z')) {
526 Error = true;
527 return IFK::None;
528 }
529
Zachary Turner03312862018-08-27 03:48:03 +0000530 // Not all ? identifiers are intrinsics *functions*. This function only maps
531 // operator codes for the special functions, all others are handled elsewhere,
532 // hence the IFK::None entries in the table.
Zachary Turner03312862018-08-27 03:48:03 +0000533 static IFK Basic[36] = {
534 IFK::None, // ?0 # Foo::Foo()
535 IFK::None, // ?1 # Foo::~Foo()
536 IFK::New, // ?2 # operator new
537 IFK::Delete, // ?3 # operator delete
538 IFK::Assign, // ?4 # operator=
539 IFK::RightShift, // ?5 # operator>>
540 IFK::LeftShift, // ?6 # operator<<
541 IFK::LogicalNot, // ?7 # operator!
542 IFK::Equals, // ?8 # operator==
543 IFK::NotEquals, // ?9 # operator!=
544 IFK::ArraySubscript, // ?A # operator[]
545 IFK::None, // ?B # Foo::operator <type>()
546 IFK::Pointer, // ?C # operator->
547 IFK::Dereference, // ?D # operator*
548 IFK::Increment, // ?E # operator++
549 IFK::Decrement, // ?F # operator--
550 IFK::Minus, // ?G # operator-
551 IFK::Plus, // ?H # operator+
552 IFK::BitwiseAnd, // ?I # operator&
553 IFK::MemberPointer, // ?J # operator->*
554 IFK::Divide, // ?K # operator/
555 IFK::Modulus, // ?L # operator%
556 IFK::LessThan, // ?M operator<
557 IFK::LessThanEqual, // ?N operator<=
558 IFK::GreaterThan, // ?O operator>
559 IFK::GreaterThanEqual, // ?P operator>=
560 IFK::Comma, // ?Q operator,
561 IFK::Parens, // ?R operator()
562 IFK::BitwiseNot, // ?S operator~
563 IFK::BitwiseXor, // ?T operator^
564 IFK::BitwiseOr, // ?U operator|
565 IFK::LogicalAnd, // ?V operator&&
566 IFK::LogicalOr, // ?W operator||
567 IFK::TimesEqual, // ?X operator*=
568 IFK::PlusEqual, // ?Y operator+=
569 IFK::MinusEqual, // ?Z operator-=
570 };
571 static IFK Under[36] = {
572 IFK::DivEqual, // ?_0 operator/=
573 IFK::ModEqual, // ?_1 operator%=
574 IFK::RshEqual, // ?_2 operator>>=
575 IFK::LshEqual, // ?_3 operator<<=
576 IFK::BitwiseAndEqual, // ?_4 operator&=
577 IFK::BitwiseOrEqual, // ?_5 operator|=
578 IFK::BitwiseXorEqual, // ?_6 operator^=
579 IFK::None, // ?_7 # vftable
580 IFK::None, // ?_8 # vbtable
581 IFK::None, // ?_9 # vcall
582 IFK::None, // ?_A # typeof
583 IFK::None, // ?_B # local static guard
584 IFK::None, // ?_C # string literal
585 IFK::VbaseDtor, // ?_D # vbase destructor
586 IFK::VecDelDtor, // ?_E # vector deleting destructor
587 IFK::DefaultCtorClosure, // ?_F # default constructor closure
588 IFK::ScalarDelDtor, // ?_G # scalar deleting destructor
589 IFK::VecCtorIter, // ?_H # vector constructor iterator
590 IFK::VecDtorIter, // ?_I # vector destructor iterator
591 IFK::VecVbaseCtorIter, // ?_J # vector vbase constructor iterator
592 IFK::VdispMap, // ?_K # virtual displacement map
593 IFK::EHVecCtorIter, // ?_L # eh vector constructor iterator
594 IFK::EHVecDtorIter, // ?_M # eh vector destructor iterator
595 IFK::EHVecVbaseCtorIter, // ?_N # eh vector vbase constructor iterator
596 IFK::CopyCtorClosure, // ?_O # copy constructor closure
597 IFK::None, // ?_P<name> # udt returning <name>
598 IFK::None, // ?_Q # <unknown>
599 IFK::None, // ?_R0 - ?_R4 # RTTI Codes
600 IFK::None, // ?_S # local vftable
601 IFK::LocalVftableCtorClosure, // ?_T # local vftable constructor closure
602 IFK::ArrayNew, // ?_U operator new[]
603 IFK::ArrayDelete, // ?_V operator delete[]
604 IFK::None, // ?_W <unused>
605 IFK::None, // ?_X <unused>
606 IFK::None, // ?_Y <unused>
607 IFK::None, // ?_Z <unused>
608 };
609 static IFK DoubleUnder[36] = {
610 IFK::None, // ?__0 <unused>
611 IFK::None, // ?__1 <unused>
612 IFK::None, // ?__2 <unused>
613 IFK::None, // ?__3 <unused>
614 IFK::None, // ?__4 <unused>
615 IFK::None, // ?__5 <unused>
616 IFK::None, // ?__6 <unused>
617 IFK::None, // ?__7 <unused>
618 IFK::None, // ?__8 <unused>
619 IFK::None, // ?__9 <unused>
620 IFK::ManVectorCtorIter, // ?__A managed vector ctor iterator
621 IFK::ManVectorDtorIter, // ?__B managed vector dtor iterator
622 IFK::EHVectorCopyCtorIter, // ?__C EH vector copy ctor iterator
623 IFK::EHVectorVbaseCopyCtorIter, // ?__D EH vector vbase copy ctor iter
624 IFK::None, // ?__E dynamic initializer for `T'
625 IFK::None, // ?__F dynamic atexit destructor for `T'
626 IFK::VectorCopyCtorIter, // ?__G vector copy constructor iter
627 IFK::VectorVbaseCopyCtorIter, // ?__H vector vbase copy ctor iter
628 IFK::ManVectorVbaseCopyCtorIter, // ?__I managed vector vbase copy ctor
629 // iter
630 IFK::None, // ?__J local static thread guard
631 IFK::None, // ?__K operator ""_name
Nico Webere8f21b12019-04-23 16:20:27 +0000632 IFK::CoAwait, // ?__L operator co_await
633 IFK::Spaceship, // ?__M operator<=>
Zachary Turner03312862018-08-27 03:48:03 +0000634 IFK::None, // ?__N <unused>
635 IFK::None, // ?__O <unused>
636 IFK::None, // ?__P <unused>
637 IFK::None, // ?__Q <unused>
638 IFK::None, // ?__R <unused>
639 IFK::None, // ?__S <unused>
640 IFK::None, // ?__T <unused>
641 IFK::None, // ?__U <unused>
642 IFK::None, // ?__V <unused>
643 IFK::None, // ?__W <unused>
644 IFK::None, // ?__X <unused>
645 IFK::None, // ?__Y <unused>
646 IFK::None, // ?__Z <unused>
647 };
648
649 int Index = (CH >= '0' && CH <= '9') ? (CH - '0') : (CH - 'A' + 10);
650 switch (Group) {
651 case FunctionIdentifierCodeGroup::Basic:
652 return Basic[Index];
653 case FunctionIdentifierCodeGroup::Under:
654 return Under[Index];
655 case FunctionIdentifierCodeGroup::DoubleUnder:
656 return DoubleUnder[Index];
657 }
Erik Pilkington5094e5e2019-01-17 20:37:51 +0000658 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000659}
660
661IdentifierNode *
662Demangler::demangleFunctionIdentifierCode(StringView &MangledName,
663 FunctionIdentifierCodeGroup Group) {
Nico Weber63fe2592019-04-14 23:08:12 +0000664 if (MangledName.empty()) {
665 Error = true;
666 return nullptr;
667 }
Zachary Turner03312862018-08-27 03:48:03 +0000668 switch (Group) {
669 case FunctionIdentifierCodeGroup::Basic:
670 switch (char CH = MangledName.popFront()) {
671 case '0':
672 case '1':
673 return demangleStructorIdentifier(MangledName, CH == '1');
674 case 'B':
675 return demangleConversionOperatorIdentifier(MangledName);
676 default:
677 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
678 translateIntrinsicFunctionCode(CH, Group));
679 }
Zachary Turner03312862018-08-27 03:48:03 +0000680 case FunctionIdentifierCodeGroup::Under:
681 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
682 translateIntrinsicFunctionCode(MangledName.popFront(), Group));
683 case FunctionIdentifierCodeGroup::DoubleUnder:
684 switch (char CH = MangledName.popFront()) {
685 case 'K':
686 return demangleLiteralOperatorIdentifier(MangledName);
687 default:
688 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
689 translateIntrinsicFunctionCode(CH, Group));
690 }
691 }
Zachary Turner03312862018-08-27 03:48:03 +0000692
Nico Weberef035182019-04-11 23:23:00 +0000693 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000694}
695
696SymbolNode *Demangler::demangleEncodedSymbol(StringView &MangledName,
697 QualifiedNameNode *Name) {
Nico Weber63b97d22019-04-08 19:46:53 +0000698 if (MangledName.empty()) {
699 Error = true;
700 return nullptr;
701 }
702
Zachary Turner469f0762018-08-17 21:18:05 +0000703 // Read a variable.
704 switch (MangledName.front()) {
705 case '0':
706 case '1':
707 case '2':
708 case '3':
Zachary Turner03312862018-08-27 03:48:03 +0000709 case '4': {
710 StorageClass SC = demangleVariableStorageClass(MangledName);
711 return demangleVariableEncoding(MangledName, SC);
Zachary Turner469f0762018-08-17 21:18:05 +0000712 }
Zachary Turner03312862018-08-27 03:48:03 +0000713 }
714 FunctionSymbolNode *FSN = demangleFunctionEncoding(MangledName);
715
716 IdentifierNode *UQN = Name->getUnqualifiedIdentifier();
717 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
718 ConversionOperatorIdentifierNode *COIN =
719 static_cast<ConversionOperatorIdentifierNode *>(UQN);
Nico Weber63b97d22019-04-08 19:46:53 +0000720 if (FSN)
721 COIN->TargetType = FSN->Signature->ReturnType;
Zachary Turner03312862018-08-27 03:48:03 +0000722 }
723 return FSN;
Zachary Turner469f0762018-08-17 21:18:05 +0000724}
725
Nico Weber63b97d22019-04-08 19:46:53 +0000726SymbolNode *Demangler::demangleDeclarator(StringView &MangledName) {
727 // What follows is a main symbol name. This may include namespaces or class
728 // back references.
729 QualifiedNameNode *QN = demangleFullyQualifiedSymbolName(MangledName);
730 if (Error)
731 return nullptr;
732
733 SymbolNode *Symbol = demangleEncodedSymbol(MangledName, QN);
734 if (Error)
735 return nullptr;
736 Symbol->Name = QN;
737
738 IdentifierNode *UQN = QN->getUnqualifiedIdentifier();
739 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
740 ConversionOperatorIdentifierNode *COIN =
741 static_cast<ConversionOperatorIdentifierNode *>(UQN);
742 if (!COIN->TargetType) {
743 Error = true;
744 return nullptr;
745 }
746 }
747 return Symbol;
748}
749
Nico Weber82dc06c2019-05-27 23:10:42 +0000750SymbolNode *Demangler::demangleMD5Name(StringView &MangledName) {
751 assert(MangledName.startsWith("??@"));
752 // This is an MD5 mangled name. We can't demangle it, just return the
753 // mangled name.
754 // An MD5 mangled name is ??@ followed by 32 characters and a terminating @.
755 size_t MD5Last = MangledName.find('@', strlen("??@"));
756 if (MD5Last == StringView::npos) {
757 Error = true;
758 return nullptr;
759 }
760 const char *Start = MangledName.begin();
761 MangledName = MangledName.dropFront(MD5Last + 1);
762
763 // There are two additional special cases for MD5 names:
764 // 1. For complete object locators where the object name is long enough
765 // for the object to have an MD5 name, the complete object locator is
766 // called ??@...@??_R4@ (with a trailing "??_R4@" instead of the usual
767 // leading "??_R4". This is handled here.
768 // 2. For catchable types, in versions of MSVC before 2015 (<1900) or after
769 // 2017.2 (>= 1914), the catchable type mangling is _CT??@...@??@...@8
770 // instead of_CT??@...@8 with just one MD5 name. Since we don't yet
771 // demangle catchable types anywhere, this isn't handled for MD5 names
772 // either.
773 MangledName.consumeFront("??_R4@");
774
775 StringView MD5(Start, MangledName.begin());
776 SymbolNode *S = Arena.alloc<SymbolNode>(NodeKind::Md5Symbol);
777 S->Name = synthesizeQualifiedName(Arena, MD5);
778
779 return S;
780}
781
Zachary Turner469f0762018-08-17 21:18:05 +0000782// Parser entry point.
Zachary Turner03312862018-08-27 03:48:03 +0000783SymbolNode *Demangler::parse(StringView &MangledName) {
Nico Weber82dc06c2019-05-27 23:10:42 +0000784 if (MangledName.startsWith("??@"))
785 return demangleMD5Name(MangledName);
Zachary Turner83313f82018-08-16 16:17:17 +0000786
Nico Webercfe08bc2019-05-27 00:48:59 +0000787 // MSVC-style mangled symbols must start with '?'.
Zachary Turner03312862018-08-27 03:48:03 +0000788 if (!MangledName.startsWith('?')) {
789 Error = true;
790 return nullptr;
791 }
792
Zachary Turner469f0762018-08-17 21:18:05 +0000793 MangledName.consumeFront('?');
Zachary Turner970fdc32018-08-16 16:17:36 +0000794
Zachary Turner469f0762018-08-17 21:18:05 +0000795 // ?$ is a template instantiation, but all other names that start with ? are
796 // operators / special names.
Zachary Turner03312862018-08-27 03:48:03 +0000797 if (SymbolNode *SI = demangleSpecialIntrinsic(MangledName))
798 return SI;
Zachary Turner469f0762018-08-17 21:18:05 +0000799
Nico Weber63b97d22019-04-08 19:46:53 +0000800 return demangleDeclarator(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000801}
802
Zachary Turner7ba90562018-11-01 15:07:32 +0000803TagTypeNode *Demangler::parseTagUniqueName(StringView &MangledName) {
804 if (!MangledName.consumeFront(".?A"))
805 return nullptr;
806 MangledName.consumeFront(".?A");
807 if (MangledName.empty())
808 return nullptr;
809
810 return demangleClassType(MangledName);
811}
812
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000813// <type-encoding> ::= <storage-class> <variable-type>
814// <storage-class> ::= 0 # private static member
815// ::= 1 # protected static member
816// ::= 2 # public static member
817// ::= 3 # global
818// ::= 4 # static local
819
Zachary Turner03312862018-08-27 03:48:03 +0000820VariableSymbolNode *Demangler::demangleVariableEncoding(StringView &MangledName,
821 StorageClass SC) {
822 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000823
Zachary Turner03312862018-08-27 03:48:03 +0000824 VSN->Type = demangleType(MangledName, QualifierMangleMode::Drop);
825 VSN->SC = SC;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000826
Nico Weber63b97d22019-04-08 19:46:53 +0000827 if (Error)
828 return nullptr;
829
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000830 // <variable-type> ::= <type> <cvr-qualifiers>
831 // ::= <type> <pointee-cvr-qualifiers> # pointers, references
Zachary Turner03312862018-08-27 03:48:03 +0000832 switch (VSN->Type->kind()) {
833 case NodeKind::PointerType: {
834 PointerTypeNode *PTN = static_cast<PointerTypeNode *>(VSN->Type);
835
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000836 Qualifiers ExtraChildQuals = Q_None;
Zachary Turner03312862018-08-27 03:48:03 +0000837 PTN->Quals = Qualifiers(VSN->Type->Quals |
838 demanglePointerExtQualifiers(MangledName));
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000839
Zachary Turnerd742d642018-07-26 19:56:09 +0000840 bool IsMember = false;
Zachary Turner316109b2018-07-29 16:38:02 +0000841 std::tie(ExtraChildQuals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000842
Zachary Turner03312862018-08-27 03:48:03 +0000843 if (PTN->ClassParent) {
844 QualifiedNameNode *BackRefName =
845 demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000846 (void)BackRefName;
847 }
Zachary Turner03312862018-08-27 03:48:03 +0000848 PTN->Pointee->Quals = Qualifiers(PTN->Pointee->Quals | ExtraChildQuals);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000849
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000850 break;
851 }
852 default:
Zachary Turner03312862018-08-27 03:48:03 +0000853 VSN->Type->Quals = demangleQualifiers(MangledName).first;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000854 break;
855 }
856
Zachary Turner03312862018-08-27 03:48:03 +0000857 return VSN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000858}
859
860// Sometimes numbers are encoded in mangled symbols. For example,
861// "int (*x)[20]" is a valid C type (x is a pointer to an array of
862// length 20), so we need some way to embed numbers as part of symbols.
863// This function parses it.
864//
865// <number> ::= [?] <non-negative integer>
866//
867// <non-negative integer> ::= <decimal digit> # when 1 <= Number <= 10
Nico Weber502cf4b2019-04-18 19:30:21 +0000868// ::= <hex digit>+ @ # when Number == 0 or >= 10
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000869//
870// <hex-digit> ::= [A-P] # A = 0, B = 1, ...
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000871std::pair<uint64_t, bool> Demangler::demangleNumber(StringView &MangledName) {
872 bool IsNegative = MangledName.consumeFront('?');
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000873
874 if (startsWithDigit(MangledName)) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000875 uint64_t Ret = MangledName[0] - '0' + 1;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000876 MangledName = MangledName.dropFront(1);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000877 return {Ret, IsNegative};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000878 }
879
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000880 uint64_t Ret = 0;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000881 for (size_t i = 0; i < MangledName.size(); ++i) {
882 char C = MangledName[i];
883 if (C == '@') {
884 MangledName = MangledName.dropFront(i + 1);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000885 return {Ret, IsNegative};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000886 }
887 if ('A' <= C && C <= 'P') {
888 Ret = (Ret << 4) + (C - 'A');
889 continue;
890 }
891 break;
892 }
893
894 Error = true;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000895 return {0ULL, false};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000896}
897
Zachary Turner469f0762018-08-17 21:18:05 +0000898uint64_t Demangler::demangleUnsigned(StringView &MangledName) {
899 bool IsNegative = false;
900 uint64_t Number = 0;
901 std::tie(Number, IsNegative) = demangleNumber(MangledName);
902 if (IsNegative)
903 Error = true;
904 return Number;
905}
906
907int64_t Demangler::demangleSigned(StringView &MangledName) {
908 bool IsNegative = false;
909 uint64_t Number = 0;
910 std::tie(Number, IsNegative) = demangleNumber(MangledName);
911 if (Number > INT64_MAX)
912 Error = true;
913 int64_t I = static_cast<int64_t>(Number);
914 return IsNegative ? -I : I;
915}
916
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000917// First 10 strings can be referenced by special BackReferences ?0, ?1, ..., ?9.
918// Memorize it.
919void Demangler::memorizeString(StringView S) {
Zachary Turnerd346cba2018-08-08 17:17:04 +0000920 if (Backrefs.NamesCount >= BackrefContext::Max)
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000921 return;
Zachary Turnerd346cba2018-08-08 17:17:04 +0000922 for (size_t i = 0; i < Backrefs.NamesCount; ++i)
Zachary Turner03312862018-08-27 03:48:03 +0000923 if (S == Backrefs.Names[i]->Name)
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000924 return;
Zachary Turner03312862018-08-27 03:48:03 +0000925 NamedIdentifierNode *N = Arena.alloc<NamedIdentifierNode>();
926 N->Name = S;
927 Backrefs.Names[Backrefs.NamesCount++] = N;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000928}
929
Zachary Turner03312862018-08-27 03:48:03 +0000930NamedIdentifierNode *Demangler::demangleBackRefName(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +0000931 assert(startsWithDigit(MangledName));
Zachary Turnerd9e925f2018-08-18 18:49:48 +0000932
933 size_t I = MangledName[0] - '0';
934 if (I >= Backrefs.NamesCount) {
935 Error = true;
936 return nullptr;
937 }
938
Zachary Turner172aea12018-08-02 17:08:03 +0000939 MangledName = MangledName.dropFront();
Zachary Turner03312862018-08-27 03:48:03 +0000940 return Backrefs.Names[I];
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000941}
942
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000943void Demangler::memorizeIdentifier(IdentifierNode *Identifier) {
944 // Render this class template name into a string buffer so that we can
945 // memorize it for the purpose of back-referencing.
Nico Weber1359d652018-09-15 18:24:20 +0000946 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +0000947 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +0000948 // FIXME: Propagate out-of-memory as an error?
949 std::terminate();
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000950 Identifier->output(OS, OF_Default);
951 OS << '\0';
952 char *Name = OS.getBuffer();
953
954 StringView Owned = copyString(Name);
955 memorizeString(Owned);
956 std::free(Name);
957}
958
Zachary Turner03312862018-08-27 03:48:03 +0000959IdentifierNode *
960Demangler::demangleTemplateInstantiationName(StringView &MangledName,
961 NameBackrefBehavior NBB) {
Zachary Turnera7dffb12018-07-28 22:10:42 +0000962 assert(MangledName.startsWith("?$"));
963 MangledName.consumeFront("?$");
964
Zachary Turnerd346cba2018-08-08 17:17:04 +0000965 BackrefContext OuterContext;
966 std::swap(OuterContext, Backrefs);
Zachary Turner54d4ffe2018-08-01 18:32:28 +0000967
Zachary Turner03312862018-08-27 03:48:03 +0000968 IdentifierNode *Identifier =
969 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
Zachary Turnerd346cba2018-08-08 17:17:04 +0000970 if (!Error)
Zachary Turner03312862018-08-27 03:48:03 +0000971 Identifier->TemplateParams = demangleTemplateParameterList(MangledName);
Zachary Turnerd346cba2018-08-08 17:17:04 +0000972
973 std::swap(OuterContext, Backrefs);
Zachary Turner54d4ffe2018-08-01 18:32:28 +0000974 if (Error)
975 return nullptr;
Zachary Turner71c91f92018-07-30 03:12:34 +0000976
Nico Weber64041d72019-04-15 16:42:44 +0000977 if (NBB & NBB_Template) {
978 // NBB_Template is only set for types and non-leaf names ("a::" in "a::b").
Nico Weberc035c242019-04-16 14:10:34 +0000979 // Structors and conversion operators only makes sense in a leaf name, so
980 // reject them in NBB_Template contexts.
981 if (Identifier->kind() == NodeKind::ConversionOperatorIdentifier ||
982 Identifier->kind() == NodeKind::StructorIdentifier) {
Nico Weber64041d72019-04-15 16:42:44 +0000983 Error = true;
984 return nullptr;
985 }
986
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000987 memorizeIdentifier(Identifier);
Nico Weber64041d72019-04-15 16:42:44 +0000988 }
Zachary Turner71c91f92018-07-30 03:12:34 +0000989
Zachary Turner03312862018-08-27 03:48:03 +0000990 return Identifier;
Zachary Turnera7dffb12018-07-28 22:10:42 +0000991}
992
Zachary Turner03312862018-08-27 03:48:03 +0000993NamedIdentifierNode *Demangler::demangleSimpleName(StringView &MangledName,
994 bool Memorize) {
Zachary Turner931e8792018-07-30 23:02:10 +0000995 StringView S = demangleSimpleString(MangledName, Memorize);
996 if (Error)
997 return nullptr;
998
Zachary Turner03312862018-08-27 03:48:03 +0000999 NamedIdentifierNode *Name = Arena.alloc<NamedIdentifierNode>();
1000 Name->Name = S;
1001 return Name;
Zachary Turner931e8792018-07-30 23:02:10 +00001002}
1003
// A "rebased" hex digit is one of the letters 'A'..'P', standing for 0..15.
static bool isRebasedHexDigit(char C) { return !(C < 'A' || C > 'P'); }

// Converts a rebased hex digit to its numeric value ('A' -> 0 ... 'P' -> 15).
static uint8_t rebasedHexDigitToNumber(char C) {
  assert(isRebasedHexDigit(C));
  // The sixteen letters are consecutive, so the value is just the distance
  // from 'A'.
  return C - 'A';
}
1010
1011uint8_t Demangler::demangleCharLiteral(StringView &MangledName) {
Nico Webera0ac65c2019-04-18 19:52:32 +00001012 assert(!MangledName.empty());
Zachary Turner970fdc32018-08-16 16:17:36 +00001013 if (!MangledName.startsWith('?'))
1014 return MangledName.popFront();
1015
1016 MangledName = MangledName.dropFront();
1017 if (MangledName.empty())
1018 goto CharLiteralError;
1019
1020 if (MangledName.consumeFront('$')) {
1021 // Two hex digits
1022 if (MangledName.size() < 2)
1023 goto CharLiteralError;
1024 StringView Nibbles = MangledName.substr(0, 2);
1025 if (!isRebasedHexDigit(Nibbles[0]) || !isRebasedHexDigit(Nibbles[1]))
1026 goto CharLiteralError;
1027 // Don't append the null terminator.
1028 uint8_t C1 = rebasedHexDigitToNumber(Nibbles[0]);
1029 uint8_t C2 = rebasedHexDigitToNumber(Nibbles[1]);
1030 MangledName = MangledName.dropFront(2);
1031 return (C1 << 4) | C2;
1032 }
1033
1034 if (startsWithDigit(MangledName)) {
1035 const char *Lookup = ",/\\:. \n\t'-";
1036 char C = Lookup[MangledName[0] - '0'];
1037 MangledName = MangledName.dropFront();
1038 return C;
1039 }
1040
1041 if (MangledName[0] >= 'a' && MangledName[0] <= 'z') {
1042 char Lookup[26] = {'\xE1', '\xE2', '\xE3', '\xE4', '\xE5', '\xE6', '\xE7',
1043 '\xE8', '\xE9', '\xEA', '\xEB', '\xEC', '\xED', '\xEE',
1044 '\xEF', '\xF0', '\xF1', '\xF2', '\xF3', '\xF4', '\xF5',
1045 '\xF6', '\xF7', '\xF8', '\xF9', '\xFA'};
1046 char C = Lookup[MangledName[0] - 'a'];
1047 MangledName = MangledName.dropFront();
1048 return C;
1049 }
1050
1051 if (MangledName[0] >= 'A' && MangledName[0] <= 'Z') {
1052 char Lookup[26] = {'\xC1', '\xC2', '\xC3', '\xC4', '\xC5', '\xC6', '\xC7',
1053 '\xC8', '\xC9', '\xCA', '\xCB', '\xCC', '\xCD', '\xCE',
1054 '\xCF', '\xD0', '\xD1', '\xD2', '\xD3', '\xD4', '\xD5',
1055 '\xD6', '\xD7', '\xD8', '\xD9', '\xDA'};
1056 char C = Lookup[MangledName[0] - 'A'];
1057 MangledName = MangledName.dropFront();
1058 return C;
1059 }
1060
1061CharLiteralError:
1062 Error = true;
1063 return '\0';
1064}
1065
1066wchar_t Demangler::demangleWcharLiteral(StringView &MangledName) {
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001067 uint8_t C1, C2;
1068
1069 C1 = demangleCharLiteral(MangledName);
Nico Weberf5c7f3a2019-04-22 15:05:18 +00001070 if (Error || MangledName.empty())
Zachary Turner970fdc32018-08-16 16:17:36 +00001071 goto WCharLiteralError;
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001072 C2 = demangleCharLiteral(MangledName);
Zachary Turner970fdc32018-08-16 16:17:36 +00001073 if (Error)
1074 goto WCharLiteralError;
1075
1076 return ((wchar_t)C1 << 8) | (wchar_t)C2;
1077
1078WCharLiteralError:
1079 Error = true;
1080 return L'\0';
1081}
1082
// Stores the upper-case hexadecimal character for Digit (0..15) in *Buffer.
static void writeHexDigit(char *Buffer, uint8_t Digit) {
  assert(Digit <= 15);
  if (Digit < 10)
    *Buffer = '0' + Digit;
  else
    *Buffer = 'A' + Digit - 10;
}
1087
1088static void outputHex(OutputStream &OS, unsigned C) {
Nico Weberb5cd6162019-06-02 17:41:07 +00001089 assert (C != 0);
1090
Zachary Turner970fdc32018-08-16 16:17:36 +00001091 // It's easier to do the math if we can work from right to left, but we need
1092 // to print the numbers from left to right. So render this into a temporary
1093 // buffer first, then output the temporary buffer. Each byte is of the form
1094 // \xAB, which means that each byte needs 4 characters. Since there are at
1095 // most 4 bytes, we need a 4*4+1 = 17 character temporary buffer.
1096 char TempBuffer[17];
1097
1098 ::memset(TempBuffer, 0, sizeof(TempBuffer));
Nico Weber8fc99022019-04-21 16:58:25 +00001099 constexpr int MaxPos = sizeof(TempBuffer) - 1;
Zachary Turner970fdc32018-08-16 16:17:36 +00001100
Nico Weber8fc99022019-04-21 16:58:25 +00001101 int Pos = MaxPos - 1; // TempBuffer[MaxPos] is the terminating \0.
Zachary Turner970fdc32018-08-16 16:17:36 +00001102 while (C != 0) {
1103 for (int I = 0; I < 2; ++I) {
1104 writeHexDigit(&TempBuffer[Pos--], C % 16);
1105 C /= 16;
1106 }
Zachary Turner970fdc32018-08-16 16:17:36 +00001107 }
Nico Weberce67a412019-04-21 17:19:27 +00001108 TempBuffer[Pos--] = 'x';
1109 assert(Pos >= 0);
1110 TempBuffer[Pos--] = '\\';
Zachary Turner970fdc32018-08-16 16:17:36 +00001111 OS << StringView(&TempBuffer[Pos + 1]);
1112}
1113
1114static void outputEscapedChar(OutputStream &OS, unsigned C) {
1115 switch (C) {
Nico Weber8eeaf512019-04-20 23:59:06 +00001116 case '\0': // nul
1117 OS << "\\0";
1118 return;
Zachary Turner970fdc32018-08-16 16:17:36 +00001119 case '\'': // single quote
1120 OS << "\\\'";
1121 return;
1122 case '\"': // double quote
1123 OS << "\\\"";
1124 return;
1125 case '\\': // backslash
1126 OS << "\\\\";
1127 return;
1128 case '\a': // bell
1129 OS << "\\a";
1130 return;
1131 case '\b': // backspace
1132 OS << "\\b";
1133 return;
1134 case '\f': // form feed
1135 OS << "\\f";
1136 return;
1137 case '\n': // new line
1138 OS << "\\n";
1139 return;
1140 case '\r': // carriage return
1141 OS << "\\r";
1142 return;
1143 case '\t': // tab
1144 OS << "\\t";
1145 return;
1146 case '\v': // vertical tab
1147 OS << "\\v";
1148 return;
1149 default:
1150 break;
1151 }
1152
1153 if (C > 0x1F && C < 0x7F) {
1154 // Standard ascii char.
1155 OS << (char)C;
1156 return;
1157 }
1158
1159 outputHex(OS, C);
1160}
1161
// Returns how many consecutive zero bytes sit at the end of the first Length
// bytes of StringBytes. A Length of zero or less yields 0.
static unsigned countTrailingNullBytes(const uint8_t *StringBytes, int Length) {
  unsigned Count = 0;
  // Walk backwards by index rather than by pointer so that no pointer before
  // the start of the buffer is ever formed, even when Length is 0 or every
  // byte is zero.
  while (Length > 0 && StringBytes[Length - 1] == 0) {
    --Length;
    ++Count;
  }
  return Count;
}
1172
// Returns the number of zero bytes among the first Length bytes of
// StringBytes.
static unsigned countEmbeddedNulls(const uint8_t *StringBytes,
                                   unsigned Length) {
  unsigned Zeros = 0;
  const uint8_t *const End = StringBytes + Length;
  for (const uint8_t *Cur = StringBytes; Cur != End; ++Cur)
    Zeros += (*Cur == 0) ? 1u : 0u;
  return Zeros;
}
1182
Nico Weber8d05eb82019-04-24 16:09:38 +00001183// A mangled (non-wide) string literal stores the total length of the string it
1184// refers to (passed in NumBytes), and it contains up to 32 bytes of actual text
1185// (passed in StringBytes, NumChars).
Benjamin Kramerc55e9972018-10-13 22:18:22 +00001186static unsigned guessCharByteSize(const uint8_t *StringBytes, unsigned NumChars,
Nico Weber8d05eb82019-04-24 16:09:38 +00001187 uint64_t NumBytes) {
Zachary Turner970fdc32018-08-16 16:17:36 +00001188 assert(NumBytes > 0);
1189
1190 // If the number of bytes is odd, this is guaranteed to be a char string.
1191 if (NumBytes % 2 == 1)
1192 return 1;
1193
1194 // All strings can encode at most 32 bytes of data. If it's less than that,
1195 // then we encoded the entire string. In this case we check for a 1-byte,
1196 // 2-byte, or 4-byte null terminator.
1197 if (NumBytes < 32) {
1198 unsigned TrailingNulls = countTrailingNullBytes(StringBytes, NumChars);
Nico Weber8eeaf512019-04-20 23:59:06 +00001199 if (TrailingNulls >= 4 && NumBytes % 4 == 0)
Zachary Turner970fdc32018-08-16 16:17:36 +00001200 return 4;
1201 if (TrailingNulls >= 2)
1202 return 2;
1203 return 1;
1204 }
1205
1206 // The whole string was not able to be encoded. Try to look at embedded null
1207 // terminators to guess. The heuristic is that we count all embedded null
1208 // terminators. If more than 2/3 are null, it's a char32. If more than 1/3
1209 // are null, it's a char16. Otherwise it's a char8. This obviously isn't
1210 // perfect and is biased towards languages that have ascii alphabets, but this
1211 // was always going to be best effort since the encoding is lossy.
1212 unsigned Nulls = countEmbeddedNulls(StringBytes, NumChars);
Nico Weber8eeaf512019-04-20 23:59:06 +00001213 if (Nulls >= 2 * NumChars / 3 && NumBytes % 4 == 0)
Zachary Turner970fdc32018-08-16 16:17:36 +00001214 return 4;
1215 if (Nulls >= NumChars / 3)
1216 return 2;
1217 return 1;
1218}
1219
// Reads the CharIndex-th character of width CharBytes (1, 2 or 4) from
// StringBytes. The bytes of a character are combined least significant byte
// first.
static unsigned decodeMultiByteChar(const uint8_t *StringBytes,
                                    unsigned CharIndex, unsigned CharBytes) {
  assert(CharBytes == 1 || CharBytes == 2 || CharBytes == 4);
  const uint8_t *Unit = StringBytes + CharIndex * CharBytes;

  // Fold from the most significant byte down so each step is a plain
  // shift-and-or.
  unsigned Value = 0;
  for (unsigned I = CharBytes; I-- > 0;)
    Value = (Value << 8) | static_cast<unsigned>(Unit[I]);
  return Value;
}
1232
Zachary Turner03312862018-08-27 03:48:03 +00001233FunctionSymbolNode *Demangler::demangleVcallThunkNode(StringView &MangledName) {
1234 FunctionSymbolNode *FSN = Arena.alloc<FunctionSymbolNode>();
1235 VcallThunkIdentifierNode *VTIN = Arena.alloc<VcallThunkIdentifierNode>();
1236 FSN->Signature = Arena.alloc<ThunkSignatureNode>();
1237 FSN->Signature->FunctionClass = FC_NoParameterList;
1238
1239 FSN->Name = demangleNameScopeChain(MangledName, VTIN);
1240 if (!Error)
1241 Error = !MangledName.consumeFront("$B");
1242 if (!Error)
1243 VTIN->OffsetInVTable = demangleUnsigned(MangledName);
1244 if (!Error)
1245 Error = !MangledName.consumeFront('A');
1246 if (!Error)
1247 FSN->Signature->CallConvention = demangleCallingConvention(MangledName);
1248 return (Error) ? nullptr : FSN;
1249}
1250
1251EncodedStringLiteralNode *
1252Demangler::demangleStringLiteral(StringView &MangledName) {
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001253 // This function uses goto, so declare all variables up front.
Zachary Turner970fdc32018-08-16 16:17:36 +00001254 OutputStream OS;
1255 StringView CRC;
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001256 uint64_t StringByteSize;
1257 bool IsWcharT = false;
1258 bool IsNegative = false;
1259 size_t CrcEndPos = 0;
1260 char *ResultBuffer = nullptr;
1261
Zachary Turner03312862018-08-27 03:48:03 +00001262 EncodedStringLiteralNode *Result = Arena.alloc<EncodedStringLiteralNode>();
Zachary Turner970fdc32018-08-16 16:17:36 +00001263
Nico Webere145a542019-04-19 14:13:11 +00001264 // Must happen before the first `goto StringLiteralError`.
1265 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
1266 // FIXME: Propagate out-of-memory as an error?
1267 std::terminate();
1268
Zachary Turner970fdc32018-08-16 16:17:36 +00001269 // Prefix indicating the beginning of a string literal
Zachary Turner3461bfa2018-08-17 16:14:05 +00001270 if (!MangledName.consumeFront("@_"))
1271 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001272 if (MangledName.empty())
1273 goto StringLiteralError;
1274
1275 // Char Type (regular or wchar_t)
Zachary Turner970fdc32018-08-16 16:17:36 +00001276 switch (MangledName.popFront()) {
1277 case '1':
1278 IsWcharT = true;
Erik Pilkington5094e5e2019-01-17 20:37:51 +00001279 DEMANGLE_FALLTHROUGH;
Zachary Turner970fdc32018-08-16 16:17:36 +00001280 case '0':
1281 break;
1282 default:
1283 goto StringLiteralError;
1284 }
1285
1286 // Encoded Length
Zachary Turner970fdc32018-08-16 16:17:36 +00001287 std::tie(StringByteSize, IsNegative) = demangleNumber(MangledName);
Nico Webera0ac65c2019-04-18 19:52:32 +00001288 if (Error || IsNegative || StringByteSize < (IsWcharT ? 2 : 1))
Zachary Turner970fdc32018-08-16 16:17:36 +00001289 goto StringLiteralError;
1290
1291 // CRC 32 (always 8 characters plus a terminator)
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001292 CrcEndPos = MangledName.find('@');
Zachary Turner970fdc32018-08-16 16:17:36 +00001293 if (CrcEndPos == StringView::npos)
1294 goto StringLiteralError;
1295 CRC = MangledName.substr(0, CrcEndPos);
1296 MangledName = MangledName.dropFront(CrcEndPos + 1);
1297 if (MangledName.empty())
1298 goto StringLiteralError;
1299
Zachary Turner970fdc32018-08-16 16:17:36 +00001300 if (IsWcharT) {
Zachary Turner03312862018-08-27 03:48:03 +00001301 Result->Char = CharKind::Wchar;
Zachary Turner970fdc32018-08-16 16:17:36 +00001302 if (StringByteSize > 64)
Zachary Turner3461bfa2018-08-17 16:14:05 +00001303 Result->IsTruncated = true;
Zachary Turner970fdc32018-08-16 16:17:36 +00001304
1305 while (!MangledName.consumeFront('@')) {
Nico Webera0ac65c2019-04-18 19:52:32 +00001306 if (MangledName.size() < 2)
Nico Weber502cf4b2019-04-18 19:30:21 +00001307 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001308 wchar_t W = demangleWcharLiteral(MangledName);
Zachary Turner3461bfa2018-08-17 16:14:05 +00001309 if (StringByteSize != 2 || Result->IsTruncated)
Zachary Turner970fdc32018-08-16 16:17:36 +00001310 outputEscapedChar(OS, W);
1311 StringByteSize -= 2;
1312 if (Error)
1313 goto StringLiteralError;
1314 }
1315 } else {
Zachary Turner32a8a202018-08-29 23:56:09 +00001316 // The max byte length is actually 32, but some compilers mangled strings
1317 // incorrectly, so we have to assume it can go higher.
1318 constexpr unsigned MaxStringByteLength = 32 * 4;
Zachary Turner970fdc32018-08-16 16:17:36 +00001319 uint8_t StringBytes[MaxStringByteLength];
1320
1321 unsigned BytesDecoded = 0;
1322 while (!MangledName.consumeFront('@')) {
Nico Weberaa162682019-04-21 14:25:07 +00001323 if (MangledName.size() < 1 || BytesDecoded >= MaxStringByteLength)
Nico Weber502cf4b2019-04-18 19:30:21 +00001324 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001325 StringBytes[BytesDecoded++] = demangleCharLiteral(MangledName);
1326 }
1327
Zachary Turner32a8a202018-08-29 23:56:09 +00001328 if (StringByteSize > BytesDecoded)
1329 Result->IsTruncated = true;
1330
Zachary Turner970fdc32018-08-16 16:17:36 +00001331 unsigned CharBytes =
1332 guessCharByteSize(StringBytes, BytesDecoded, StringByteSize);
1333 assert(StringByteSize % CharBytes == 0);
1334 switch (CharBytes) {
1335 case 1:
Zachary Turner03312862018-08-27 03:48:03 +00001336 Result->Char = CharKind::Char;
Zachary Turner970fdc32018-08-16 16:17:36 +00001337 break;
1338 case 2:
Zachary Turner03312862018-08-27 03:48:03 +00001339 Result->Char = CharKind::Char16;
Zachary Turner970fdc32018-08-16 16:17:36 +00001340 break;
1341 case 4:
Zachary Turner03312862018-08-27 03:48:03 +00001342 Result->Char = CharKind::Char32;
Zachary Turner970fdc32018-08-16 16:17:36 +00001343 break;
1344 default:
Erik Pilkington5094e5e2019-01-17 20:37:51 +00001345 DEMANGLE_UNREACHABLE;
Zachary Turner970fdc32018-08-16 16:17:36 +00001346 }
1347 const unsigned NumChars = BytesDecoded / CharBytes;
1348 for (unsigned CharIndex = 0; CharIndex < NumChars; ++CharIndex) {
1349 unsigned NextChar =
1350 decodeMultiByteChar(StringBytes, CharIndex, CharBytes);
Zachary Turner3461bfa2018-08-17 16:14:05 +00001351 if (CharIndex + 1 < NumChars || Result->IsTruncated)
Zachary Turner970fdc32018-08-16 16:17:36 +00001352 outputEscapedChar(OS, NextChar);
1353 }
1354 }
1355
1356 OS << '\0';
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001357 ResultBuffer = OS.getBuffer();
Zachary Turner03312862018-08-27 03:48:03 +00001358 Result->DecodedString = copyString(ResultBuffer);
Zachary Turneraf738f72018-08-16 17:48:32 +00001359 std::free(ResultBuffer);
Zachary Turner970fdc32018-08-16 16:17:36 +00001360 return Result;
1361
1362StringLiteralError:
1363 Error = true;
Nico Webere145a542019-04-19 14:13:11 +00001364 std::free(OS.getBuffer());
Zachary Turner970fdc32018-08-16 16:17:36 +00001365 return nullptr;
1366}
1367
Nico Weberc7444dd2019-04-03 23:15:56 +00001368// Returns MangledName's prefix before the first '@', or an error if
1369// MangledName contains no '@' or the prefix has length 0.
Zachary Turner931e8792018-07-30 23:02:10 +00001370StringView Demangler::demangleSimpleString(StringView &MangledName,
1371 bool Memorize) {
1372 StringView S;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001373 for (size_t i = 0; i < MangledName.size(); ++i) {
1374 if (MangledName[i] != '@')
1375 continue;
Nico Weberc7444dd2019-04-03 23:15:56 +00001376 if (i == 0)
1377 break;
Zachary Turner931e8792018-07-30 23:02:10 +00001378 S = MangledName.substr(0, i);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001379 MangledName = MangledName.dropFront(i + 1);
1380
1381 if (Memorize)
Zachary Turner931e8792018-07-30 23:02:10 +00001382 memorizeString(S);
1383 return S;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001384 }
1385
1386 Error = true;
Zachary Turner931e8792018-07-30 23:02:10 +00001387 return {};
Zachary Turnera7dffb12018-07-28 22:10:42 +00001388}
1389
Zachary Turner03312862018-08-27 03:48:03 +00001390NamedIdentifierNode *
1391Demangler::demangleAnonymousNamespaceName(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001392 assert(MangledName.startsWith("?A"));
1393 MangledName.consumeFront("?A");
1394
Zachary Turner03312862018-08-27 03:48:03 +00001395 NamedIdentifierNode *Node = Arena.alloc<NamedIdentifierNode>();
1396 Node->Name = "`anonymous namespace'";
Zachary Turner91c98a82018-08-20 23:58:35 +00001397 size_t EndPos = MangledName.find('@');
1398 if (EndPos == StringView::npos) {
1399 Error = true;
1400 return nullptr;
1401 }
Zachary Turner0002dd42018-08-20 23:58:58 +00001402 StringView NamespaceKey = MangledName.substr(0, EndPos);
1403 memorizeString(NamespaceKey);
Zachary Turner91c98a82018-08-20 23:58:35 +00001404 MangledName = MangledName.substr(EndPos + 1);
1405 return Node;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001406}
1407
Zachary Turner03312862018-08-27 03:48:03 +00001408NamedIdentifierNode *
1409Demangler::demangleLocallyScopedNamePiece(StringView &MangledName) {
Zachary Turner71c91f92018-07-30 03:12:34 +00001410 assert(startsWithLocalScopePattern(MangledName));
1411
Zachary Turner03312862018-08-27 03:48:03 +00001412 NamedIdentifierNode *Identifier = Arena.alloc<NamedIdentifierNode>();
Zachary Turner71c91f92018-07-30 03:12:34 +00001413 MangledName.consumeFront('?');
Nico Weberc5615c22019-04-03 23:29:05 +00001414 uint64_t Number = 0;
1415 bool IsNegative = false;
1416 std::tie(Number, IsNegative) = demangleNumber(MangledName);
1417 assert(!IsNegative);
Zachary Turner71c91f92018-07-30 03:12:34 +00001418
1419 // One ? to terminate the number
1420 MangledName.consumeFront('?');
1421
1422 assert(!Error);
Zachary Turner03312862018-08-27 03:48:03 +00001423 Node *Scope = parse(MangledName);
Zachary Turner71c91f92018-07-30 03:12:34 +00001424 if (Error)
1425 return nullptr;
1426
1427 // Render the parent symbol's name into a buffer.
Nico Weber1359d652018-09-15 18:24:20 +00001428 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +00001429 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00001430 // FIXME: Propagate out-of-memory as an error?
1431 std::terminate();
Zachary Turner71c91f92018-07-30 03:12:34 +00001432 OS << '`';
Zachary Turner38d2edd2018-08-29 03:59:17 +00001433 Scope->output(OS, OF_Default);
Zachary Turner71c91f92018-07-30 03:12:34 +00001434 OS << '\'';
Nico Weberc5615c22019-04-03 23:29:05 +00001435 OS << "::`" << Number << "'";
Zachary Turner71c91f92018-07-30 03:12:34 +00001436 OS << '\0';
1437 char *Result = OS.getBuffer();
Zachary Turner03312862018-08-27 03:48:03 +00001438 Identifier->Name = copyString(Result);
Zachary Turner71c91f92018-07-30 03:12:34 +00001439 std::free(Result);
Zachary Turner03312862018-08-27 03:48:03 +00001440 return Identifier;
Zachary Turner71c91f92018-07-30 03:12:34 +00001441}
1442
Zachary Turnera7dffb12018-07-28 22:10:42 +00001443// Parses a type name in the form of A@B@C@@ which represents C::B::A.
Zachary Turner03312862018-08-27 03:48:03 +00001444QualifiedNameNode *
1445Demangler::demangleFullyQualifiedTypeName(StringView &MangledName) {
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001446 IdentifierNode *Identifier =
1447 demangleUnqualifiedTypeName(MangledName, /*Memorize=*/true);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001448 if (Error)
1449 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001450 assert(Identifier);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001451
Zachary Turner03312862018-08-27 03:48:03 +00001452 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001453 if (Error)
1454 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001455 assert(QN);
1456 return QN;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001457}
1458
1459// Parses a symbol name in the form of A@B@C@@ which represents C::B::A.
1460// Symbol names have slightly different rules regarding what can appear
1461// so we separate out the implementations for flexibility.
Zachary Turner03312862018-08-27 03:48:03 +00001462QualifiedNameNode *
1463Demangler::demangleFullyQualifiedSymbolName(StringView &MangledName) {
Zachary Turner58d29cf2018-08-08 00:43:31 +00001464 // This is the final component of a symbol name (i.e. the leftmost component
1465 // of a mangled name. Since the only possible template instantiation that
1466 // can appear in this context is a function template, and since those are
1467 // not saved for the purposes of name backreferences, only backref simple
1468 // names.
Zachary Turner03312862018-08-27 03:48:03 +00001469 IdentifierNode *Identifier =
1470 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001471 if (Error)
1472 return nullptr;
Zachary Turner3461bfa2018-08-17 16:14:05 +00001473
Zachary Turner03312862018-08-27 03:48:03 +00001474 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001475 if (Error)
1476 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001477
1478 if (Identifier->kind() == NodeKind::StructorIdentifier) {
Nico Webera9886f82019-04-03 23:23:32 +00001479 if (QN->Components->Count < 2) {
1480 Error = true;
1481 return nullptr;
1482 }
Zachary Turner03312862018-08-27 03:48:03 +00001483 StructorIdentifierNode *SIN =
1484 static_cast<StructorIdentifierNode *>(Identifier);
Zachary Turner03312862018-08-27 03:48:03 +00001485 Node *ClassNode = QN->Components->Nodes[QN->Components->Count - 2];
1486 SIN->Class = static_cast<IdentifierNode *>(ClassNode);
1487 }
1488 assert(QN);
1489 return QN;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001490}
1491
Zachary Turner03312862018-08-27 03:48:03 +00001492IdentifierNode *Demangler::demangleUnqualifiedTypeName(StringView &MangledName,
1493 bool Memorize) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001494 // An inner-most name can be a back-reference, because a fully-qualified name
1495 // (e.g. Scope + Inner) can contain other fully qualified names inside of
1496 // them (for example template parameters), and these nested parameters can
1497 // refer to previously mangled types.
1498 if (startsWithDigit(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001499 return demangleBackRefName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001500
1501 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001502 return demangleTemplateInstantiationName(MangledName, NBB_Template);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001503
Zachary Turner44ebbc22018-08-01 18:32:47 +00001504 return demangleSimpleName(MangledName, Memorize);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001505}
1506
Zachary Turner03312862018-08-27 03:48:03 +00001507IdentifierNode *
1508Demangler::demangleUnqualifiedSymbolName(StringView &MangledName,
1509 NameBackrefBehavior NBB) {
Zachary Turner71c91f92018-07-30 03:12:34 +00001510 if (startsWithDigit(MangledName))
1511 return demangleBackRefName(MangledName);
1512 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001513 return demangleTemplateInstantiationName(MangledName, NBB);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001514 if (MangledName.startsWith('?'))
Zachary Turner03312862018-08-27 03:48:03 +00001515 return demangleFunctionIdentifierCode(MangledName);
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001516 return demangleSimpleName(MangledName, /*Memorize=*/(NBB & NBB_Simple) != 0);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001517}
1518
Zachary Turner03312862018-08-27 03:48:03 +00001519IdentifierNode *Demangler::demangleNameScopePiece(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001520 if (startsWithDigit(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001521 return demangleBackRefName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001522
1523 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001524 return demangleTemplateInstantiationName(MangledName, NBB_Template);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001525
1526 if (MangledName.startsWith("?A"))
Zachary Turner316109b2018-07-29 16:38:02 +00001527 return demangleAnonymousNamespaceName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001528
Zachary Turner71c91f92018-07-30 03:12:34 +00001529 if (startsWithLocalScopePattern(MangledName))
1530 return demangleLocallyScopedNamePiece(MangledName);
1531
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001532 return demangleSimpleName(MangledName, /*Memorize=*/true);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001533}
1534
Zachary Turner03312862018-08-27 03:48:03 +00001535static NodeArrayNode *nodeListToNodeArray(ArenaAllocator &Arena, NodeList *Head,
1536 size_t Count) {
1537 NodeArrayNode *N = Arena.alloc<NodeArrayNode>();
1538 N->Count = Count;
1539 N->Nodes = Arena.allocArray<Node *>(Count);
1540 for (size_t I = 0; I < Count; ++I) {
1541 N->Nodes[I] = Head->N;
1542 Head = Head->Next;
1543 }
1544 return N;
1545}
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001546
Zachary Turner03312862018-08-27 03:48:03 +00001547QualifiedNameNode *
1548Demangler::demangleNameScopeChain(StringView &MangledName,
1549 IdentifierNode *UnqualifiedName) {
1550 NodeList *Head = Arena.alloc<NodeList>();
1551
1552 Head->N = UnqualifiedName;
1553
1554 size_t Count = 1;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001555 while (!MangledName.consumeFront("@")) {
Zachary Turner03312862018-08-27 03:48:03 +00001556 ++Count;
1557 NodeList *NewHead = Arena.alloc<NodeList>();
1558 NewHead->Next = Head;
1559 Head = NewHead;
1560
Zachary Turnera7dffb12018-07-28 22:10:42 +00001561 if (MangledName.empty()) {
1562 Error = true;
1563 return nullptr;
1564 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001565
1566 assert(!Error);
Zachary Turner03312862018-08-27 03:48:03 +00001567 IdentifierNode *Elem = demangleNameScopePiece(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001568 if (Error)
1569 return nullptr;
1570
Zachary Turner03312862018-08-27 03:48:03 +00001571 Head->N = Elem;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001572 }
Zachary Turner03312862018-08-27 03:48:03 +00001573
1574 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
1575 QN->Components = nodeListToNodeArray(Arena, Head, Count);
1576 return QN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001577}
1578
Zachary Turner316109b2018-07-29 16:38:02 +00001579FuncClass Demangler::demangleFunctionClass(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001580 switch (MangledName.popFront()) {
Zachary Turner29ec67b2018-08-10 21:09:05 +00001581 case '9':
Zachary Turner03312862018-08-27 03:48:03 +00001582 return FuncClass(FC_ExternC | FC_NoParameterList);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001583 case 'A':
Zachary Turner03312862018-08-27 03:48:03 +00001584 return FC_Private;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001585 case 'B':
Zachary Turner03312862018-08-27 03:48:03 +00001586 return FuncClass(FC_Private | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001587 case 'C':
Zachary Turner03312862018-08-27 03:48:03 +00001588 return FuncClass(FC_Private | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001589 case 'D':
Zachary Turner03312862018-08-27 03:48:03 +00001590 return FuncClass(FC_Private | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001591 case 'E':
Zachary Turner03312862018-08-27 03:48:03 +00001592 return FuncClass(FC_Private | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001593 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00001594 return FuncClass(FC_Private | FC_Virtual);
Zachary Turner32a8a202018-08-29 23:56:09 +00001595 case 'G':
1596 return FuncClass(FC_Private | FC_StaticThisAdjust);
1597 case 'H':
1598 return FuncClass(FC_Private | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001599 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00001600 return FuncClass(FC_Protected);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001601 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001602 return FuncClass(FC_Protected | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001603 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001604 return FuncClass(FC_Protected | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001605 case 'L':
Zachary Turner03312862018-08-27 03:48:03 +00001606 return FuncClass(FC_Protected | FC_Static | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001607 case 'M':
Zachary Turner03312862018-08-27 03:48:03 +00001608 return FuncClass(FC_Protected | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001609 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001610 return FuncClass(FC_Protected | FC_Virtual | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001611 case 'O':
Zachary Turner03312862018-08-27 03:48:03 +00001612 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust);
Zachary Turner469f0762018-08-17 21:18:05 +00001613 case 'P':
Zachary Turner03312862018-08-27 03:48:03 +00001614 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001615 case 'Q':
Zachary Turner03312862018-08-27 03:48:03 +00001616 return FuncClass(FC_Public);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001617 case 'R':
Zachary Turner03312862018-08-27 03:48:03 +00001618 return FuncClass(FC_Public | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001619 case 'S':
Zachary Turner03312862018-08-27 03:48:03 +00001620 return FuncClass(FC_Public | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001621 case 'T':
Zachary Turner03312862018-08-27 03:48:03 +00001622 return FuncClass(FC_Public | FC_Static | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001623 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001624 return FuncClass(FC_Public | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001625 case 'V':
Zachary Turner03312862018-08-27 03:48:03 +00001626 return FuncClass(FC_Public | FC_Virtual | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001627 case 'W':
Zachary Turner03312862018-08-27 03:48:03 +00001628 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust);
Zachary Turner469f0762018-08-17 21:18:05 +00001629 case 'X':
Zachary Turner03312862018-08-27 03:48:03 +00001630 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001631 case 'Y':
Zachary Turner03312862018-08-27 03:48:03 +00001632 return FuncClass(FC_Global);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001633 case 'Z':
Zachary Turner03312862018-08-27 03:48:03 +00001634 return FuncClass(FC_Global | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001635 case '$': {
Zachary Turner03312862018-08-27 03:48:03 +00001636 FuncClass VFlag = FC_VirtualThisAdjust;
Zachary Turner469f0762018-08-17 21:18:05 +00001637 if (MangledName.consumeFront('R'))
Zachary Turner03312862018-08-27 03:48:03 +00001638 VFlag = FuncClass(VFlag | FC_VirtualThisAdjustEx);
Nico Weberb4f33bb2019-04-11 22:47:18 +00001639 if (MangledName.empty())
1640 break;
Zachary Turner469f0762018-08-17 21:18:05 +00001641 switch (MangledName.popFront()) {
1642 case '0':
Zachary Turner03312862018-08-27 03:48:03 +00001643 return FuncClass(FC_Private | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001644 case '1':
Zachary Turner03312862018-08-27 03:48:03 +00001645 return FuncClass(FC_Private | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001646 case '2':
Zachary Turner03312862018-08-27 03:48:03 +00001647 return FuncClass(FC_Protected | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001648 case '3':
Zachary Turner03312862018-08-27 03:48:03 +00001649 return FuncClass(FC_Protected | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001650 case '4':
Zachary Turner03312862018-08-27 03:48:03 +00001651 return FuncClass(FC_Public | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001652 case '5':
Zachary Turner03312862018-08-27 03:48:03 +00001653 return FuncClass(FC_Public | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001654 }
1655 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001656 }
1657
1658 Error = true;
Zachary Turner03312862018-08-27 03:48:03 +00001659 return FC_Public;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001660}
1661
Zachary Turner316109b2018-07-29 16:38:02 +00001662CallingConv Demangler::demangleCallingConvention(StringView &MangledName) {
Nico Weber63b97d22019-04-08 19:46:53 +00001663 if (MangledName.empty()) {
1664 Error = true;
1665 return CallingConv::None;
1666 }
1667
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001668 switch (MangledName.popFront()) {
1669 case 'A':
1670 case 'B':
1671 return CallingConv::Cdecl;
1672 case 'C':
1673 case 'D':
1674 return CallingConv::Pascal;
1675 case 'E':
1676 case 'F':
1677 return CallingConv::Thiscall;
1678 case 'G':
1679 case 'H':
1680 return CallingConv::Stdcall;
1681 case 'I':
1682 case 'J':
1683 return CallingConv::Fastcall;
1684 case 'M':
1685 case 'N':
1686 return CallingConv::Clrcall;
1687 case 'O':
1688 case 'P':
1689 return CallingConv::Eabi;
1690 case 'Q':
1691 return CallingConv::Vectorcall;
1692 }
1693
1694 return CallingConv::None;
Martin Storsjo0f2abd82018-07-20 18:43:42 +00001695}
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001696
Zachary Turner316109b2018-07-29 16:38:02 +00001697StorageClass Demangler::demangleVariableStorageClass(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001698 assert(std::isdigit(MangledName.front()));
1699
1700 switch (MangledName.popFront()) {
1701 case '0':
1702 return StorageClass::PrivateStatic;
1703 case '1':
1704 return StorageClass::ProtectedStatic;
1705 case '2':
1706 return StorageClass::PublicStatic;
1707 case '3':
1708 return StorageClass::Global;
1709 case '4':
1710 return StorageClass::FunctionLocalStatic;
1711 }
1712 Error = true;
1713 return StorageClass::None;
1714}
1715
Zachary Turner316109b2018-07-29 16:38:02 +00001716std::pair<Qualifiers, bool>
1717Demangler::demangleQualifiers(StringView &MangledName) {
Nico Weber63b97d22019-04-08 19:46:53 +00001718 if (MangledName.empty()) {
1719 Error = true;
1720 return std::make_pair(Q_None, false);
1721 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001722
1723 switch (MangledName.popFront()) {
Zachary Turnerd742d642018-07-26 19:56:09 +00001724 // Member qualifiers
1725 case 'Q':
1726 return std::make_pair(Q_None, true);
1727 case 'R':
1728 return std::make_pair(Q_Const, true);
1729 case 'S':
1730 return std::make_pair(Q_Volatile, true);
1731 case 'T':
1732 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), true);
1733 // Non-Member qualifiers
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001734 case 'A':
Zachary Turnerd742d642018-07-26 19:56:09 +00001735 return std::make_pair(Q_None, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001736 case 'B':
Zachary Turnerd742d642018-07-26 19:56:09 +00001737 return std::make_pair(Q_Const, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001738 case 'C':
Zachary Turnerd742d642018-07-26 19:56:09 +00001739 return std::make_pair(Q_Volatile, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001740 case 'D':
Zachary Turnerd742d642018-07-26 19:56:09 +00001741 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001742 }
1743 Error = true;
Zachary Turnerd742d642018-07-26 19:56:09 +00001744 return std::make_pair(Q_None, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001745}
1746
1747// <variable-type> ::= <type> <cvr-qualifiers>
1748// ::= <type> <pointee-cvr-qualifiers> # pointers, references
Zachary Turner03312862018-08-27 03:48:03 +00001749TypeNode *Demangler::demangleType(StringView &MangledName,
1750 QualifierMangleMode QMM) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001751 Qualifiers Quals = Q_None;
Zachary Turnerd742d642018-07-26 19:56:09 +00001752 bool IsMember = false;
Zachary Turnerd742d642018-07-26 19:56:09 +00001753 if (QMM == QualifierMangleMode::Mangle) {
Zachary Turner316109b2018-07-29 16:38:02 +00001754 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00001755 } else if (QMM == QualifierMangleMode::Result) {
Zachary Turnerdf4cd7c2018-08-21 21:23:49 +00001756 if (MangledName.consumeFront('?'))
Zachary Turner316109b2018-07-29 16:38:02 +00001757 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001758 }
1759
Nico Weber63b97d22019-04-08 19:46:53 +00001760 if (MangledName.empty()) {
1761 Error = true;
1762 return nullptr;
1763 }
1764
Zachary Turner03312862018-08-27 03:48:03 +00001765 TypeNode *Ty = nullptr;
Zachary Turner931e8792018-07-30 23:02:10 +00001766 if (isTagType(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001767 Ty = demangleClassType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001768 else if (isPointerType(MangledName)) {
Zachary Turner8fb9a712018-12-14 18:10:13 +00001769 if (isMemberPointer(MangledName, Error))
Zachary Turner316109b2018-07-29 16:38:02 +00001770 Ty = demangleMemberPointerType(MangledName);
Zachary Turner8fb9a712018-12-14 18:10:13 +00001771 else if (!Error)
Zachary Turner316109b2018-07-29 16:38:02 +00001772 Ty = demanglePointerType(MangledName);
Zachary Turner8fb9a712018-12-14 18:10:13 +00001773 else
1774 return nullptr;
Zachary Turner931e8792018-07-30 23:02:10 +00001775 } else if (isArrayType(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001776 Ty = demangleArrayType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001777 else if (isFunctionType(MangledName)) {
1778 if (MangledName.consumeFront("$$A8@@"))
Zachary Turner03312862018-08-27 03:48:03 +00001779 Ty = demangleFunctionType(MangledName, true);
Zachary Turner931e8792018-07-30 23:02:10 +00001780 else {
1781 assert(MangledName.startsWith("$$A6"));
1782 MangledName.consumeFront("$$A6");
Zachary Turner03312862018-08-27 03:48:03 +00001783 Ty = demangleFunctionType(MangledName, false);
Zachary Turner931e8792018-07-30 23:02:10 +00001784 }
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001785 } else if (isCustomType(MangledName)) {
1786 Ty = demangleCustomType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001787 } else {
Zachary Turner03312862018-08-27 03:48:03 +00001788 Ty = demanglePrimitiveType(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001789 }
Zachary Turner931e8792018-07-30 23:02:10 +00001790
Zachary Turner2cd32862018-12-14 17:43:56 +00001791 if (!Ty || Error)
1792 return Ty;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001793 Ty->Quals = Qualifiers(Ty->Quals | Quals);
1794 return Ty;
1795}
1796
Zachary Turner2fe49002019-01-08 21:05:51 +00001797bool Demangler::demangleThrowSpecification(StringView &MangledName) {
1798 if (MangledName.consumeFront("_E"))
1799 return true;
Zachary Turner38b78a72018-07-26 20:20:10 +00001800 if (MangledName.consumeFront('Z'))
Zachary Turner2fe49002019-01-08 21:05:51 +00001801 return false;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001802
Zachary Turner38b78a72018-07-26 20:20:10 +00001803 Error = true;
Zachary Turner2fe49002019-01-08 21:05:51 +00001804 return false;
Zachary Turner38b78a72018-07-26 20:20:10 +00001805}
1806
Zachary Turner03312862018-08-27 03:48:03 +00001807FunctionSignatureNode *Demangler::demangleFunctionType(StringView &MangledName,
1808 bool HasThisQuals) {
1809 FunctionSignatureNode *FTy = Arena.alloc<FunctionSignatureNode>();
Zachary Turner38b78a72018-07-26 20:20:10 +00001810
1811 if (HasThisQuals) {
Zachary Turner316109b2018-07-29 16:38:02 +00001812 FTy->Quals = demanglePointerExtQualifiers(MangledName);
Zachary Turner03312862018-08-27 03:48:03 +00001813 FTy->RefQualifier = demangleFunctionRefQualifier(MangledName);
Zachary Turner316109b2018-07-29 16:38:02 +00001814 FTy->Quals = Qualifiers(FTy->Quals | demangleQualifiers(MangledName).first);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001815 }
1816
1817 // Fields that appear on both member and non-member functions.
Zachary Turner316109b2018-07-29 16:38:02 +00001818 FTy->CallConvention = demangleCallingConvention(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001819
1820 // <return-type> ::= <type>
1821 // ::= @ # structors (they have no declared return type)
1822 bool IsStructor = MangledName.consumeFront('@');
1823 if (!IsStructor)
Zachary Turner316109b2018-07-29 16:38:02 +00001824 FTy->ReturnType = demangleType(MangledName, QualifierMangleMode::Result);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001825
Zachary Turner316109b2018-07-29 16:38:02 +00001826 FTy->Params = demangleFunctionParameterList(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001827
Zachary Turner2fe49002019-01-08 21:05:51 +00001828 FTy->IsNoexcept = demangleThrowSpecification(MangledName);
Zachary Turner38b78a72018-07-26 20:20:10 +00001829
1830 return FTy;
1831}
1832
Zachary Turner03312862018-08-27 03:48:03 +00001833FunctionSymbolNode *
1834Demangler::demangleFunctionEncoding(StringView &MangledName) {
1835 FuncClass ExtraFlags = FC_None;
Zachary Turner469f0762018-08-17 21:18:05 +00001836 if (MangledName.consumeFront("$$J0"))
Zachary Turner03312862018-08-27 03:48:03 +00001837 ExtraFlags = FC_ExternC;
Zachary Turner469f0762018-08-17 21:18:05 +00001838
Nico Weber63b97d22019-04-08 19:46:53 +00001839 if (MangledName.empty()) {
1840 Error = true;
1841 return nullptr;
1842 }
1843
Zachary Turner316109b2018-07-29 16:38:02 +00001844 FuncClass FC = demangleFunctionClass(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001845 FC = FuncClass(ExtraFlags | FC);
1846
Zachary Turner03312862018-08-27 03:48:03 +00001847 FunctionSignatureNode *FSN = nullptr;
1848 ThunkSignatureNode *TTN = nullptr;
1849 if (FC & FC_StaticThisAdjust) {
1850 TTN = Arena.alloc<ThunkSignatureNode>();
1851 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
1852 } else if (FC & FC_VirtualThisAdjust) {
1853 TTN = Arena.alloc<ThunkSignatureNode>();
1854 if (FC & FC_VirtualThisAdjustEx) {
1855 TTN->ThisAdjust.VBPtrOffset = demangleSigned(MangledName);
1856 TTN->ThisAdjust.VBOffsetOffset = demangleSigned(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001857 }
Zachary Turner03312862018-08-27 03:48:03 +00001858 TTN->ThisAdjust.VtordispOffset = demangleSigned(MangledName);
1859 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001860 }
1861
Zachary Turner03312862018-08-27 03:48:03 +00001862 if (FC & FC_NoParameterList) {
Zachary Turner29ec67b2018-08-10 21:09:05 +00001863 // This is an extern "C" function whose full signature hasn't been mangled.
1864 // This happens when we need to mangle a local symbol inside of an extern
1865 // "C" function.
Zachary Turner03312862018-08-27 03:48:03 +00001866 FSN = Arena.alloc<FunctionSignatureNode>();
Zachary Turner29ec67b2018-08-10 21:09:05 +00001867 } else {
Zachary Turner03312862018-08-27 03:48:03 +00001868 bool HasThisQuals = !(FC & (FC_Global | FC_Static));
1869 FSN = demangleFunctionType(MangledName, HasThisQuals);
Zachary Turner29ec67b2018-08-10 21:09:05 +00001870 }
Nico Weber63b97d22019-04-08 19:46:53 +00001871
1872 if (Error)
1873 return nullptr;
1874
Zachary Turner03312862018-08-27 03:48:03 +00001875 if (TTN) {
1876 *static_cast<FunctionSignatureNode *>(TTN) = *FSN;
1877 FSN = TTN;
1878 }
1879 FSN->FunctionClass = FC;
Zachary Turner38b78a72018-07-26 20:20:10 +00001880
Zachary Turner03312862018-08-27 03:48:03 +00001881 FunctionSymbolNode *Symbol = Arena.alloc<FunctionSymbolNode>();
1882 Symbol->Signature = FSN;
1883 return Symbol;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001884}
1885
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001886CustomTypeNode *Demangler::demangleCustomType(StringView &MangledName) {
1887 assert(MangledName.startsWith('?'));
1888 MangledName.popFront();
1889
1890 CustomTypeNode *CTN = Arena.alloc<CustomTypeNode>();
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001891 CTN->Identifier = demangleUnqualifiedTypeName(MangledName, /*Memorize=*/true);
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001892 if (!MangledName.consumeFront('@'))
1893 Error = true;
1894 if (Error)
1895 return nullptr;
1896 return CTN;
1897}
1898
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001899// Reads a primitive type.
Zachary Turner03312862018-08-27 03:48:03 +00001900PrimitiveTypeNode *Demangler::demanglePrimitiveType(StringView &MangledName) {
1901 if (MangledName.consumeFront("$$T"))
1902 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Nullptr);
Zachary Turner931e8792018-07-30 23:02:10 +00001903
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001904 switch (MangledName.popFront()) {
1905 case 'X':
Zachary Turner03312862018-08-27 03:48:03 +00001906 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Void);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001907 case 'D':
Zachary Turner03312862018-08-27 03:48:03 +00001908 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001909 case 'C':
Zachary Turner03312862018-08-27 03:48:03 +00001910 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Schar);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001911 case 'E':
Zachary Turner03312862018-08-27 03:48:03 +00001912 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uchar);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001913 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00001914 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Short);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001915 case 'G':
Zachary Turner03312862018-08-27 03:48:03 +00001916 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ushort);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001917 case 'H':
Zachary Turner03312862018-08-27 03:48:03 +00001918 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001919 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00001920 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001921 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001922 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Long);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001923 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001924 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ulong);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001925 case 'M':
Zachary Turner03312862018-08-27 03:48:03 +00001926 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Float);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001927 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001928 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Double);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001929 case 'O':
Zachary Turner03312862018-08-27 03:48:03 +00001930 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ldouble);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001931 case '_': {
Zachary Turner91ecedd2018-07-20 18:07:33 +00001932 if (MangledName.empty()) {
1933 Error = true;
1934 return nullptr;
1935 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001936 switch (MangledName.popFront()) {
1937 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001938 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Bool);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001939 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001940 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int64);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001941 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001942 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint64);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001943 case 'W':
Zachary Turner03312862018-08-27 03:48:03 +00001944 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Wchar);
Nico Webera2ca6e72019-05-28 15:30:04 +00001945 case 'Q':
1946 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char8);
Zachary Turner931e8792018-07-30 23:02:10 +00001947 case 'S':
Zachary Turner03312862018-08-27 03:48:03 +00001948 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char16);
Zachary Turner931e8792018-07-30 23:02:10 +00001949 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001950 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char32);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001951 }
1952 break;
1953 }
1954 }
Zachary Turner03312862018-08-27 03:48:03 +00001955 Error = true;
1956 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001957}
1958
Zachary Turner03312862018-08-27 03:48:03 +00001959TagTypeNode *Demangler::demangleClassType(StringView &MangledName) {
1960 TagTypeNode *TT = nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001961
1962 switch (MangledName.popFront()) {
1963 case 'T':
Zachary Turner03312862018-08-27 03:48:03 +00001964 TT = Arena.alloc<TagTypeNode>(TagKind::Union);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001965 break;
1966 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001967 TT = Arena.alloc<TagTypeNode>(TagKind::Struct);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001968 break;
1969 case 'V':
Zachary Turner03312862018-08-27 03:48:03 +00001970 TT = Arena.alloc<TagTypeNode>(TagKind::Class);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001971 break;
1972 case 'W':
Nico Webere5b62652019-04-11 22:59:25 +00001973 if (!MangledName.consumeFront('4')) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001974 Error = true;
1975 return nullptr;
1976 }
Zachary Turner03312862018-08-27 03:48:03 +00001977 TT = Arena.alloc<TagTypeNode>(TagKind::Enum);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001978 break;
1979 default:
1980 assert(false);
1981 }
1982
Zachary Turner03312862018-08-27 03:48:03 +00001983 TT->QualifiedName = demangleFullyQualifiedTypeName(MangledName);
1984 return TT;
Zachary Turnerd742d642018-07-26 19:56:09 +00001985}
1986
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001987// <pointer-type> ::= E? <pointer-cvr-qualifiers> <ext-qualifiers> <type>
1988// # the E is required for 64-bit non-static pointers
Zachary Turner03312862018-08-27 03:48:03 +00001989PointerTypeNode *Demangler::demanglePointerType(StringView &MangledName) {
1990 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001991
Zachary Turner931e8792018-07-30 23:02:10 +00001992 std::tie(Pointer->Quals, Pointer->Affinity) =
1993 demanglePointerCVQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001994
1995 if (MangledName.consumeFront("6")) {
Zachary Turner03312862018-08-27 03:48:03 +00001996 Pointer->Pointee = demangleFunctionType(MangledName, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001997 return Pointer;
1998 }
1999
Zachary Turner316109b2018-07-29 16:38:02 +00002000 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002001 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
2002
Zachary Turner316109b2018-07-29 16:38:02 +00002003 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Mangle);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002004 return Pointer;
2005}
2006
Zachary Turner03312862018-08-27 03:48:03 +00002007PointerTypeNode *Demangler::demangleMemberPointerType(StringView &MangledName) {
2008 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
Zachary Turnerd742d642018-07-26 19:56:09 +00002009
Zachary Turner03312862018-08-27 03:48:03 +00002010 std::tie(Pointer->Quals, Pointer->Affinity) =
2011 demanglePointerCVQualifiers(MangledName);
2012 assert(Pointer->Affinity == PointerAffinity::Pointer);
Zachary Turnerd742d642018-07-26 19:56:09 +00002013
Zachary Turner316109b2018-07-29 16:38:02 +00002014 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00002015 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
2016
Nico Weber63b97d22019-04-08 19:46:53 +00002017 // isMemberPointer() only returns true if there is at least one character
2018 // after the qualifiers.
Zachary Turner38b78a72018-07-26 20:20:10 +00002019 if (MangledName.consumeFront("8")) {
Zachary Turner32a8a202018-08-29 23:56:09 +00002020 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
Zachary Turner03312862018-08-27 03:48:03 +00002021 Pointer->Pointee = demangleFunctionType(MangledName, true);
Zachary Turner38b78a72018-07-26 20:20:10 +00002022 } else {
2023 Qualifiers PointeeQuals = Q_None;
2024 bool IsMember = false;
Zachary Turner316109b2018-07-29 16:38:02 +00002025 std::tie(PointeeQuals, IsMember) = demangleQualifiers(MangledName);
Nico Weber63b97d22019-04-08 19:46:53 +00002026 assert(IsMember || Error);
Zachary Turner32a8a202018-08-29 23:56:09 +00002027 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00002028
Zachary Turner316109b2018-07-29 16:38:02 +00002029 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Drop);
Nico Weber63b97d22019-04-08 19:46:53 +00002030 if (Pointer->Pointee)
2031 Pointer->Pointee->Quals = PointeeQuals;
Zachary Turner38b78a72018-07-26 20:20:10 +00002032 }
2033
Zachary Turnerd742d642018-07-26 19:56:09 +00002034 return Pointer;
2035}
2036
Zachary Turner316109b2018-07-29 16:38:02 +00002037Qualifiers Demangler::demanglePointerExtQualifiers(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002038 Qualifiers Quals = Q_None;
2039 if (MangledName.consumeFront('E'))
2040 Quals = Qualifiers(Quals | Q_Pointer64);
2041 if (MangledName.consumeFront('I'))
2042 Quals = Qualifiers(Quals | Q_Restrict);
2043 if (MangledName.consumeFront('F'))
2044 Quals = Qualifiers(Quals | Q_Unaligned);
2045
2046 return Quals;
2047}
2048
Zachary Turner03312862018-08-27 03:48:03 +00002049ArrayTypeNode *Demangler::demangleArrayType(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002050 assert(MangledName.front() == 'Y');
2051 MangledName.popFront();
2052
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002053 uint64_t Rank = 0;
2054 bool IsNegative = false;
2055 std::tie(Rank, IsNegative) = demangleNumber(MangledName);
2056 if (IsNegative || Rank == 0) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002057 Error = true;
2058 return nullptr;
2059 }
2060
Zachary Turner03312862018-08-27 03:48:03 +00002061 ArrayTypeNode *ATy = Arena.alloc<ArrayTypeNode>();
2062 NodeList *Head = Arena.alloc<NodeList>();
2063 NodeList *Tail = Head;
2064
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002065 for (uint64_t I = 0; I < Rank; ++I) {
Zachary Turner03312862018-08-27 03:48:03 +00002066 uint64_t D = 0;
2067 std::tie(D, IsNegative) = demangleNumber(MangledName);
Nico Weber16725812019-04-03 23:27:18 +00002068 if (Error || IsNegative) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002069 Error = true;
2070 return nullptr;
2071 }
Zachary Turner03312862018-08-27 03:48:03 +00002072 Tail->N = Arena.alloc<IntegerLiteralNode>(D, IsNegative);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002073 if (I + 1 < Rank) {
Zachary Turner03312862018-08-27 03:48:03 +00002074 Tail->Next = Arena.alloc<NodeList>();
2075 Tail = Tail->Next;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002076 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002077 }
Zachary Turner03312862018-08-27 03:48:03 +00002078 ATy->Dimensions = nodeListToNodeArray(Arena, Head, Rank);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002079
2080 if (MangledName.consumeFront("$$C")) {
Zachary Turner2bbb23b2018-08-14 18:54:28 +00002081 bool IsMember = false;
2082 std::tie(ATy->Quals, IsMember) = demangleQualifiers(MangledName);
2083 if (IsMember) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002084 Error = true;
Zachary Turner2bbb23b2018-08-14 18:54:28 +00002085 return nullptr;
2086 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002087 }
2088
Zachary Turner316109b2018-07-29 16:38:02 +00002089 ATy->ElementType = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002090 return ATy;
2091}
2092
2093// Reads a function or a template parameters.
Zachary Turner03312862018-08-27 03:48:03 +00002094NodeArrayNode *
Zachary Turnerd30700f2018-07-31 17:16:44 +00002095Demangler::demangleFunctionParameterList(StringView &MangledName) {
Zachary Turner38b78a72018-07-26 20:20:10 +00002096 // Empty parameter list.
Zachary Turner38b78a72018-07-26 20:20:10 +00002097 if (MangledName.consumeFront('X'))
Nico Weber930994c2019-04-16 14:24:42 +00002098 return nullptr;
Zachary Turner38b78a72018-07-26 20:20:10 +00002099
Zachary Turner03312862018-08-27 03:48:03 +00002100 NodeList *Head = Arena.alloc<NodeList>();
2101 NodeList **Current = &Head;
2102 size_t Count = 0;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002103 while (!Error && !MangledName.startsWith('@') &&
2104 !MangledName.startsWith('Z')) {
Zachary Turner03312862018-08-27 03:48:03 +00002105 ++Count;
Zachary Turner23df1312018-07-26 22:13:39 +00002106
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002107 if (startsWithDigit(MangledName)) {
Zachary Turner30375de2018-07-26 22:24:01 +00002108 size_t N = MangledName[0] - '0';
Zachary Turnerd346cba2018-08-08 17:17:04 +00002109 if (N >= Backrefs.FunctionParamCount) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002110 Error = true;
Nico Weber930994c2019-04-16 14:24:42 +00002111 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002112 }
2113 MangledName = MangledName.dropFront();
2114
Zachary Turner03312862018-08-27 03:48:03 +00002115 *Current = Arena.alloc<NodeList>();
2116 (*Current)->N = Backrefs.FunctionParams[N];
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002117 Current = &(*Current)->Next;
2118 continue;
2119 }
2120
Zachary Turner23df1312018-07-26 22:13:39 +00002121 size_t OldSize = MangledName.size();
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002122
Zachary Turner03312862018-08-27 03:48:03 +00002123 *Current = Arena.alloc<NodeList>();
2124 TypeNode *TN = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turner8fb9a712018-12-14 18:10:13 +00002125 if (!TN || Error)
2126 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00002127
2128 (*Current)->N = TN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002129
Zachary Turner23df1312018-07-26 22:13:39 +00002130 size_t CharsConsumed = OldSize - MangledName.size();
2131 assert(CharsConsumed != 0);
2132
2133 // Single-letter types are ignored for backreferences because memorizing
2134 // them doesn't save anything.
Zachary Turnerd346cba2018-08-08 17:17:04 +00002135 if (Backrefs.FunctionParamCount <= 9 && CharsConsumed > 1)
Zachary Turner03312862018-08-27 03:48:03 +00002136 Backrefs.FunctionParams[Backrefs.FunctionParamCount++] = TN;
Zachary Turner23df1312018-07-26 22:13:39 +00002137
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002138 Current = &(*Current)->Next;
2139 }
2140
Zachary Turner38b78a72018-07-26 20:20:10 +00002141 if (Error)
Nico Weber930994c2019-04-16 14:24:42 +00002142 return nullptr;
Zachary Turner38b78a72018-07-26 20:20:10 +00002143
Zachary Turner03312862018-08-27 03:48:03 +00002144 NodeArrayNode *NA = nodeListToNodeArray(Arena, Head, Count);
Zachary Turner38b78a72018-07-26 20:20:10 +00002145 // A non-empty parameter list is terminated by either 'Z' (variadic) parameter
2146 // list or '@' (non variadic). Careful not to consume "@Z", as in that case
2147 // the following Z could be a throw specifier.
2148 if (MangledName.consumeFront('@'))
Zachary Turner03312862018-08-27 03:48:03 +00002149 return NA;
Zachary Turner38b78a72018-07-26 20:20:10 +00002150
2151 if (MangledName.consumeFront('Z')) {
Zachary Turner03312862018-08-27 03:48:03 +00002152 // This is a variadic parameter list. We probably need a variadic node to
2153 // append to the end.
2154 return NA;
Zachary Turner38b78a72018-07-26 20:20:10 +00002155 }
2156
2157 Error = true;
Nico Weber930994c2019-04-16 14:24:42 +00002158 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002159}
2160
Zachary Turner03312862018-08-27 03:48:03 +00002161NodeArrayNode *
Zachary Turnerd30700f2018-07-31 17:16:44 +00002162Demangler::demangleTemplateParameterList(StringView &MangledName) {
Zachary Turner03312862018-08-27 03:48:03 +00002163 NodeList *Head;
2164 NodeList **Current = &Head;
2165 size_t Count = 0;
2166
Zachary Turner23df1312018-07-26 22:13:39 +00002167 while (!Error && !MangledName.startsWith('@')) {
Zachary Turner32a8a202018-08-29 23:56:09 +00002168 if (MangledName.consumeFront("$S") || MangledName.consumeFront("$$V") ||
Zachary Turner78ab3cb2018-08-30 20:53:29 +00002169 MangledName.consumeFront("$$$V") || MangledName.consumeFront("$$Z")) {
2170 // parameter pack separator
Zachary Turner32a8a202018-08-29 23:56:09 +00002171 continue;
2172 }
2173
Zachary Turner03312862018-08-27 03:48:03 +00002174 ++Count;
Zachary Turner32a8a202018-08-29 23:56:09 +00002175
Zachary Turner23df1312018-07-26 22:13:39 +00002176 // Template parameter lists don't participate in back-referencing.
Zachary Turner03312862018-08-27 03:48:03 +00002177 *Current = Arena.alloc<NodeList>();
Zachary Turner931e8792018-07-30 23:02:10 +00002178
Zachary Turner03312862018-08-27 03:48:03 +00002179 NodeList &TP = **Current;
Zachary Turner66555a72018-08-20 19:15:35 +00002180
Zachary Turner03312862018-08-27 03:48:03 +00002181 TemplateParameterReferenceNode *TPRN = nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +00002182 if (MangledName.consumeFront("$$Y")) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002183 // Template alias
Zachary Turner03312862018-08-27 03:48:03 +00002184 TP.N = demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002185 } else if (MangledName.consumeFront("$$B")) {
2186 // Array
Zachary Turner03312862018-08-27 03:48:03 +00002187 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turner073620b2018-08-10 19:57:36 +00002188 } else if (MangledName.consumeFront("$$C")) {
2189 // Type has qualifiers.
Zachary Turner03312862018-08-27 03:48:03 +00002190 TP.N = demangleType(MangledName, QualifierMangleMode::Mangle);
Zachary Turner66555a72018-08-20 19:15:35 +00002191 } else if (MangledName.startsWith("$1") || MangledName.startsWith("$H") ||
2192 MangledName.startsWith("$I") || MangledName.startsWith("$J")) {
Zachary Turner03312862018-08-27 03:48:03 +00002193 // Pointer to member
2194 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2195 TPRN->IsMemberPointer = true;
2196
Zachary Turner66555a72018-08-20 19:15:35 +00002197 MangledName = MangledName.dropFront();
2198 // 1 - single inheritance <name>
2199 // H - multiple inheritance <name> <number>
2200 // I - virtual inheritance <name> <number> <number> <number>
2201 // J - unspecified inheritance <name> <number> <number> <number>
2202 char InheritanceSpecifier = MangledName.popFront();
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00002203 SymbolNode *S = nullptr;
2204 if (MangledName.startsWith('?')) {
2205 S = parse(MangledName);
Nico Weber09fb2022019-05-22 15:53:23 +00002206 if (Error || !S->Name) {
2207 Error = true;
Nico Weberf2d8f092019-04-11 22:23:35 +00002208 return nullptr;
Nico Weber09fb2022019-05-22 15:53:23 +00002209 }
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00002210 memorizeIdentifier(S->Name->getUnqualifiedIdentifier());
2211 }
2212
Zachary Turner66555a72018-08-20 19:15:35 +00002213 switch (InheritanceSpecifier) {
2214 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00002215 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2216 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002217 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002218 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00002219 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2220 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002221 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002222 case 'H':
Zachary Turner03312862018-08-27 03:48:03 +00002223 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2224 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002225 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002226 case '1':
2227 break;
2228 default:
2229 Error = true;
2230 break;
2231 }
Zachary Turner03312862018-08-27 03:48:03 +00002232 TPRN->Affinity = PointerAffinity::Pointer;
2233 TPRN->Symbol = S;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002234 } else if (MangledName.startsWith("$E?")) {
2235 MangledName.consumeFront("$E");
2236 // Reference to symbol
Zachary Turner03312862018-08-27 03:48:03 +00002237 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2238 TPRN->Symbol = parse(MangledName);
2239 TPRN->Affinity = PointerAffinity::Reference;
Zachary Turner66555a72018-08-20 19:15:35 +00002240 } else if (MangledName.startsWith("$F") || MangledName.startsWith("$G")) {
Zachary Turner03312862018-08-27 03:48:03 +00002241 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2242
Zachary Turner66555a72018-08-20 19:15:35 +00002243 // Data member pointer.
2244 MangledName = MangledName.dropFront();
2245 char InheritanceSpecifier = MangledName.popFront();
2246
2247 switch (InheritanceSpecifier) {
2248 case 'G':
Zachary Turner03312862018-08-27 03:48:03 +00002249 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2250 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002251 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002252 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00002253 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2254 demangleSigned(MangledName);
2255 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2256 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002257 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002258 case '0':
2259 break;
2260 default:
2261 Error = true;
2262 break;
2263 }
Zachary Turner03312862018-08-27 03:48:03 +00002264 TPRN->IsMemberPointer = true;
Zachary Turner66555a72018-08-20 19:15:35 +00002265
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002266 } else if (MangledName.consumeFront("$0")) {
2267 // Integral non-type template parameter
2268 bool IsNegative = false;
2269 uint64_t Value = 0;
2270 std::tie(Value, IsNegative) = demangleNumber(MangledName);
2271
Zachary Turner03312862018-08-27 03:48:03 +00002272 TP.N = Arena.alloc<IntegerLiteralNode>(Value, IsNegative);
Zachary Turnerd30700f2018-07-31 17:16:44 +00002273 } else {
Zachary Turner03312862018-08-27 03:48:03 +00002274 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turnerd30700f2018-07-31 17:16:44 +00002275 }
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002276 if (Error)
2277 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002278
Zachary Turner66555a72018-08-20 19:15:35 +00002279 Current = &TP.Next;
Zachary Turner23df1312018-07-26 22:13:39 +00002280 }
2281
2282 if (Error)
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002283 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002284
2285 // Template parameter lists cannot be variadic, so it can only be terminated
2286 // by @.
2287 if (MangledName.consumeFront('@'))
Zachary Turner03312862018-08-27 03:48:03 +00002288 return nodeListToNodeArray(Arena, Head, Count);
Zachary Turner23df1312018-07-26 22:13:39 +00002289 Error = true;
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002290 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002291}
2292
Zachary Turner3a758e22018-08-01 18:33:04 +00002293void Demangler::dumpBackReferences() {
Zachary Turner5ae08b82018-08-01 18:44:12 +00002294 std::printf("%d function parameter backreferences\n",
Zachary Turnerd346cba2018-08-08 17:17:04 +00002295 (int)Backrefs.FunctionParamCount);
Zachary Turner3a758e22018-08-01 18:33:04 +00002296
2297 // Create an output stream so we can render each type.
Nico Weber1359d652018-09-15 18:24:20 +00002298 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +00002299 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00002300 std::terminate();
Zachary Turnerd346cba2018-08-08 17:17:04 +00002301 for (size_t I = 0; I < Backrefs.FunctionParamCount; ++I) {
Zachary Turner3a758e22018-08-01 18:33:04 +00002302 OS.setCurrentPosition(0);
2303
Zachary Turner03312862018-08-27 03:48:03 +00002304 TypeNode *T = Backrefs.FunctionParams[I];
Zachary Turner38d2edd2018-08-29 03:59:17 +00002305 T->output(OS, OF_Default);
Zachary Turner3a758e22018-08-01 18:33:04 +00002306
Zachary Turner7563ebe2018-08-02 17:08:24 +00002307 std::printf(" [%d] - %.*s\n", (int)I, (int)OS.getCurrentPosition(),
Zachary Turner5ae08b82018-08-01 18:44:12 +00002308 OS.getBuffer());
Zachary Turner3a758e22018-08-01 18:33:04 +00002309 }
2310 std::free(OS.getBuffer());
2311
Zachary Turnerd346cba2018-08-08 17:17:04 +00002312 if (Backrefs.FunctionParamCount > 0)
Zachary Turner5ae08b82018-08-01 18:44:12 +00002313 std::printf("\n");
Zachary Turnerd346cba2018-08-08 17:17:04 +00002314 std::printf("%d name backreferences\n", (int)Backrefs.NamesCount);
2315 for (size_t I = 0; I < Backrefs.NamesCount; ++I) {
Zachary Turner03312862018-08-27 03:48:03 +00002316 std::printf(" [%d] - %.*s\n", (int)I, (int)Backrefs.Names[I]->Name.size(),
2317 Backrefs.Names[I]->Name.begin());
Zachary Turner3a758e22018-08-01 18:33:04 +00002318 }
Zachary Turnerd346cba2018-08-08 17:17:04 +00002319 if (Backrefs.NamesCount > 0)
Zachary Turner5ae08b82018-08-01 18:44:12 +00002320 std::printf("\n");
Zachary Turner3a758e22018-08-01 18:33:04 +00002321}
2322
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002323char *llvm::microsoftDemangle(const char *MangledName, char *Buf, size_t *N,
Zachary Turner3a758e22018-08-01 18:33:04 +00002324 int *Status, MSDemangleFlags Flags) {
Nico Weber1359d652018-09-15 18:24:20 +00002325 int InternalStatus = demangle_success;
Zachary Turner316109b2018-07-29 16:38:02 +00002326 Demangler D;
Nico Weber1359d652018-09-15 18:24:20 +00002327 OutputStream S;
2328
Zachary Turner316109b2018-07-29 16:38:02 +00002329 StringView Name{MangledName};
Nico Weber1359d652018-09-15 18:24:20 +00002330 SymbolNode *AST = D.parse(Name);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002331
Zachary Turner3a758e22018-08-01 18:33:04 +00002332 if (Flags & MSDF_DumpBackrefs)
2333 D.dumpBackReferences();
Nico Weber1359d652018-09-15 18:24:20 +00002334
2335 if (D.Error)
2336 InternalStatus = demangle_invalid_mangled_name;
Nico Weber6808bc02018-11-11 10:04:00 +00002337 else if (!initializeOutputStream(Buf, N, S, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00002338 InternalStatus = demangle_memory_alloc_failure;
2339 else {
2340 AST->output(S, OF_Default);
2341 S += '\0';
2342 if (N != nullptr)
2343 *N = S.getCurrentPosition();
2344 Buf = S.getBuffer();
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002345 }
2346
Nico Weber1359d652018-09-15 18:24:20 +00002347 if (Status)
2348 *Status = InternalStatus;
2349 return InternalStatus == demangle_success ? Buf : nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002350}