blob: 425c7d3fd19bcafebaa2bd2d4ebb51c922ffb60a [file] [log] [blame]
//===- MicrosoftDemangle.cpp ----------------------------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file defines a demangler for MSVC-style mangled symbols.
//
// This file has no dependencies on the rest of LLVM so that it can be
// easily reused in other programs such as libcxxabi.
//
//===----------------------------------------------------------------------===//
15
#include "llvm/Demangle/MicrosoftDemangle.h"
#include "llvm/Demangle/Demangle.h"
#include "llvm/Demangle/MicrosoftDemangleNodes.h"

#include "llvm/Demangle/DemangleConfig.h"
#include "llvm/Demangle/StringView.h"
#include "llvm/Demangle/Utility.h"

#include <array>
#include <cctype>
#include <cstdio>
#include <cstring>
#include <tuple>
Zachary Turnerf435a7e2018-07-20 17:27:48 +000028
Zachary Turner03312862018-08-27 03:48:03 +000029using namespace llvm;
30using namespace ms_demangle;
Zachary Turnerf435a7e2018-07-20 17:27:48 +000031
32static bool startsWithDigit(StringView S) {
33 return !S.empty() && std::isdigit(S.front());
34}
35
Zachary Turnerd742d642018-07-26 19:56:09 +000036
Zachary Turner03312862018-08-27 03:48:03 +000037struct NodeList {
38 Node *N = nullptr;
39 NodeList *Next = nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +000040};
41
Zachary Turner8fb9a712018-12-14 18:10:13 +000042static bool isMemberPointer(StringView MangledName, bool &Error) {
43 Error = false;
Zachary Turnerd742d642018-07-26 19:56:09 +000044 switch (MangledName.popFront()) {
Zachary Turner931e8792018-07-30 23:02:10 +000045 case '$':
46 // This is probably an rvalue reference (e.g. $$Q), and you cannot have an
47 // rvalue reference to a member.
48 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +000049 case 'A':
50 // 'A' indicates a reference, and you cannot have a reference to a member
Zachary Turner931e8792018-07-30 23:02:10 +000051 // function or member.
Zachary Turnerd742d642018-07-26 19:56:09 +000052 return false;
53 case 'P':
54 case 'Q':
55 case 'R':
56 case 'S':
57 // These 4 values indicate some kind of pointer, but we still don't know
58 // what.
59 break;
60 default:
Zachary Turner8fb9a712018-12-14 18:10:13 +000061 Error = true;
62 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +000063 }
64
65 // If it starts with a number, then 6 indicates a non-member function
66 // pointer, and 8 indicates a member function pointer.
67 if (startsWithDigit(MangledName)) {
Nico Weber63b97d22019-04-08 19:46:53 +000068 if (MangledName[0] != '6' && MangledName[0] != '8') {
69 Error = true;
70 return false;
71 }
Zachary Turnerd742d642018-07-26 19:56:09 +000072 return (MangledName[0] == '8');
73 }
74
75 // Remove ext qualifiers since those can appear on either type and are
76 // therefore not indicative.
77 MangledName.consumeFront('E'); // 64-bit
78 MangledName.consumeFront('I'); // restrict
79 MangledName.consumeFront('F'); // unaligned
80
Nico Weber63b97d22019-04-08 19:46:53 +000081 if (MangledName.empty()) {
82 Error = true;
83 return false;
84 }
Zachary Turnerd742d642018-07-26 19:56:09 +000085
86 // The next value should be either ABCD (non-member) or QRST (member).
87 switch (MangledName.front()) {
88 case 'A':
89 case 'B':
90 case 'C':
91 case 'D':
92 return false;
93 case 'Q':
94 case 'R':
95 case 'S':
96 case 'T':
97 return true;
98 default:
Zachary Turner8fb9a712018-12-14 18:10:13 +000099 Error = true;
100 return false;
Zachary Turnerd742d642018-07-26 19:56:09 +0000101 }
Zachary Turnerd742d642018-07-26 19:56:09 +0000102}
103
Zachary Turner03312862018-08-27 03:48:03 +0000104static SpecialIntrinsicKind
105consumeSpecialIntrinsicKind(StringView &MangledName) {
106 if (MangledName.consumeFront("?_7"))
107 return SpecialIntrinsicKind::Vftable;
108 if (MangledName.consumeFront("?_8"))
109 return SpecialIntrinsicKind::Vbtable;
110 if (MangledName.consumeFront("?_9"))
111 return SpecialIntrinsicKind::VcallThunk;
112 if (MangledName.consumeFront("?_A"))
113 return SpecialIntrinsicKind::Typeof;
114 if (MangledName.consumeFront("?_B"))
115 return SpecialIntrinsicKind::LocalStaticGuard;
116 if (MangledName.consumeFront("?_C"))
117 return SpecialIntrinsicKind::StringLiteralSymbol;
118 if (MangledName.consumeFront("?_P"))
119 return SpecialIntrinsicKind::UdtReturning;
120 if (MangledName.consumeFront("?_R0"))
121 return SpecialIntrinsicKind::RttiTypeDescriptor;
122 if (MangledName.consumeFront("?_R1"))
123 return SpecialIntrinsicKind::RttiBaseClassDescriptor;
124 if (MangledName.consumeFront("?_R2"))
125 return SpecialIntrinsicKind::RttiBaseClassArray;
126 if (MangledName.consumeFront("?_R3"))
127 return SpecialIntrinsicKind::RttiClassHierarchyDescriptor;
128 if (MangledName.consumeFront("?_R4"))
129 return SpecialIntrinsicKind::RttiCompleteObjLocator;
130 if (MangledName.consumeFront("?_S"))
131 return SpecialIntrinsicKind::LocalVftable;
132 if (MangledName.consumeFront("?__E"))
133 return SpecialIntrinsicKind::DynamicInitializer;
134 if (MangledName.consumeFront("?__F"))
135 return SpecialIntrinsicKind::DynamicAtexitDestructor;
136 if (MangledName.consumeFront("?__J"))
137 return SpecialIntrinsicKind::LocalStaticThreadGuard;
138 return SpecialIntrinsicKind::None;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000139}
140
Zachary Turner71c91f92018-07-30 03:12:34 +0000141static bool startsWithLocalScopePattern(StringView S) {
142 if (!S.consumeFront('?'))
143 return false;
144 if (S.size() < 2)
145 return false;
146
147 size_t End = S.find('?');
148 if (End == StringView::npos)
149 return false;
150 StringView Candidate = S.substr(0, End);
151 if (Candidate.empty())
152 return false;
153
154 // \?[0-9]\?
155 // ?@? is the discriminator 0.
156 if (Candidate.size() == 1)
157 return Candidate[0] == '@' || (Candidate[0] >= '0' && Candidate[0] <= '9');
158
159 // If it's not 0-9, then it's an encoded number terminated with an @
160 if (Candidate.back() != '@')
161 return false;
162 Candidate = Candidate.dropBack();
163
164 // An encoded number starts with B-P and all subsequent digits are in A-P.
165 // Note that the reason the first digit cannot be A is two fold. First, it
166 // would create an ambiguity with ?A which delimits the beginning of an
167 // anonymous namespace. Second, A represents 0, and you don't start a multi
168 // digit number with a leading 0. Presumably the anonymous namespace
169 // ambiguity is also why single digit encoded numbers use 0-9 rather than A-J.
170 if (Candidate[0] < 'B' || Candidate[0] > 'P')
171 return false;
172 Candidate = Candidate.dropFront();
173 while (!Candidate.empty()) {
174 if (Candidate[0] < 'A' || Candidate[0] > 'P')
175 return false;
176 Candidate = Candidate.dropFront();
177 }
178
179 return true;
180}
181
Zachary Turner03312862018-08-27 03:48:03 +0000182static bool isTagType(StringView S) {
183 switch (S.front()) {
184 case 'T': // union
185 case 'U': // struct
186 case 'V': // class
187 case 'W': // enum
188 return true;
Zachary Turner38b78a72018-07-26 20:20:10 +0000189 }
Zachary Turner03312862018-08-27 03:48:03 +0000190 return false;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000191}
192
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000193static bool isCustomType(StringView S) { return S[0] == '?'; }
194
Zachary Turner03312862018-08-27 03:48:03 +0000195static bool isPointerType(StringView S) {
196 if (S.startsWith("$$Q")) // foo &&
197 return true;
198
199 switch (S.front()) {
200 case 'A': // foo &
201 case 'P': // foo *
202 case 'Q': // foo *const
203 case 'R': // foo *volatile
204 case 'S': // foo *const volatile
205 return true;
206 }
207 return false;
208}
209
210static bool isArrayType(StringView S) { return S[0] == 'Y'; }
211
212static bool isFunctionType(StringView S) {
213 return S.startsWith("$$A8@@") || S.startsWith("$$A6");
214}
215
216static FunctionRefQualifier
217demangleFunctionRefQualifier(StringView &MangledName) {
218 if (MangledName.consumeFront('G'))
219 return FunctionRefQualifier::Reference;
220 else if (MangledName.consumeFront('H'))
221 return FunctionRefQualifier::RValueReference;
222 return FunctionRefQualifier::None;
223}
224
225static std::pair<Qualifiers, PointerAffinity>
226demanglePointerCVQualifiers(StringView &MangledName) {
227 if (MangledName.consumeFront("$$Q"))
228 return std::make_pair(Q_None, PointerAffinity::RValueReference);
229
230 switch (MangledName.popFront()) {
231 case 'A':
232 return std::make_pair(Q_None, PointerAffinity::Reference);
233 case 'P':
234 return std::make_pair(Q_None, PointerAffinity::Pointer);
235 case 'Q':
236 return std::make_pair(Q_Const, PointerAffinity::Pointer);
237 case 'R':
238 return std::make_pair(Q_Volatile, PointerAffinity::Pointer);
239 case 'S':
240 return std::make_pair(Qualifiers(Q_Const | Q_Volatile),
241 PointerAffinity::Pointer);
Zachary Turner970fdc32018-08-16 16:17:36 +0000242 default:
Zachary Turner03312862018-08-27 03:48:03 +0000243 assert(false && "Ty is not a pointer type!");
Zachary Turner970fdc32018-08-16 16:17:36 +0000244 }
Zachary Turner03312862018-08-27 03:48:03 +0000245 return std::make_pair(Q_None, PointerAffinity::Pointer);
Zachary Turner970fdc32018-08-16 16:17:36 +0000246}
247
Zachary Turner71c91f92018-07-30 03:12:34 +0000248StringView Demangler::copyString(StringView Borrowed) {
249 char *Stable = Arena.allocUnalignedBuffer(Borrowed.size() + 1);
250 std::strcpy(Stable, Borrowed.begin());
251
252 return {Stable, Borrowed.size()};
253}
254
Zachary Turner03312862018-08-27 03:48:03 +0000255SpecialTableSymbolNode *
256Demangler::demangleSpecialTableSymbolNode(StringView &MangledName,
257 SpecialIntrinsicKind K) {
258 NamedIdentifierNode *NI = Arena.alloc<NamedIdentifierNode>();
259 switch (K) {
260 case SpecialIntrinsicKind::Vftable:
261 NI->Name = "`vftable'";
262 break;
263 case SpecialIntrinsicKind::Vbtable:
264 NI->Name = "`vbtable'";
265 break;
266 case SpecialIntrinsicKind::LocalVftable:
267 NI->Name = "`local vftable'";
268 break;
269 case SpecialIntrinsicKind::RttiCompleteObjLocator:
270 NI->Name = "`RTTI Complete Object Locator'";
271 break;
272 default:
Erik Pilkington5094e5e2019-01-17 20:37:51 +0000273 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000274 }
275 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
276 SpecialTableSymbolNode *STSN = Arena.alloc<SpecialTableSymbolNode>();
277 STSN->Name = QN;
Zachary Turner469f0762018-08-17 21:18:05 +0000278 bool IsMember = false;
Nico Weberae050d22019-04-14 23:32:37 +0000279 if (MangledName.empty()) {
280 Error = true;
281 return nullptr;
282 }
Zachary Turner03312862018-08-27 03:48:03 +0000283 char Front = MangledName.popFront();
284 if (Front != '6' && Front != '7') {
285 Error = true;
286 return nullptr;
287 }
288
289 std::tie(STSN->Quals, IsMember) = demangleQualifiers(MangledName);
290 if (!MangledName.consumeFront('@'))
291 STSN->TargetName = demangleFullyQualifiedTypeName(MangledName);
292 return STSN;
293}
294
295LocalStaticGuardVariableNode *
Nico Weber88ab2812019-05-28 14:54:49 +0000296Demangler::demangleLocalStaticGuard(StringView &MangledName, bool IsThread) {
Zachary Turner03312862018-08-27 03:48:03 +0000297 LocalStaticGuardIdentifierNode *LSGI =
298 Arena.alloc<LocalStaticGuardIdentifierNode>();
Nico Weber88ab2812019-05-28 14:54:49 +0000299 LSGI->IsThread = IsThread;
Zachary Turner03312862018-08-27 03:48:03 +0000300 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, LSGI);
301 LocalStaticGuardVariableNode *LSGVN =
302 Arena.alloc<LocalStaticGuardVariableNode>();
303 LSGVN->Name = QN;
304
305 if (MangledName.consumeFront("4IA"))
306 LSGVN->IsVisible = false;
307 else if (MangledName.consumeFront("5"))
308 LSGVN->IsVisible = true;
309 else {
310 Error = true;
311 return nullptr;
312 }
313
314 if (!MangledName.empty())
315 LSGI->ScopeIndex = demangleUnsigned(MangledName);
316 return LSGVN;
317}
318
319static NamedIdentifierNode *synthesizeNamedIdentifier(ArenaAllocator &Arena,
320 StringView Name) {
321 NamedIdentifierNode *Id = Arena.alloc<NamedIdentifierNode>();
322 Id->Name = Name;
323 return Id;
324}
325
326static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
327 IdentifierNode *Identifier) {
328 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
329 QN->Components = Arena.alloc<NodeArrayNode>();
330 QN->Components->Count = 1;
331 QN->Components->Nodes = Arena.allocArray<Node *>(1);
332 QN->Components->Nodes[0] = Identifier;
333 return QN;
334}
335
336static QualifiedNameNode *synthesizeQualifiedName(ArenaAllocator &Arena,
337 StringView Name) {
338 NamedIdentifierNode *Id = synthesizeNamedIdentifier(Arena, Name);
339 return synthesizeQualifiedName(Arena, Id);
340}
341
342static VariableSymbolNode *synthesizeVariable(ArenaAllocator &Arena,
343 TypeNode *Type,
344 StringView VariableName) {
345 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
346 VSN->Type = Type;
347 VSN->Name = synthesizeQualifiedName(Arena, VariableName);
348 return VSN;
349}
350
351VariableSymbolNode *Demangler::demangleUntypedVariable(
352 ArenaAllocator &Arena, StringView &MangledName, StringView VariableName) {
353 NamedIdentifierNode *NI = synthesizeNamedIdentifier(Arena, VariableName);
354 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, NI);
355 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
356 VSN->Name = QN;
357 if (MangledName.consumeFront("8"))
358 return VSN;
359
360 Error = true;
361 return nullptr;
362}
363
364VariableSymbolNode *
365Demangler::demangleRttiBaseClassDescriptorNode(ArenaAllocator &Arena,
366 StringView &MangledName) {
367 RttiBaseClassDescriptorNode *RBCDN =
368 Arena.alloc<RttiBaseClassDescriptorNode>();
369 RBCDN->NVOffset = demangleUnsigned(MangledName);
370 RBCDN->VBPtrOffset = demangleSigned(MangledName);
371 RBCDN->VBTableOffset = demangleUnsigned(MangledName);
372 RBCDN->Flags = demangleUnsigned(MangledName);
373 if (Error)
374 return nullptr;
375
376 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
377 VSN->Name = demangleNameScopeChain(MangledName, RBCDN);
378 MangledName.consumeFront('8');
379 return VSN;
380}
381
Zachary Turner32a8a202018-08-29 23:56:09 +0000382FunctionSymbolNode *Demangler::demangleInitFiniStub(StringView &MangledName,
383 bool IsDestructor) {
Zachary Turner03312862018-08-27 03:48:03 +0000384 DynamicStructorIdentifierNode *DSIN =
385 Arena.alloc<DynamicStructorIdentifierNode>();
386 DSIN->IsDestructor = IsDestructor;
Zachary Turner32a8a202018-08-29 23:56:09 +0000387
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000388 bool IsKnownStaticDataMember = false;
389 if (MangledName.consumeFront('?'))
390 IsKnownStaticDataMember = true;
391
Nico Weber63b97d22019-04-08 19:46:53 +0000392 SymbolNode *Symbol = demangleDeclarator(MangledName);
393 if (Error)
394 return nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +0000395
Zachary Turner32a8a202018-08-29 23:56:09 +0000396 FunctionSymbolNode *FSN = nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +0000397
398 if (Symbol->kind() == NodeKind::VariableSymbol) {
399 DSIN->Variable = static_cast<VariableSymbolNode *>(Symbol);
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000400
401 // Older versions of clang mangled this type of symbol incorrectly. They
402 // would omit the leading ? and they would only emit a single @ at the end.
403 // The correct mangling is a leading ? and 2 trailing @ signs. Handle
404 // both cases.
405 int AtCount = IsKnownStaticDataMember ? 2 : 1;
406 for (int I = 0; I < AtCount; ++I) {
407 if (MangledName.consumeFront('@'))
408 continue;
Zachary Turner32a8a202018-08-29 23:56:09 +0000409 Error = true;
410 return nullptr;
411 }
412
413 FSN = demangleFunctionEncoding(MangledName);
Nico Weber63b97d22019-04-08 19:46:53 +0000414 if (FSN)
415 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
Zachary Turner32a8a202018-08-29 23:56:09 +0000416 } else {
Zachary Turner78ab3cb2018-08-30 20:53:29 +0000417 if (IsKnownStaticDataMember) {
418 // This was supposed to be a static data member, but we got a function.
419 Error = true;
420 return nullptr;
421 }
422
Zachary Turner32a8a202018-08-29 23:56:09 +0000423 FSN = static_cast<FunctionSymbolNode *>(Symbol);
424 DSIN->Name = Symbol->Name;
425 FSN->Name = synthesizeQualifiedName(Arena, DSIN);
426 }
427
Zachary Turner03312862018-08-27 03:48:03 +0000428 return FSN;
429}
430
431SymbolNode *Demangler::demangleSpecialIntrinsic(StringView &MangledName) {
432 SpecialIntrinsicKind SIK = consumeSpecialIntrinsicKind(MangledName);
433 if (SIK == SpecialIntrinsicKind::None)
434 return nullptr;
435
436 switch (SIK) {
437 case SpecialIntrinsicKind::StringLiteralSymbol:
438 return demangleStringLiteral(MangledName);
439 case SpecialIntrinsicKind::Vftable:
440 case SpecialIntrinsicKind::Vbtable:
441 case SpecialIntrinsicKind::LocalVftable:
442 case SpecialIntrinsicKind::RttiCompleteObjLocator:
443 return demangleSpecialTableSymbolNode(MangledName, SIK);
444 case SpecialIntrinsicKind::VcallThunk:
445 return demangleVcallThunkNode(MangledName);
446 case SpecialIntrinsicKind::LocalStaticGuard:
Nico Weber88ab2812019-05-28 14:54:49 +0000447 return demangleLocalStaticGuard(MangledName, /*IsThread=*/false);
448 case SpecialIntrinsicKind::LocalStaticThreadGuard:
449 return demangleLocalStaticGuard(MangledName, /*IsThread=*/true);
Zachary Turner03312862018-08-27 03:48:03 +0000450 case SpecialIntrinsicKind::RttiTypeDescriptor: {
451 TypeNode *T = demangleType(MangledName, QualifierMangleMode::Result);
Zachary Turner469f0762018-08-17 21:18:05 +0000452 if (Error)
453 break;
454 if (!MangledName.consumeFront("@8"))
Zachary Turner03312862018-08-27 03:48:03 +0000455 break;
Zachary Turner469f0762018-08-17 21:18:05 +0000456 if (!MangledName.empty())
Zachary Turner03312862018-08-27 03:48:03 +0000457 break;
458 return synthesizeVariable(Arena, T, "`RTTI Type Descriptor'");
459 }
460 case SpecialIntrinsicKind::RttiBaseClassArray:
461 return demangleUntypedVariable(Arena, MangledName,
462 "`RTTI Base Class Array'");
463 case SpecialIntrinsicKind::RttiClassHierarchyDescriptor:
464 return demangleUntypedVariable(Arena, MangledName,
465 "`RTTI Class Hierarchy Descriptor'");
466 case SpecialIntrinsicKind::RttiBaseClassDescriptor:
467 return demangleRttiBaseClassDescriptorNode(Arena, MangledName);
468 case SpecialIntrinsicKind::DynamicInitializer:
Zachary Turner32a8a202018-08-29 23:56:09 +0000469 return demangleInitFiniStub(MangledName, false);
Zachary Turner03312862018-08-27 03:48:03 +0000470 case SpecialIntrinsicKind::DynamicAtexitDestructor:
Zachary Turner32a8a202018-08-29 23:56:09 +0000471 return demangleInitFiniStub(MangledName, true);
Zachary Turner469f0762018-08-17 21:18:05 +0000472 default:
Zachary Turner469f0762018-08-17 21:18:05 +0000473 break;
474 }
Zachary Turner03312862018-08-27 03:48:03 +0000475 Error = true;
476 return nullptr;
Zachary Turner469f0762018-08-17 21:18:05 +0000477}
478
Zachary Turner03312862018-08-27 03:48:03 +0000479IdentifierNode *
480Demangler::demangleFunctionIdentifierCode(StringView &MangledName) {
481 assert(MangledName.startsWith('?'));
482 MangledName = MangledName.dropFront();
Nico Weber321de482019-04-03 23:19:39 +0000483 if (MangledName.empty()) {
484 Error = true;
485 return nullptr;
486 }
Zachary Turner03312862018-08-27 03:48:03 +0000487
488 if (MangledName.consumeFront("__"))
489 return demangleFunctionIdentifierCode(
490 MangledName, FunctionIdentifierCodeGroup::DoubleUnder);
Nico Weberb4f33bb2019-04-11 22:47:18 +0000491 if (MangledName.consumeFront("_"))
Zachary Turner03312862018-08-27 03:48:03 +0000492 return demangleFunctionIdentifierCode(MangledName,
493 FunctionIdentifierCodeGroup::Under);
494 return demangleFunctionIdentifierCode(MangledName,
495 FunctionIdentifierCodeGroup::Basic);
496}
497
498StructorIdentifierNode *
499Demangler::demangleStructorIdentifier(StringView &MangledName,
500 bool IsDestructor) {
501 StructorIdentifierNode *N = Arena.alloc<StructorIdentifierNode>();
502 N->IsDestructor = IsDestructor;
503 return N;
504}
505
506ConversionOperatorIdentifierNode *
507Demangler::demangleConversionOperatorIdentifier(StringView &MangledName) {
508 ConversionOperatorIdentifierNode *N =
509 Arena.alloc<ConversionOperatorIdentifierNode>();
510 return N;
511}
512
513LiteralOperatorIdentifierNode *
514Demangler::demangleLiteralOperatorIdentifier(StringView &MangledName) {
515 LiteralOperatorIdentifierNode *N =
516 Arena.alloc<LiteralOperatorIdentifierNode>();
Nico Weberaf2ee7d2019-04-11 23:20:18 +0000517 N->Name = demangleSimpleString(MangledName, /*Memorize=*/false);
Zachary Turner03312862018-08-27 03:48:03 +0000518 return N;
519}
520
Nico Weber03db6252019-04-11 23:11:33 +0000521IntrinsicFunctionKind
522Demangler::translateIntrinsicFunctionCode(char CH,
523 FunctionIdentifierCodeGroup Group) {
524 using IFK = IntrinsicFunctionKind;
525 if (!(CH >= '0' && CH <= '9') && !(CH >= 'A' && CH <= 'Z')) {
526 Error = true;
527 return IFK::None;
528 }
529
Zachary Turner03312862018-08-27 03:48:03 +0000530 // Not all ? identifiers are intrinsics *functions*. This function only maps
531 // operator codes for the special functions, all others are handled elsewhere,
532 // hence the IFK::None entries in the table.
Zachary Turner03312862018-08-27 03:48:03 +0000533 static IFK Basic[36] = {
534 IFK::None, // ?0 # Foo::Foo()
535 IFK::None, // ?1 # Foo::~Foo()
536 IFK::New, // ?2 # operator new
537 IFK::Delete, // ?3 # operator delete
538 IFK::Assign, // ?4 # operator=
539 IFK::RightShift, // ?5 # operator>>
540 IFK::LeftShift, // ?6 # operator<<
541 IFK::LogicalNot, // ?7 # operator!
542 IFK::Equals, // ?8 # operator==
543 IFK::NotEquals, // ?9 # operator!=
544 IFK::ArraySubscript, // ?A # operator[]
545 IFK::None, // ?B # Foo::operator <type>()
546 IFK::Pointer, // ?C # operator->
547 IFK::Dereference, // ?D # operator*
548 IFK::Increment, // ?E # operator++
549 IFK::Decrement, // ?F # operator--
550 IFK::Minus, // ?G # operator-
551 IFK::Plus, // ?H # operator+
552 IFK::BitwiseAnd, // ?I # operator&
553 IFK::MemberPointer, // ?J # operator->*
554 IFK::Divide, // ?K # operator/
555 IFK::Modulus, // ?L # operator%
556 IFK::LessThan, // ?M operator<
557 IFK::LessThanEqual, // ?N operator<=
558 IFK::GreaterThan, // ?O operator>
559 IFK::GreaterThanEqual, // ?P operator>=
560 IFK::Comma, // ?Q operator,
561 IFK::Parens, // ?R operator()
562 IFK::BitwiseNot, // ?S operator~
563 IFK::BitwiseXor, // ?T operator^
564 IFK::BitwiseOr, // ?U operator|
565 IFK::LogicalAnd, // ?V operator&&
566 IFK::LogicalOr, // ?W operator||
567 IFK::TimesEqual, // ?X operator*=
568 IFK::PlusEqual, // ?Y operator+=
569 IFK::MinusEqual, // ?Z operator-=
570 };
571 static IFK Under[36] = {
572 IFK::DivEqual, // ?_0 operator/=
573 IFK::ModEqual, // ?_1 operator%=
574 IFK::RshEqual, // ?_2 operator>>=
575 IFK::LshEqual, // ?_3 operator<<=
576 IFK::BitwiseAndEqual, // ?_4 operator&=
577 IFK::BitwiseOrEqual, // ?_5 operator|=
578 IFK::BitwiseXorEqual, // ?_6 operator^=
579 IFK::None, // ?_7 # vftable
580 IFK::None, // ?_8 # vbtable
581 IFK::None, // ?_9 # vcall
582 IFK::None, // ?_A # typeof
583 IFK::None, // ?_B # local static guard
584 IFK::None, // ?_C # string literal
585 IFK::VbaseDtor, // ?_D # vbase destructor
586 IFK::VecDelDtor, // ?_E # vector deleting destructor
587 IFK::DefaultCtorClosure, // ?_F # default constructor closure
588 IFK::ScalarDelDtor, // ?_G # scalar deleting destructor
589 IFK::VecCtorIter, // ?_H # vector constructor iterator
590 IFK::VecDtorIter, // ?_I # vector destructor iterator
591 IFK::VecVbaseCtorIter, // ?_J # vector vbase constructor iterator
592 IFK::VdispMap, // ?_K # virtual displacement map
593 IFK::EHVecCtorIter, // ?_L # eh vector constructor iterator
594 IFK::EHVecDtorIter, // ?_M # eh vector destructor iterator
595 IFK::EHVecVbaseCtorIter, // ?_N # eh vector vbase constructor iterator
596 IFK::CopyCtorClosure, // ?_O # copy constructor closure
597 IFK::None, // ?_P<name> # udt returning <name>
598 IFK::None, // ?_Q # <unknown>
599 IFK::None, // ?_R0 - ?_R4 # RTTI Codes
600 IFK::None, // ?_S # local vftable
601 IFK::LocalVftableCtorClosure, // ?_T # local vftable constructor closure
602 IFK::ArrayNew, // ?_U operator new[]
603 IFK::ArrayDelete, // ?_V operator delete[]
604 IFK::None, // ?_W <unused>
605 IFK::None, // ?_X <unused>
606 IFK::None, // ?_Y <unused>
607 IFK::None, // ?_Z <unused>
608 };
609 static IFK DoubleUnder[36] = {
610 IFK::None, // ?__0 <unused>
611 IFK::None, // ?__1 <unused>
612 IFK::None, // ?__2 <unused>
613 IFK::None, // ?__3 <unused>
614 IFK::None, // ?__4 <unused>
615 IFK::None, // ?__5 <unused>
616 IFK::None, // ?__6 <unused>
617 IFK::None, // ?__7 <unused>
618 IFK::None, // ?__8 <unused>
619 IFK::None, // ?__9 <unused>
620 IFK::ManVectorCtorIter, // ?__A managed vector ctor iterator
621 IFK::ManVectorDtorIter, // ?__B managed vector dtor iterator
622 IFK::EHVectorCopyCtorIter, // ?__C EH vector copy ctor iterator
623 IFK::EHVectorVbaseCopyCtorIter, // ?__D EH vector vbase copy ctor iter
624 IFK::None, // ?__E dynamic initializer for `T'
625 IFK::None, // ?__F dynamic atexit destructor for `T'
626 IFK::VectorCopyCtorIter, // ?__G vector copy constructor iter
627 IFK::VectorVbaseCopyCtorIter, // ?__H vector vbase copy ctor iter
628 IFK::ManVectorVbaseCopyCtorIter, // ?__I managed vector vbase copy ctor
629 // iter
630 IFK::None, // ?__J local static thread guard
631 IFK::None, // ?__K operator ""_name
Nico Webere8f21b12019-04-23 16:20:27 +0000632 IFK::CoAwait, // ?__L operator co_await
633 IFK::Spaceship, // ?__M operator<=>
Zachary Turner03312862018-08-27 03:48:03 +0000634 IFK::None, // ?__N <unused>
635 IFK::None, // ?__O <unused>
636 IFK::None, // ?__P <unused>
637 IFK::None, // ?__Q <unused>
638 IFK::None, // ?__R <unused>
639 IFK::None, // ?__S <unused>
640 IFK::None, // ?__T <unused>
641 IFK::None, // ?__U <unused>
642 IFK::None, // ?__V <unused>
643 IFK::None, // ?__W <unused>
644 IFK::None, // ?__X <unused>
645 IFK::None, // ?__Y <unused>
646 IFK::None, // ?__Z <unused>
647 };
648
649 int Index = (CH >= '0' && CH <= '9') ? (CH - '0') : (CH - 'A' + 10);
650 switch (Group) {
651 case FunctionIdentifierCodeGroup::Basic:
652 return Basic[Index];
653 case FunctionIdentifierCodeGroup::Under:
654 return Under[Index];
655 case FunctionIdentifierCodeGroup::DoubleUnder:
656 return DoubleUnder[Index];
657 }
Erik Pilkington5094e5e2019-01-17 20:37:51 +0000658 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000659}
660
661IdentifierNode *
662Demangler::demangleFunctionIdentifierCode(StringView &MangledName,
663 FunctionIdentifierCodeGroup Group) {
Nico Weber63fe2592019-04-14 23:08:12 +0000664 if (MangledName.empty()) {
665 Error = true;
666 return nullptr;
667 }
Zachary Turner03312862018-08-27 03:48:03 +0000668 switch (Group) {
669 case FunctionIdentifierCodeGroup::Basic:
670 switch (char CH = MangledName.popFront()) {
671 case '0':
672 case '1':
673 return demangleStructorIdentifier(MangledName, CH == '1');
674 case 'B':
675 return demangleConversionOperatorIdentifier(MangledName);
676 default:
677 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
678 translateIntrinsicFunctionCode(CH, Group));
679 }
Zachary Turner03312862018-08-27 03:48:03 +0000680 case FunctionIdentifierCodeGroup::Under:
681 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
682 translateIntrinsicFunctionCode(MangledName.popFront(), Group));
683 case FunctionIdentifierCodeGroup::DoubleUnder:
684 switch (char CH = MangledName.popFront()) {
685 case 'K':
686 return demangleLiteralOperatorIdentifier(MangledName);
687 default:
688 return Arena.alloc<IntrinsicFunctionIdentifierNode>(
689 translateIntrinsicFunctionCode(CH, Group));
690 }
691 }
Zachary Turner03312862018-08-27 03:48:03 +0000692
Nico Weberef035182019-04-11 23:23:00 +0000693 DEMANGLE_UNREACHABLE;
Zachary Turner03312862018-08-27 03:48:03 +0000694}
695
696SymbolNode *Demangler::demangleEncodedSymbol(StringView &MangledName,
697 QualifiedNameNode *Name) {
Nico Weber63b97d22019-04-08 19:46:53 +0000698 if (MangledName.empty()) {
699 Error = true;
700 return nullptr;
701 }
702
Zachary Turner469f0762018-08-17 21:18:05 +0000703 // Read a variable.
704 switch (MangledName.front()) {
705 case '0':
706 case '1':
707 case '2':
708 case '3':
Zachary Turner03312862018-08-27 03:48:03 +0000709 case '4': {
710 StorageClass SC = demangleVariableStorageClass(MangledName);
711 return demangleVariableEncoding(MangledName, SC);
Zachary Turner469f0762018-08-17 21:18:05 +0000712 }
Zachary Turner03312862018-08-27 03:48:03 +0000713 }
714 FunctionSymbolNode *FSN = demangleFunctionEncoding(MangledName);
715
716 IdentifierNode *UQN = Name->getUnqualifiedIdentifier();
717 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
718 ConversionOperatorIdentifierNode *COIN =
719 static_cast<ConversionOperatorIdentifierNode *>(UQN);
Nico Weber63b97d22019-04-08 19:46:53 +0000720 if (FSN)
721 COIN->TargetType = FSN->Signature->ReturnType;
Zachary Turner03312862018-08-27 03:48:03 +0000722 }
723 return FSN;
Zachary Turner469f0762018-08-17 21:18:05 +0000724}
725
Nico Weber63b97d22019-04-08 19:46:53 +0000726SymbolNode *Demangler::demangleDeclarator(StringView &MangledName) {
727 // What follows is a main symbol name. This may include namespaces or class
728 // back references.
729 QualifiedNameNode *QN = demangleFullyQualifiedSymbolName(MangledName);
730 if (Error)
731 return nullptr;
732
733 SymbolNode *Symbol = demangleEncodedSymbol(MangledName, QN);
734 if (Error)
735 return nullptr;
736 Symbol->Name = QN;
737
738 IdentifierNode *UQN = QN->getUnqualifiedIdentifier();
739 if (UQN->kind() == NodeKind::ConversionOperatorIdentifier) {
740 ConversionOperatorIdentifierNode *COIN =
741 static_cast<ConversionOperatorIdentifierNode *>(UQN);
742 if (!COIN->TargetType) {
743 Error = true;
744 return nullptr;
745 }
746 }
747 return Symbol;
748}
749
Nico Weber82dc06c2019-05-27 23:10:42 +0000750SymbolNode *Demangler::demangleMD5Name(StringView &MangledName) {
751 assert(MangledName.startsWith("??@"));
752 // This is an MD5 mangled name. We can't demangle it, just return the
753 // mangled name.
754 // An MD5 mangled name is ??@ followed by 32 characters and a terminating @.
755 size_t MD5Last = MangledName.find('@', strlen("??@"));
756 if (MD5Last == StringView::npos) {
757 Error = true;
758 return nullptr;
759 }
760 const char *Start = MangledName.begin();
761 MangledName = MangledName.dropFront(MD5Last + 1);
762
763 // There are two additional special cases for MD5 names:
764 // 1. For complete object locators where the object name is long enough
765 // for the object to have an MD5 name, the complete object locator is
766 // called ??@...@??_R4@ (with a trailing "??_R4@" instead of the usual
767 // leading "??_R4". This is handled here.
768 // 2. For catchable types, in versions of MSVC before 2015 (<1900) or after
769 // 2017.2 (>= 1914), the catchable type mangling is _CT??@...@??@...@8
770 // instead of_CT??@...@8 with just one MD5 name. Since we don't yet
771 // demangle catchable types anywhere, this isn't handled for MD5 names
772 // either.
773 MangledName.consumeFront("??_R4@");
774
775 StringView MD5(Start, MangledName.begin());
776 SymbolNode *S = Arena.alloc<SymbolNode>(NodeKind::Md5Symbol);
777 S->Name = synthesizeQualifiedName(Arena, MD5);
778
779 return S;
780}
781
Zachary Turner469f0762018-08-17 21:18:05 +0000782// Parser entry point.
Zachary Turner03312862018-08-27 03:48:03 +0000783SymbolNode *Demangler::parse(StringView &MangledName) {
Nico Weber82dc06c2019-05-27 23:10:42 +0000784 if (MangledName.startsWith("??@"))
785 return demangleMD5Name(MangledName);
Zachary Turner83313f82018-08-16 16:17:17 +0000786
Nico Webercfe08bc2019-05-27 00:48:59 +0000787 // MSVC-style mangled symbols must start with '?'.
Zachary Turner03312862018-08-27 03:48:03 +0000788 if (!MangledName.startsWith('?')) {
789 Error = true;
790 return nullptr;
791 }
792
Zachary Turner469f0762018-08-17 21:18:05 +0000793 MangledName.consumeFront('?');
Zachary Turner970fdc32018-08-16 16:17:36 +0000794
Zachary Turner469f0762018-08-17 21:18:05 +0000795 // ?$ is a template instantiation, but all other names that start with ? are
796 // operators / special names.
Zachary Turner03312862018-08-27 03:48:03 +0000797 if (SymbolNode *SI = demangleSpecialIntrinsic(MangledName))
798 return SI;
Zachary Turner469f0762018-08-17 21:18:05 +0000799
Nico Weber63b97d22019-04-08 19:46:53 +0000800 return demangleDeclarator(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000801}
802
Zachary Turner7ba90562018-11-01 15:07:32 +0000803TagTypeNode *Demangler::parseTagUniqueName(StringView &MangledName) {
804 if (!MangledName.consumeFront(".?A"))
805 return nullptr;
806 MangledName.consumeFront(".?A");
807 if (MangledName.empty())
808 return nullptr;
809
810 return demangleClassType(MangledName);
811}
812
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000813// <type-encoding> ::= <storage-class> <variable-type>
814// <storage-class> ::= 0 # private static member
815// ::= 1 # protected static member
816// ::= 2 # public static member
817// ::= 3 # global
818// ::= 4 # static local
819
Zachary Turner03312862018-08-27 03:48:03 +0000820VariableSymbolNode *Demangler::demangleVariableEncoding(StringView &MangledName,
821 StorageClass SC) {
822 VariableSymbolNode *VSN = Arena.alloc<VariableSymbolNode>();
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000823
Zachary Turner03312862018-08-27 03:48:03 +0000824 VSN->Type = demangleType(MangledName, QualifierMangleMode::Drop);
825 VSN->SC = SC;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000826
Nico Weber63b97d22019-04-08 19:46:53 +0000827 if (Error)
828 return nullptr;
829
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000830 // <variable-type> ::= <type> <cvr-qualifiers>
831 // ::= <type> <pointee-cvr-qualifiers> # pointers, references
Zachary Turner03312862018-08-27 03:48:03 +0000832 switch (VSN->Type->kind()) {
833 case NodeKind::PointerType: {
834 PointerTypeNode *PTN = static_cast<PointerTypeNode *>(VSN->Type);
835
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000836 Qualifiers ExtraChildQuals = Q_None;
Zachary Turner03312862018-08-27 03:48:03 +0000837 PTN->Quals = Qualifiers(VSN->Type->Quals |
838 demanglePointerExtQualifiers(MangledName));
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000839
Zachary Turnerd742d642018-07-26 19:56:09 +0000840 bool IsMember = false;
Zachary Turner316109b2018-07-29 16:38:02 +0000841 std::tie(ExtraChildQuals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000842
Zachary Turner03312862018-08-27 03:48:03 +0000843 if (PTN->ClassParent) {
844 QualifiedNameNode *BackRefName =
845 demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000846 (void)BackRefName;
847 }
Zachary Turner03312862018-08-27 03:48:03 +0000848 PTN->Pointee->Quals = Qualifiers(PTN->Pointee->Quals | ExtraChildQuals);
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000849
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000850 break;
851 }
852 default:
Zachary Turner03312862018-08-27 03:48:03 +0000853 VSN->Type->Quals = demangleQualifiers(MangledName).first;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000854 break;
855 }
856
Zachary Turner03312862018-08-27 03:48:03 +0000857 return VSN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000858}
859
860// Sometimes numbers are encoded in mangled symbols. For example,
861// "int (*x)[20]" is a valid C type (x is a pointer to an array of
862// length 20), so we need some way to embed numbers as part of symbols.
863// This function parses it.
864//
865// <number> ::= [?] <non-negative integer>
866//
867// <non-negative integer> ::= <decimal digit> # when 1 <= Number <= 10
Nico Weber502cf4b2019-04-18 19:30:21 +0000868// ::= <hex digit>+ @ # when Number == 0 or >= 10
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000869//
870// <hex-digit> ::= [A-P] # A = 0, B = 1, ...
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000871std::pair<uint64_t, bool> Demangler::demangleNumber(StringView &MangledName) {
872 bool IsNegative = MangledName.consumeFront('?');
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000873
874 if (startsWithDigit(MangledName)) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000875 uint64_t Ret = MangledName[0] - '0' + 1;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000876 MangledName = MangledName.dropFront(1);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000877 return {Ret, IsNegative};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000878 }
879
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000880 uint64_t Ret = 0;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000881 for (size_t i = 0; i < MangledName.size(); ++i) {
882 char C = MangledName[i];
883 if (C == '@') {
884 MangledName = MangledName.dropFront(i + 1);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000885 return {Ret, IsNegative};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000886 }
887 if ('A' <= C && C <= 'P') {
888 Ret = (Ret << 4) + (C - 'A');
889 continue;
890 }
891 break;
892 }
893
894 Error = true;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +0000895 return {0ULL, false};
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000896}
897
Zachary Turner469f0762018-08-17 21:18:05 +0000898uint64_t Demangler::demangleUnsigned(StringView &MangledName) {
899 bool IsNegative = false;
900 uint64_t Number = 0;
901 std::tie(Number, IsNegative) = demangleNumber(MangledName);
902 if (IsNegative)
903 Error = true;
904 return Number;
905}
906
907int64_t Demangler::demangleSigned(StringView &MangledName) {
908 bool IsNegative = false;
909 uint64_t Number = 0;
910 std::tie(Number, IsNegative) = demangleNumber(MangledName);
911 if (Number > INT64_MAX)
912 Error = true;
913 int64_t I = static_cast<int64_t>(Number);
914 return IsNegative ? -I : I;
915}
916
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000917// First 10 strings can be referenced by special BackReferences ?0, ?1, ..., ?9.
918// Memorize it.
919void Demangler::memorizeString(StringView S) {
Zachary Turnerd346cba2018-08-08 17:17:04 +0000920 if (Backrefs.NamesCount >= BackrefContext::Max)
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000921 return;
Zachary Turnerd346cba2018-08-08 17:17:04 +0000922 for (size_t i = 0; i < Backrefs.NamesCount; ++i)
Zachary Turner03312862018-08-27 03:48:03 +0000923 if (S == Backrefs.Names[i]->Name)
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000924 return;
Zachary Turner03312862018-08-27 03:48:03 +0000925 NamedIdentifierNode *N = Arena.alloc<NamedIdentifierNode>();
926 N->Name = S;
927 Backrefs.Names[Backrefs.NamesCount++] = N;
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000928}
929
Zachary Turner03312862018-08-27 03:48:03 +0000930NamedIdentifierNode *Demangler::demangleBackRefName(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +0000931 assert(startsWithDigit(MangledName));
Zachary Turnerd9e925f2018-08-18 18:49:48 +0000932
933 size_t I = MangledName[0] - '0';
934 if (I >= Backrefs.NamesCount) {
935 Error = true;
936 return nullptr;
937 }
938
Zachary Turner172aea12018-08-02 17:08:03 +0000939 MangledName = MangledName.dropFront();
Zachary Turner03312862018-08-27 03:48:03 +0000940 return Backrefs.Names[I];
Zachary Turnerf435a7e2018-07-20 17:27:48 +0000941}
942
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000943void Demangler::memorizeIdentifier(IdentifierNode *Identifier) {
944 // Render this class template name into a string buffer so that we can
945 // memorize it for the purpose of back-referencing.
Nico Weber1359d652018-09-15 18:24:20 +0000946 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +0000947 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +0000948 // FIXME: Propagate out-of-memory as an error?
949 std::terminate();
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000950 Identifier->output(OS, OF_Default);
951 OS << '\0';
952 char *Name = OS.getBuffer();
953
954 StringView Owned = copyString(Name);
955 memorizeString(Owned);
956 std::free(Name);
957}
958
Zachary Turner03312862018-08-27 03:48:03 +0000959IdentifierNode *
960Demangler::demangleTemplateInstantiationName(StringView &MangledName,
961 NameBackrefBehavior NBB) {
Zachary Turnera7dffb12018-07-28 22:10:42 +0000962 assert(MangledName.startsWith("?$"));
963 MangledName.consumeFront("?$");
964
Zachary Turnerd346cba2018-08-08 17:17:04 +0000965 BackrefContext OuterContext;
966 std::swap(OuterContext, Backrefs);
Zachary Turner54d4ffe2018-08-01 18:32:28 +0000967
Zachary Turner03312862018-08-27 03:48:03 +0000968 IdentifierNode *Identifier =
969 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
Zachary Turnerd346cba2018-08-08 17:17:04 +0000970 if (!Error)
Zachary Turner03312862018-08-27 03:48:03 +0000971 Identifier->TemplateParams = demangleTemplateParameterList(MangledName);
Zachary Turnerd346cba2018-08-08 17:17:04 +0000972
973 std::swap(OuterContext, Backrefs);
Zachary Turner54d4ffe2018-08-01 18:32:28 +0000974 if (Error)
975 return nullptr;
Zachary Turner71c91f92018-07-30 03:12:34 +0000976
Nico Weber64041d72019-04-15 16:42:44 +0000977 if (NBB & NBB_Template) {
978 // NBB_Template is only set for types and non-leaf names ("a::" in "a::b").
Nico Weberc035c242019-04-16 14:10:34 +0000979 // Structors and conversion operators only makes sense in a leaf name, so
980 // reject them in NBB_Template contexts.
981 if (Identifier->kind() == NodeKind::ConversionOperatorIdentifier ||
982 Identifier->kind() == NodeKind::StructorIdentifier) {
Nico Weber64041d72019-04-15 16:42:44 +0000983 Error = true;
984 return nullptr;
985 }
986
Zachary Turnerb2fef1a2018-08-29 04:12:44 +0000987 memorizeIdentifier(Identifier);
Nico Weber64041d72019-04-15 16:42:44 +0000988 }
Zachary Turner71c91f92018-07-30 03:12:34 +0000989
Zachary Turner03312862018-08-27 03:48:03 +0000990 return Identifier;
Zachary Turnera7dffb12018-07-28 22:10:42 +0000991}
992
Zachary Turner03312862018-08-27 03:48:03 +0000993NamedIdentifierNode *Demangler::demangleSimpleName(StringView &MangledName,
994 bool Memorize) {
Zachary Turner931e8792018-07-30 23:02:10 +0000995 StringView S = demangleSimpleString(MangledName, Memorize);
996 if (Error)
997 return nullptr;
998
Zachary Turner03312862018-08-27 03:48:03 +0000999 NamedIdentifierNode *Name = Arena.alloc<NamedIdentifierNode>();
1000 Name->Name = S;
1001 return Name;
Zachary Turner931e8792018-07-30 23:02:10 +00001002}
1003
// True when C is one of the sixteen "rebased" hex digits 'A'..'P'.
static bool isRebasedHexDigit(char C) { return !(C < 'A' || C > 'P'); }

// Maps a rebased hex digit to its value: 'A' is 0, ..., 'P' is 15.
static uint8_t rebasedHexDigitToNumber(char C) {
  assert(isRebasedHexDigit(C));
  if (C > 'J')
    return 10 + C - 'K';
  return C - 'A';
}
1010
1011uint8_t Demangler::demangleCharLiteral(StringView &MangledName) {
Nico Webera0ac65c2019-04-18 19:52:32 +00001012 assert(!MangledName.empty());
Zachary Turner970fdc32018-08-16 16:17:36 +00001013 if (!MangledName.startsWith('?'))
1014 return MangledName.popFront();
1015
1016 MangledName = MangledName.dropFront();
1017 if (MangledName.empty())
1018 goto CharLiteralError;
1019
1020 if (MangledName.consumeFront('$')) {
1021 // Two hex digits
1022 if (MangledName.size() < 2)
1023 goto CharLiteralError;
1024 StringView Nibbles = MangledName.substr(0, 2);
1025 if (!isRebasedHexDigit(Nibbles[0]) || !isRebasedHexDigit(Nibbles[1]))
1026 goto CharLiteralError;
1027 // Don't append the null terminator.
1028 uint8_t C1 = rebasedHexDigitToNumber(Nibbles[0]);
1029 uint8_t C2 = rebasedHexDigitToNumber(Nibbles[1]);
1030 MangledName = MangledName.dropFront(2);
1031 return (C1 << 4) | C2;
1032 }
1033
1034 if (startsWithDigit(MangledName)) {
1035 const char *Lookup = ",/\\:. \n\t'-";
1036 char C = Lookup[MangledName[0] - '0'];
1037 MangledName = MangledName.dropFront();
1038 return C;
1039 }
1040
1041 if (MangledName[0] >= 'a' && MangledName[0] <= 'z') {
1042 char Lookup[26] = {'\xE1', '\xE2', '\xE3', '\xE4', '\xE5', '\xE6', '\xE7',
1043 '\xE8', '\xE9', '\xEA', '\xEB', '\xEC', '\xED', '\xEE',
1044 '\xEF', '\xF0', '\xF1', '\xF2', '\xF3', '\xF4', '\xF5',
1045 '\xF6', '\xF7', '\xF8', '\xF9', '\xFA'};
1046 char C = Lookup[MangledName[0] - 'a'];
1047 MangledName = MangledName.dropFront();
1048 return C;
1049 }
1050
1051 if (MangledName[0] >= 'A' && MangledName[0] <= 'Z') {
1052 char Lookup[26] = {'\xC1', '\xC2', '\xC3', '\xC4', '\xC5', '\xC6', '\xC7',
1053 '\xC8', '\xC9', '\xCA', '\xCB', '\xCC', '\xCD', '\xCE',
1054 '\xCF', '\xD0', '\xD1', '\xD2', '\xD3', '\xD4', '\xD5',
1055 '\xD6', '\xD7', '\xD8', '\xD9', '\xDA'};
1056 char C = Lookup[MangledName[0] - 'A'];
1057 MangledName = MangledName.dropFront();
1058 return C;
1059 }
1060
1061CharLiteralError:
1062 Error = true;
1063 return '\0';
1064}
1065
1066wchar_t Demangler::demangleWcharLiteral(StringView &MangledName) {
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001067 uint8_t C1, C2;
1068
1069 C1 = demangleCharLiteral(MangledName);
Nico Weberf5c7f3a2019-04-22 15:05:18 +00001070 if (Error || MangledName.empty())
Zachary Turner970fdc32018-08-16 16:17:36 +00001071 goto WCharLiteralError;
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001072 C2 = demangleCharLiteral(MangledName);
Zachary Turner970fdc32018-08-16 16:17:36 +00001073 if (Error)
1074 goto WCharLiteralError;
1075
1076 return ((wchar_t)C1 << 8) | (wchar_t)C2;
1077
1078WCharLiteralError:
1079 Error = true;
1080 return L'\0';
1081}
1082
// Stores the uppercase hexadecimal character for Digit (0..15) into *Buffer.
static void writeHexDigit(char *Buffer, uint8_t Digit) {
  assert(Digit <= 15);
  if (Digit < 10)
    *Buffer = '0' + Digit;
  else
    *Buffer = 'A' + Digit - 10;
}
1087
1088static void outputHex(OutputStream &OS, unsigned C) {
1089 if (C == 0) {
1090 OS << "\\x00";
1091 return;
1092 }
1093 // It's easier to do the math if we can work from right to left, but we need
1094 // to print the numbers from left to right. So render this into a temporary
1095 // buffer first, then output the temporary buffer. Each byte is of the form
1096 // \xAB, which means that each byte needs 4 characters. Since there are at
1097 // most 4 bytes, we need a 4*4+1 = 17 character temporary buffer.
1098 char TempBuffer[17];
1099
1100 ::memset(TempBuffer, 0, sizeof(TempBuffer));
Nico Weber8fc99022019-04-21 16:58:25 +00001101 constexpr int MaxPos = sizeof(TempBuffer) - 1;
Zachary Turner970fdc32018-08-16 16:17:36 +00001102
Nico Weber8fc99022019-04-21 16:58:25 +00001103 int Pos = MaxPos - 1; // TempBuffer[MaxPos] is the terminating \0.
Zachary Turner970fdc32018-08-16 16:17:36 +00001104 while (C != 0) {
1105 for (int I = 0; I < 2; ++I) {
1106 writeHexDigit(&TempBuffer[Pos--], C % 16);
1107 C /= 16;
1108 }
Zachary Turner970fdc32018-08-16 16:17:36 +00001109 }
Nico Weberce67a412019-04-21 17:19:27 +00001110 TempBuffer[Pos--] = 'x';
1111 assert(Pos >= 0);
1112 TempBuffer[Pos--] = '\\';
Zachary Turner970fdc32018-08-16 16:17:36 +00001113 OS << StringView(&TempBuffer[Pos + 1]);
1114}
1115
1116static void outputEscapedChar(OutputStream &OS, unsigned C) {
1117 switch (C) {
Nico Weber8eeaf512019-04-20 23:59:06 +00001118 case '\0': // nul
1119 OS << "\\0";
1120 return;
Zachary Turner970fdc32018-08-16 16:17:36 +00001121 case '\'': // single quote
1122 OS << "\\\'";
1123 return;
1124 case '\"': // double quote
1125 OS << "\\\"";
1126 return;
1127 case '\\': // backslash
1128 OS << "\\\\";
1129 return;
1130 case '\a': // bell
1131 OS << "\\a";
1132 return;
1133 case '\b': // backspace
1134 OS << "\\b";
1135 return;
1136 case '\f': // form feed
1137 OS << "\\f";
1138 return;
1139 case '\n': // new line
1140 OS << "\\n";
1141 return;
1142 case '\r': // carriage return
1143 OS << "\\r";
1144 return;
1145 case '\t': // tab
1146 OS << "\\t";
1147 return;
1148 case '\v': // vertical tab
1149 OS << "\\v";
1150 return;
1151 default:
1152 break;
1153 }
1154
1155 if (C > 0x1F && C < 0x7F) {
1156 // Standard ascii char.
1157 OS << (char)C;
1158 return;
1159 }
1160
1161 outputHex(OS, C);
1162}
1163
// Counts the zero bytes at the end of StringBytes[0, Length). Returns 0 for an
// empty range.
static unsigned countTrailingNullBytes(const uint8_t *StringBytes, int Length) {
  unsigned Count = 0;
  // Index from the back instead of keeping an end pointer, so that no pointer
  // before the start of the buffer is ever formed (Length may be 0).
  while (Length > 0 && StringBytes[Length - 1] == 0) {
    --Length;
    ++Count;
  }
  return Count;
}
1174
// Counts every zero byte in StringBytes[0, Length), wherever it occurs.
static unsigned countEmbeddedNulls(const uint8_t *StringBytes,
                                   unsigned Length) {
  unsigned Nulls = 0;
  const uint8_t *const End = StringBytes + Length;
  for (const uint8_t *Cursor = StringBytes; Cursor != End; ++Cursor)
    Nulls += (*Cursor == 0) ? 1u : 0u;
  return Nulls;
}
1184
Nico Weber8d05eb82019-04-24 16:09:38 +00001185// A mangled (non-wide) string literal stores the total length of the string it
1186// refers to (passed in NumBytes), and it contains up to 32 bytes of actual text
1187// (passed in StringBytes, NumChars).
Benjamin Kramerc55e9972018-10-13 22:18:22 +00001188static unsigned guessCharByteSize(const uint8_t *StringBytes, unsigned NumChars,
Nico Weber8d05eb82019-04-24 16:09:38 +00001189 uint64_t NumBytes) {
Zachary Turner970fdc32018-08-16 16:17:36 +00001190 assert(NumBytes > 0);
1191
1192 // If the number of bytes is odd, this is guaranteed to be a char string.
1193 if (NumBytes % 2 == 1)
1194 return 1;
1195
1196 // All strings can encode at most 32 bytes of data. If it's less than that,
1197 // then we encoded the entire string. In this case we check for a 1-byte,
1198 // 2-byte, or 4-byte null terminator.
1199 if (NumBytes < 32) {
1200 unsigned TrailingNulls = countTrailingNullBytes(StringBytes, NumChars);
Nico Weber8eeaf512019-04-20 23:59:06 +00001201 if (TrailingNulls >= 4 && NumBytes % 4 == 0)
Zachary Turner970fdc32018-08-16 16:17:36 +00001202 return 4;
1203 if (TrailingNulls >= 2)
1204 return 2;
1205 return 1;
1206 }
1207
1208 // The whole string was not able to be encoded. Try to look at embedded null
1209 // terminators to guess. The heuristic is that we count all embedded null
1210 // terminators. If more than 2/3 are null, it's a char32. If more than 1/3
1211 // are null, it's a char16. Otherwise it's a char8. This obviously isn't
1212 // perfect and is biased towards languages that have ascii alphabets, but this
1213 // was always going to be best effort since the encoding is lossy.
1214 unsigned Nulls = countEmbeddedNulls(StringBytes, NumChars);
Nico Weber8eeaf512019-04-20 23:59:06 +00001215 if (Nulls >= 2 * NumChars / 3 && NumBytes % 4 == 0)
Zachary Turner970fdc32018-08-16 16:17:36 +00001216 return 4;
1217 if (Nulls >= NumChars / 3)
1218 return 2;
1219 return 1;
1220}
1221
// Assembles the CharIndex-th character of width CharBytes (1, 2 or 4) from
// StringBytes. The bytes of a character are combined least significant first.
static unsigned decodeMultiByteChar(const uint8_t *StringBytes,
                                    unsigned CharIndex, unsigned CharBytes) {
  assert(CharBytes == 1 || CharBytes == 2 || CharBytes == 4);
  const uint8_t *Cursor = StringBytes + CharIndex * CharBytes;
  unsigned Value = 0;
  for (unsigned Shift = 0; Shift != 8 * CharBytes; Shift += 8)
    Value |= static_cast<unsigned>(*Cursor++) << Shift;
  return Value;
}
1234
Zachary Turner03312862018-08-27 03:48:03 +00001235FunctionSymbolNode *Demangler::demangleVcallThunkNode(StringView &MangledName) {
1236 FunctionSymbolNode *FSN = Arena.alloc<FunctionSymbolNode>();
1237 VcallThunkIdentifierNode *VTIN = Arena.alloc<VcallThunkIdentifierNode>();
1238 FSN->Signature = Arena.alloc<ThunkSignatureNode>();
1239 FSN->Signature->FunctionClass = FC_NoParameterList;
1240
1241 FSN->Name = demangleNameScopeChain(MangledName, VTIN);
1242 if (!Error)
1243 Error = !MangledName.consumeFront("$B");
1244 if (!Error)
1245 VTIN->OffsetInVTable = demangleUnsigned(MangledName);
1246 if (!Error)
1247 Error = !MangledName.consumeFront('A');
1248 if (!Error)
1249 FSN->Signature->CallConvention = demangleCallingConvention(MangledName);
1250 return (Error) ? nullptr : FSN;
1251}
1252
1253EncodedStringLiteralNode *
1254Demangler::demangleStringLiteral(StringView &MangledName) {
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001255 // This function uses goto, so declare all variables up front.
Zachary Turner970fdc32018-08-16 16:17:36 +00001256 OutputStream OS;
1257 StringView CRC;
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001258 uint64_t StringByteSize;
1259 bool IsWcharT = false;
1260 bool IsNegative = false;
1261 size_t CrcEndPos = 0;
1262 char *ResultBuffer = nullptr;
1263
Zachary Turner03312862018-08-27 03:48:03 +00001264 EncodedStringLiteralNode *Result = Arena.alloc<EncodedStringLiteralNode>();
Zachary Turner970fdc32018-08-16 16:17:36 +00001265
Nico Webere145a542019-04-19 14:13:11 +00001266 // Must happen before the first `goto StringLiteralError`.
1267 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
1268 // FIXME: Propagate out-of-memory as an error?
1269 std::terminate();
1270
Zachary Turner970fdc32018-08-16 16:17:36 +00001271 // Prefix indicating the beginning of a string literal
Zachary Turner3461bfa2018-08-17 16:14:05 +00001272 if (!MangledName.consumeFront("@_"))
1273 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001274 if (MangledName.empty())
1275 goto StringLiteralError;
1276
1277 // Char Type (regular or wchar_t)
Zachary Turner970fdc32018-08-16 16:17:36 +00001278 switch (MangledName.popFront()) {
1279 case '1':
1280 IsWcharT = true;
Erik Pilkington5094e5e2019-01-17 20:37:51 +00001281 DEMANGLE_FALLTHROUGH;
Zachary Turner970fdc32018-08-16 16:17:36 +00001282 case '0':
1283 break;
1284 default:
1285 goto StringLiteralError;
1286 }
1287
1288 // Encoded Length
Zachary Turner970fdc32018-08-16 16:17:36 +00001289 std::tie(StringByteSize, IsNegative) = demangleNumber(MangledName);
Nico Webera0ac65c2019-04-18 19:52:32 +00001290 if (Error || IsNegative || StringByteSize < (IsWcharT ? 2 : 1))
Zachary Turner970fdc32018-08-16 16:17:36 +00001291 goto StringLiteralError;
1292
1293 // CRC 32 (always 8 characters plus a terminator)
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001294 CrcEndPos = MangledName.find('@');
Zachary Turner970fdc32018-08-16 16:17:36 +00001295 if (CrcEndPos == StringView::npos)
1296 goto StringLiteralError;
1297 CRC = MangledName.substr(0, CrcEndPos);
1298 MangledName = MangledName.dropFront(CrcEndPos + 1);
1299 if (MangledName.empty())
1300 goto StringLiteralError;
1301
Zachary Turner970fdc32018-08-16 16:17:36 +00001302 if (IsWcharT) {
Zachary Turner03312862018-08-27 03:48:03 +00001303 Result->Char = CharKind::Wchar;
Zachary Turner970fdc32018-08-16 16:17:36 +00001304 if (StringByteSize > 64)
Zachary Turner3461bfa2018-08-17 16:14:05 +00001305 Result->IsTruncated = true;
Zachary Turner970fdc32018-08-16 16:17:36 +00001306
1307 while (!MangledName.consumeFront('@')) {
Nico Webera0ac65c2019-04-18 19:52:32 +00001308 if (MangledName.size() < 2)
Nico Weber502cf4b2019-04-18 19:30:21 +00001309 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001310 wchar_t W = demangleWcharLiteral(MangledName);
Zachary Turner3461bfa2018-08-17 16:14:05 +00001311 if (StringByteSize != 2 || Result->IsTruncated)
Zachary Turner970fdc32018-08-16 16:17:36 +00001312 outputEscapedChar(OS, W);
1313 StringByteSize -= 2;
1314 if (Error)
1315 goto StringLiteralError;
1316 }
1317 } else {
Zachary Turner32a8a202018-08-29 23:56:09 +00001318 // The max byte length is actually 32, but some compilers mangled strings
1319 // incorrectly, so we have to assume it can go higher.
1320 constexpr unsigned MaxStringByteLength = 32 * 4;
Zachary Turner970fdc32018-08-16 16:17:36 +00001321 uint8_t StringBytes[MaxStringByteLength];
1322
1323 unsigned BytesDecoded = 0;
1324 while (!MangledName.consumeFront('@')) {
Nico Weberaa162682019-04-21 14:25:07 +00001325 if (MangledName.size() < 1 || BytesDecoded >= MaxStringByteLength)
Nico Weber502cf4b2019-04-18 19:30:21 +00001326 goto StringLiteralError;
Zachary Turner970fdc32018-08-16 16:17:36 +00001327 StringBytes[BytesDecoded++] = demangleCharLiteral(MangledName);
1328 }
1329
Zachary Turner32a8a202018-08-29 23:56:09 +00001330 if (StringByteSize > BytesDecoded)
1331 Result->IsTruncated = true;
1332
Zachary Turner970fdc32018-08-16 16:17:36 +00001333 unsigned CharBytes =
1334 guessCharByteSize(StringBytes, BytesDecoded, StringByteSize);
1335 assert(StringByteSize % CharBytes == 0);
1336 switch (CharBytes) {
1337 case 1:
Zachary Turner03312862018-08-27 03:48:03 +00001338 Result->Char = CharKind::Char;
Zachary Turner970fdc32018-08-16 16:17:36 +00001339 break;
1340 case 2:
Zachary Turner03312862018-08-27 03:48:03 +00001341 Result->Char = CharKind::Char16;
Zachary Turner970fdc32018-08-16 16:17:36 +00001342 break;
1343 case 4:
Zachary Turner03312862018-08-27 03:48:03 +00001344 Result->Char = CharKind::Char32;
Zachary Turner970fdc32018-08-16 16:17:36 +00001345 break;
1346 default:
Erik Pilkington5094e5e2019-01-17 20:37:51 +00001347 DEMANGLE_UNREACHABLE;
Zachary Turner970fdc32018-08-16 16:17:36 +00001348 }
1349 const unsigned NumChars = BytesDecoded / CharBytes;
1350 for (unsigned CharIndex = 0; CharIndex < NumChars; ++CharIndex) {
1351 unsigned NextChar =
1352 decodeMultiByteChar(StringBytes, CharIndex, CharBytes);
Zachary Turner3461bfa2018-08-17 16:14:05 +00001353 if (CharIndex + 1 < NumChars || Result->IsTruncated)
Zachary Turner970fdc32018-08-16 16:17:36 +00001354 outputEscapedChar(OS, NextChar);
1355 }
1356 }
1357
1358 OS << '\0';
Zachary Turnerd78fe2f2018-08-16 16:30:27 +00001359 ResultBuffer = OS.getBuffer();
Zachary Turner03312862018-08-27 03:48:03 +00001360 Result->DecodedString = copyString(ResultBuffer);
Zachary Turneraf738f72018-08-16 17:48:32 +00001361 std::free(ResultBuffer);
Zachary Turner970fdc32018-08-16 16:17:36 +00001362 return Result;
1363
1364StringLiteralError:
1365 Error = true;
Nico Webere145a542019-04-19 14:13:11 +00001366 std::free(OS.getBuffer());
Zachary Turner970fdc32018-08-16 16:17:36 +00001367 return nullptr;
1368}
1369
Nico Weberc7444dd2019-04-03 23:15:56 +00001370// Returns MangledName's prefix before the first '@', or an error if
1371// MangledName contains no '@' or the prefix has length 0.
Zachary Turner931e8792018-07-30 23:02:10 +00001372StringView Demangler::demangleSimpleString(StringView &MangledName,
1373 bool Memorize) {
1374 StringView S;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001375 for (size_t i = 0; i < MangledName.size(); ++i) {
1376 if (MangledName[i] != '@')
1377 continue;
Nico Weberc7444dd2019-04-03 23:15:56 +00001378 if (i == 0)
1379 break;
Zachary Turner931e8792018-07-30 23:02:10 +00001380 S = MangledName.substr(0, i);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001381 MangledName = MangledName.dropFront(i + 1);
1382
1383 if (Memorize)
Zachary Turner931e8792018-07-30 23:02:10 +00001384 memorizeString(S);
1385 return S;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001386 }
1387
1388 Error = true;
Zachary Turner931e8792018-07-30 23:02:10 +00001389 return {};
Zachary Turnera7dffb12018-07-28 22:10:42 +00001390}
1391
Zachary Turner03312862018-08-27 03:48:03 +00001392NamedIdentifierNode *
1393Demangler::demangleAnonymousNamespaceName(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001394 assert(MangledName.startsWith("?A"));
1395 MangledName.consumeFront("?A");
1396
Zachary Turner03312862018-08-27 03:48:03 +00001397 NamedIdentifierNode *Node = Arena.alloc<NamedIdentifierNode>();
1398 Node->Name = "`anonymous namespace'";
Zachary Turner91c98a82018-08-20 23:58:35 +00001399 size_t EndPos = MangledName.find('@');
1400 if (EndPos == StringView::npos) {
1401 Error = true;
1402 return nullptr;
1403 }
Zachary Turner0002dd42018-08-20 23:58:58 +00001404 StringView NamespaceKey = MangledName.substr(0, EndPos);
1405 memorizeString(NamespaceKey);
Zachary Turner91c98a82018-08-20 23:58:35 +00001406 MangledName = MangledName.substr(EndPos + 1);
1407 return Node;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001408}
1409
Zachary Turner03312862018-08-27 03:48:03 +00001410NamedIdentifierNode *
1411Demangler::demangleLocallyScopedNamePiece(StringView &MangledName) {
Zachary Turner71c91f92018-07-30 03:12:34 +00001412 assert(startsWithLocalScopePattern(MangledName));
1413
Zachary Turner03312862018-08-27 03:48:03 +00001414 NamedIdentifierNode *Identifier = Arena.alloc<NamedIdentifierNode>();
Zachary Turner71c91f92018-07-30 03:12:34 +00001415 MangledName.consumeFront('?');
Nico Weberc5615c22019-04-03 23:29:05 +00001416 uint64_t Number = 0;
1417 bool IsNegative = false;
1418 std::tie(Number, IsNegative) = demangleNumber(MangledName);
1419 assert(!IsNegative);
Zachary Turner71c91f92018-07-30 03:12:34 +00001420
1421 // One ? to terminate the number
1422 MangledName.consumeFront('?');
1423
1424 assert(!Error);
Zachary Turner03312862018-08-27 03:48:03 +00001425 Node *Scope = parse(MangledName);
Zachary Turner71c91f92018-07-30 03:12:34 +00001426 if (Error)
1427 return nullptr;
1428
1429 // Render the parent symbol's name into a buffer.
Nico Weber1359d652018-09-15 18:24:20 +00001430 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +00001431 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00001432 // FIXME: Propagate out-of-memory as an error?
1433 std::terminate();
Zachary Turner71c91f92018-07-30 03:12:34 +00001434 OS << '`';
Zachary Turner38d2edd2018-08-29 03:59:17 +00001435 Scope->output(OS, OF_Default);
Zachary Turner71c91f92018-07-30 03:12:34 +00001436 OS << '\'';
Nico Weberc5615c22019-04-03 23:29:05 +00001437 OS << "::`" << Number << "'";
Zachary Turner71c91f92018-07-30 03:12:34 +00001438 OS << '\0';
1439 char *Result = OS.getBuffer();
Zachary Turner03312862018-08-27 03:48:03 +00001440 Identifier->Name = copyString(Result);
Zachary Turner71c91f92018-07-30 03:12:34 +00001441 std::free(Result);
Zachary Turner03312862018-08-27 03:48:03 +00001442 return Identifier;
Zachary Turner71c91f92018-07-30 03:12:34 +00001443}
1444
Zachary Turnera7dffb12018-07-28 22:10:42 +00001445// Parses a type name in the form of A@B@C@@ which represents C::B::A.
Zachary Turner03312862018-08-27 03:48:03 +00001446QualifiedNameNode *
1447Demangler::demangleFullyQualifiedTypeName(StringView &MangledName) {
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001448 IdentifierNode *Identifier =
1449 demangleUnqualifiedTypeName(MangledName, /*Memorize=*/true);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001450 if (Error)
1451 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001452 assert(Identifier);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001453
Zachary Turner03312862018-08-27 03:48:03 +00001454 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001455 if (Error)
1456 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001457 assert(QN);
1458 return QN;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001459}
1460
1461// Parses a symbol name in the form of A@B@C@@ which represents C::B::A.
1462// Symbol names have slightly different rules regarding what can appear
1463// so we separate out the implementations for flexibility.
Zachary Turner03312862018-08-27 03:48:03 +00001464QualifiedNameNode *
1465Demangler::demangleFullyQualifiedSymbolName(StringView &MangledName) {
Zachary Turner58d29cf2018-08-08 00:43:31 +00001466 // This is the final component of a symbol name (i.e. the leftmost component
1467 // of a mangled name. Since the only possible template instantiation that
1468 // can appear in this context is a function template, and since those are
1469 // not saved for the purposes of name backreferences, only backref simple
1470 // names.
Zachary Turner03312862018-08-27 03:48:03 +00001471 IdentifierNode *Identifier =
1472 demangleUnqualifiedSymbolName(MangledName, NBB_Simple);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001473 if (Error)
1474 return nullptr;
Zachary Turner3461bfa2018-08-17 16:14:05 +00001475
Zachary Turner03312862018-08-27 03:48:03 +00001476 QualifiedNameNode *QN = demangleNameScopeChain(MangledName, Identifier);
Zachary Turner54d4ffe2018-08-01 18:32:28 +00001477 if (Error)
1478 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00001479
1480 if (Identifier->kind() == NodeKind::StructorIdentifier) {
Nico Webera9886f82019-04-03 23:23:32 +00001481 if (QN->Components->Count < 2) {
1482 Error = true;
1483 return nullptr;
1484 }
Zachary Turner03312862018-08-27 03:48:03 +00001485 StructorIdentifierNode *SIN =
1486 static_cast<StructorIdentifierNode *>(Identifier);
Zachary Turner03312862018-08-27 03:48:03 +00001487 Node *ClassNode = QN->Components->Nodes[QN->Components->Count - 2];
1488 SIN->Class = static_cast<IdentifierNode *>(ClassNode);
1489 }
1490 assert(QN);
1491 return QN;
Zachary Turnera7dffb12018-07-28 22:10:42 +00001492}
1493
Zachary Turner03312862018-08-27 03:48:03 +00001494IdentifierNode *Demangler::demangleUnqualifiedTypeName(StringView &MangledName,
1495 bool Memorize) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001496 // An inner-most name can be a back-reference, because a fully-qualified name
1497 // (e.g. Scope + Inner) can contain other fully qualified names inside of
1498 // them (for example template parameters), and these nested parameters can
1499 // refer to previously mangled types.
1500 if (startsWithDigit(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001501 return demangleBackRefName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001502
1503 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001504 return demangleTemplateInstantiationName(MangledName, NBB_Template);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001505
Zachary Turner44ebbc22018-08-01 18:32:47 +00001506 return demangleSimpleName(MangledName, Memorize);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001507}
1508
Zachary Turner03312862018-08-27 03:48:03 +00001509IdentifierNode *
1510Demangler::demangleUnqualifiedSymbolName(StringView &MangledName,
1511 NameBackrefBehavior NBB) {
Zachary Turner71c91f92018-07-30 03:12:34 +00001512 if (startsWithDigit(MangledName))
1513 return demangleBackRefName(MangledName);
1514 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001515 return demangleTemplateInstantiationName(MangledName, NBB);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001516 if (MangledName.startsWith('?'))
Zachary Turner03312862018-08-27 03:48:03 +00001517 return demangleFunctionIdentifierCode(MangledName);
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001518 return demangleSimpleName(MangledName, /*Memorize=*/(NBB & NBB_Simple) != 0);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001519}
1520
Zachary Turner03312862018-08-27 03:48:03 +00001521IdentifierNode *Demangler::demangleNameScopePiece(StringView &MangledName) {
Zachary Turnera7dffb12018-07-28 22:10:42 +00001522 if (startsWithDigit(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001523 return demangleBackRefName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001524
1525 if (MangledName.startsWith("?$"))
Zachary Turner58d29cf2018-08-08 00:43:31 +00001526 return demangleTemplateInstantiationName(MangledName, NBB_Template);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001527
1528 if (MangledName.startsWith("?A"))
Zachary Turner316109b2018-07-29 16:38:02 +00001529 return demangleAnonymousNamespaceName(MangledName);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001530
Zachary Turner71c91f92018-07-30 03:12:34 +00001531 if (startsWithLocalScopePattern(MangledName))
1532 return demangleLocallyScopedNamePiece(MangledName);
1533
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001534 return demangleSimpleName(MangledName, /*Memorize=*/true);
Zachary Turnera7dffb12018-07-28 22:10:42 +00001535}
1536
Zachary Turner03312862018-08-27 03:48:03 +00001537static NodeArrayNode *nodeListToNodeArray(ArenaAllocator &Arena, NodeList *Head,
1538 size_t Count) {
1539 NodeArrayNode *N = Arena.alloc<NodeArrayNode>();
1540 N->Count = Count;
1541 N->Nodes = Arena.allocArray<Node *>(Count);
1542 for (size_t I = 0; I < Count; ++I) {
1543 N->Nodes[I] = Head->N;
1544 Head = Head->Next;
1545 }
1546 return N;
1547}
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001548
Zachary Turner03312862018-08-27 03:48:03 +00001549QualifiedNameNode *
1550Demangler::demangleNameScopeChain(StringView &MangledName,
1551 IdentifierNode *UnqualifiedName) {
1552 NodeList *Head = Arena.alloc<NodeList>();
1553
1554 Head->N = UnqualifiedName;
1555
1556 size_t Count = 1;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001557 while (!MangledName.consumeFront("@")) {
Zachary Turner03312862018-08-27 03:48:03 +00001558 ++Count;
1559 NodeList *NewHead = Arena.alloc<NodeList>();
1560 NewHead->Next = Head;
1561 Head = NewHead;
1562
Zachary Turnera7dffb12018-07-28 22:10:42 +00001563 if (MangledName.empty()) {
1564 Error = true;
1565 return nullptr;
1566 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001567
1568 assert(!Error);
Zachary Turner03312862018-08-27 03:48:03 +00001569 IdentifierNode *Elem = demangleNameScopePiece(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001570 if (Error)
1571 return nullptr;
1572
Zachary Turner03312862018-08-27 03:48:03 +00001573 Head->N = Elem;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001574 }
Zachary Turner03312862018-08-27 03:48:03 +00001575
1576 QualifiedNameNode *QN = Arena.alloc<QualifiedNameNode>();
1577 QN->Components = nodeListToNodeArray(Arena, Head, Count);
1578 return QN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001579}
1580
Zachary Turner316109b2018-07-29 16:38:02 +00001581FuncClass Demangler::demangleFunctionClass(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001582 switch (MangledName.popFront()) {
Zachary Turner29ec67b2018-08-10 21:09:05 +00001583 case '9':
Zachary Turner03312862018-08-27 03:48:03 +00001584 return FuncClass(FC_ExternC | FC_NoParameterList);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001585 case 'A':
Zachary Turner03312862018-08-27 03:48:03 +00001586 return FC_Private;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001587 case 'B':
Zachary Turner03312862018-08-27 03:48:03 +00001588 return FuncClass(FC_Private | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001589 case 'C':
Zachary Turner03312862018-08-27 03:48:03 +00001590 return FuncClass(FC_Private | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001591 case 'D':
Zachary Turner03312862018-08-27 03:48:03 +00001592 return FuncClass(FC_Private | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001593 case 'E':
Zachary Turner03312862018-08-27 03:48:03 +00001594 return FuncClass(FC_Private | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001595 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00001596 return FuncClass(FC_Private | FC_Virtual);
Zachary Turner32a8a202018-08-29 23:56:09 +00001597 case 'G':
1598 return FuncClass(FC_Private | FC_StaticThisAdjust);
1599 case 'H':
1600 return FuncClass(FC_Private | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001601 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00001602 return FuncClass(FC_Protected);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001603 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001604 return FuncClass(FC_Protected | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001605 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001606 return FuncClass(FC_Protected | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001607 case 'L':
Zachary Turner03312862018-08-27 03:48:03 +00001608 return FuncClass(FC_Protected | FC_Static | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001609 case 'M':
Zachary Turner03312862018-08-27 03:48:03 +00001610 return FuncClass(FC_Protected | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001611 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001612 return FuncClass(FC_Protected | FC_Virtual | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001613 case 'O':
Zachary Turner03312862018-08-27 03:48:03 +00001614 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust);
Zachary Turner469f0762018-08-17 21:18:05 +00001615 case 'P':
Zachary Turner03312862018-08-27 03:48:03 +00001616 return FuncClass(FC_Protected | FC_Virtual | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001617 case 'Q':
Zachary Turner03312862018-08-27 03:48:03 +00001618 return FuncClass(FC_Public);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001619 case 'R':
Zachary Turner03312862018-08-27 03:48:03 +00001620 return FuncClass(FC_Public | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001621 case 'S':
Zachary Turner03312862018-08-27 03:48:03 +00001622 return FuncClass(FC_Public | FC_Static);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001623 case 'T':
Zachary Turner03312862018-08-27 03:48:03 +00001624 return FuncClass(FC_Public | FC_Static | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001625 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001626 return FuncClass(FC_Public | FC_Virtual);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001627 case 'V':
Zachary Turner03312862018-08-27 03:48:03 +00001628 return FuncClass(FC_Public | FC_Virtual | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001629 case 'W':
Zachary Turner03312862018-08-27 03:48:03 +00001630 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust);
Zachary Turner469f0762018-08-17 21:18:05 +00001631 case 'X':
Zachary Turner03312862018-08-27 03:48:03 +00001632 return FuncClass(FC_Public | FC_Virtual | FC_StaticThisAdjust | FC_Far);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001633 case 'Y':
Zachary Turner03312862018-08-27 03:48:03 +00001634 return FuncClass(FC_Global);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001635 case 'Z':
Zachary Turner03312862018-08-27 03:48:03 +00001636 return FuncClass(FC_Global | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001637 case '$': {
Zachary Turner03312862018-08-27 03:48:03 +00001638 FuncClass VFlag = FC_VirtualThisAdjust;
Zachary Turner469f0762018-08-17 21:18:05 +00001639 if (MangledName.consumeFront('R'))
Zachary Turner03312862018-08-27 03:48:03 +00001640 VFlag = FuncClass(VFlag | FC_VirtualThisAdjustEx);
Nico Weberb4f33bb2019-04-11 22:47:18 +00001641 if (MangledName.empty())
1642 break;
Zachary Turner469f0762018-08-17 21:18:05 +00001643 switch (MangledName.popFront()) {
1644 case '0':
Zachary Turner03312862018-08-27 03:48:03 +00001645 return FuncClass(FC_Private | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001646 case '1':
Zachary Turner03312862018-08-27 03:48:03 +00001647 return FuncClass(FC_Private | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001648 case '2':
Zachary Turner03312862018-08-27 03:48:03 +00001649 return FuncClass(FC_Protected | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001650 case '3':
Zachary Turner03312862018-08-27 03:48:03 +00001651 return FuncClass(FC_Protected | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001652 case '4':
Zachary Turner03312862018-08-27 03:48:03 +00001653 return FuncClass(FC_Public | FC_Virtual | VFlag);
Zachary Turner469f0762018-08-17 21:18:05 +00001654 case '5':
Zachary Turner03312862018-08-27 03:48:03 +00001655 return FuncClass(FC_Public | FC_Virtual | VFlag | FC_Far);
Zachary Turner469f0762018-08-17 21:18:05 +00001656 }
1657 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001658 }
1659
1660 Error = true;
Zachary Turner03312862018-08-27 03:48:03 +00001661 return FC_Public;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001662}
1663
Zachary Turner316109b2018-07-29 16:38:02 +00001664CallingConv Demangler::demangleCallingConvention(StringView &MangledName) {
Nico Weber63b97d22019-04-08 19:46:53 +00001665 if (MangledName.empty()) {
1666 Error = true;
1667 return CallingConv::None;
1668 }
1669
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001670 switch (MangledName.popFront()) {
1671 case 'A':
1672 case 'B':
1673 return CallingConv::Cdecl;
1674 case 'C':
1675 case 'D':
1676 return CallingConv::Pascal;
1677 case 'E':
1678 case 'F':
1679 return CallingConv::Thiscall;
1680 case 'G':
1681 case 'H':
1682 return CallingConv::Stdcall;
1683 case 'I':
1684 case 'J':
1685 return CallingConv::Fastcall;
1686 case 'M':
1687 case 'N':
1688 return CallingConv::Clrcall;
1689 case 'O':
1690 case 'P':
1691 return CallingConv::Eabi;
1692 case 'Q':
1693 return CallingConv::Vectorcall;
1694 }
1695
1696 return CallingConv::None;
Martin Storsjo0f2abd82018-07-20 18:43:42 +00001697}
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001698
Zachary Turner316109b2018-07-29 16:38:02 +00001699StorageClass Demangler::demangleVariableStorageClass(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001700 assert(std::isdigit(MangledName.front()));
1701
1702 switch (MangledName.popFront()) {
1703 case '0':
1704 return StorageClass::PrivateStatic;
1705 case '1':
1706 return StorageClass::ProtectedStatic;
1707 case '2':
1708 return StorageClass::PublicStatic;
1709 case '3':
1710 return StorageClass::Global;
1711 case '4':
1712 return StorageClass::FunctionLocalStatic;
1713 }
1714 Error = true;
1715 return StorageClass::None;
1716}
1717
Zachary Turner316109b2018-07-29 16:38:02 +00001718std::pair<Qualifiers, bool>
1719Demangler::demangleQualifiers(StringView &MangledName) {
Nico Weber63b97d22019-04-08 19:46:53 +00001720 if (MangledName.empty()) {
1721 Error = true;
1722 return std::make_pair(Q_None, false);
1723 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001724
1725 switch (MangledName.popFront()) {
Zachary Turnerd742d642018-07-26 19:56:09 +00001726 // Member qualifiers
1727 case 'Q':
1728 return std::make_pair(Q_None, true);
1729 case 'R':
1730 return std::make_pair(Q_Const, true);
1731 case 'S':
1732 return std::make_pair(Q_Volatile, true);
1733 case 'T':
1734 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), true);
1735 // Non-Member qualifiers
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001736 case 'A':
Zachary Turnerd742d642018-07-26 19:56:09 +00001737 return std::make_pair(Q_None, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001738 case 'B':
Zachary Turnerd742d642018-07-26 19:56:09 +00001739 return std::make_pair(Q_Const, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001740 case 'C':
Zachary Turnerd742d642018-07-26 19:56:09 +00001741 return std::make_pair(Q_Volatile, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001742 case 'D':
Zachary Turnerd742d642018-07-26 19:56:09 +00001743 return std::make_pair(Qualifiers(Q_Const | Q_Volatile), false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001744 }
1745 Error = true;
Zachary Turnerd742d642018-07-26 19:56:09 +00001746 return std::make_pair(Q_None, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001747}
1748
1749// <variable-type> ::= <type> <cvr-qualifiers>
1750// ::= <type> <pointee-cvr-qualifiers> # pointers, references
Zachary Turner03312862018-08-27 03:48:03 +00001751TypeNode *Demangler::demangleType(StringView &MangledName,
1752 QualifierMangleMode QMM) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001753 Qualifiers Quals = Q_None;
Zachary Turnerd742d642018-07-26 19:56:09 +00001754 bool IsMember = false;
Zachary Turnerd742d642018-07-26 19:56:09 +00001755 if (QMM == QualifierMangleMode::Mangle) {
Zachary Turner316109b2018-07-29 16:38:02 +00001756 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00001757 } else if (QMM == QualifierMangleMode::Result) {
Zachary Turnerdf4cd7c2018-08-21 21:23:49 +00001758 if (MangledName.consumeFront('?'))
Zachary Turner316109b2018-07-29 16:38:02 +00001759 std::tie(Quals, IsMember) = demangleQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001760 }
1761
Nico Weber63b97d22019-04-08 19:46:53 +00001762 if (MangledName.empty()) {
1763 Error = true;
1764 return nullptr;
1765 }
1766
Zachary Turner03312862018-08-27 03:48:03 +00001767 TypeNode *Ty = nullptr;
Zachary Turner931e8792018-07-30 23:02:10 +00001768 if (isTagType(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001769 Ty = demangleClassType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001770 else if (isPointerType(MangledName)) {
Zachary Turner8fb9a712018-12-14 18:10:13 +00001771 if (isMemberPointer(MangledName, Error))
Zachary Turner316109b2018-07-29 16:38:02 +00001772 Ty = demangleMemberPointerType(MangledName);
Zachary Turner8fb9a712018-12-14 18:10:13 +00001773 else if (!Error)
Zachary Turner316109b2018-07-29 16:38:02 +00001774 Ty = demanglePointerType(MangledName);
Zachary Turner8fb9a712018-12-14 18:10:13 +00001775 else
1776 return nullptr;
Zachary Turner931e8792018-07-30 23:02:10 +00001777 } else if (isArrayType(MangledName))
Zachary Turner316109b2018-07-29 16:38:02 +00001778 Ty = demangleArrayType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001779 else if (isFunctionType(MangledName)) {
1780 if (MangledName.consumeFront("$$A8@@"))
Zachary Turner03312862018-08-27 03:48:03 +00001781 Ty = demangleFunctionType(MangledName, true);
Zachary Turner931e8792018-07-30 23:02:10 +00001782 else {
1783 assert(MangledName.startsWith("$$A6"));
1784 MangledName.consumeFront("$$A6");
Zachary Turner03312862018-08-27 03:48:03 +00001785 Ty = demangleFunctionType(MangledName, false);
Zachary Turner931e8792018-07-30 23:02:10 +00001786 }
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001787 } else if (isCustomType(MangledName)) {
1788 Ty = demangleCustomType(MangledName);
Zachary Turner931e8792018-07-30 23:02:10 +00001789 } else {
Zachary Turner03312862018-08-27 03:48:03 +00001790 Ty = demanglePrimitiveType(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001791 }
Zachary Turner931e8792018-07-30 23:02:10 +00001792
Zachary Turner2cd32862018-12-14 17:43:56 +00001793 if (!Ty || Error)
1794 return Ty;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001795 Ty->Quals = Qualifiers(Ty->Quals | Quals);
1796 return Ty;
1797}
1798
Zachary Turner2fe49002019-01-08 21:05:51 +00001799bool Demangler::demangleThrowSpecification(StringView &MangledName) {
1800 if (MangledName.consumeFront("_E"))
1801 return true;
Zachary Turner38b78a72018-07-26 20:20:10 +00001802 if (MangledName.consumeFront('Z'))
Zachary Turner2fe49002019-01-08 21:05:51 +00001803 return false;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001804
Zachary Turner38b78a72018-07-26 20:20:10 +00001805 Error = true;
Zachary Turner2fe49002019-01-08 21:05:51 +00001806 return false;
Zachary Turner38b78a72018-07-26 20:20:10 +00001807}
1808
Zachary Turner03312862018-08-27 03:48:03 +00001809FunctionSignatureNode *Demangler::demangleFunctionType(StringView &MangledName,
1810 bool HasThisQuals) {
1811 FunctionSignatureNode *FTy = Arena.alloc<FunctionSignatureNode>();
Zachary Turner38b78a72018-07-26 20:20:10 +00001812
1813 if (HasThisQuals) {
Zachary Turner316109b2018-07-29 16:38:02 +00001814 FTy->Quals = demanglePointerExtQualifiers(MangledName);
Zachary Turner03312862018-08-27 03:48:03 +00001815 FTy->RefQualifier = demangleFunctionRefQualifier(MangledName);
Zachary Turner316109b2018-07-29 16:38:02 +00001816 FTy->Quals = Qualifiers(FTy->Quals | demangleQualifiers(MangledName).first);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001817 }
1818
1819 // Fields that appear on both member and non-member functions.
Zachary Turner316109b2018-07-29 16:38:02 +00001820 FTy->CallConvention = demangleCallingConvention(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001821
1822 // <return-type> ::= <type>
1823 // ::= @ # structors (they have no declared return type)
1824 bool IsStructor = MangledName.consumeFront('@');
1825 if (!IsStructor)
Zachary Turner316109b2018-07-29 16:38:02 +00001826 FTy->ReturnType = demangleType(MangledName, QualifierMangleMode::Result);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001827
Zachary Turner316109b2018-07-29 16:38:02 +00001828 FTy->Params = demangleFunctionParameterList(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001829
Zachary Turner2fe49002019-01-08 21:05:51 +00001830 FTy->IsNoexcept = demangleThrowSpecification(MangledName);
Zachary Turner38b78a72018-07-26 20:20:10 +00001831
1832 return FTy;
1833}
1834
Zachary Turner03312862018-08-27 03:48:03 +00001835FunctionSymbolNode *
1836Demangler::demangleFunctionEncoding(StringView &MangledName) {
1837 FuncClass ExtraFlags = FC_None;
Zachary Turner469f0762018-08-17 21:18:05 +00001838 if (MangledName.consumeFront("$$J0"))
Zachary Turner03312862018-08-27 03:48:03 +00001839 ExtraFlags = FC_ExternC;
Zachary Turner469f0762018-08-17 21:18:05 +00001840
Nico Weber63b97d22019-04-08 19:46:53 +00001841 if (MangledName.empty()) {
1842 Error = true;
1843 return nullptr;
1844 }
1845
Zachary Turner316109b2018-07-29 16:38:02 +00001846 FuncClass FC = demangleFunctionClass(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001847 FC = FuncClass(ExtraFlags | FC);
1848
Zachary Turner03312862018-08-27 03:48:03 +00001849 FunctionSignatureNode *FSN = nullptr;
1850 ThunkSignatureNode *TTN = nullptr;
1851 if (FC & FC_StaticThisAdjust) {
1852 TTN = Arena.alloc<ThunkSignatureNode>();
1853 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
1854 } else if (FC & FC_VirtualThisAdjust) {
1855 TTN = Arena.alloc<ThunkSignatureNode>();
1856 if (FC & FC_VirtualThisAdjustEx) {
1857 TTN->ThisAdjust.VBPtrOffset = demangleSigned(MangledName);
1858 TTN->ThisAdjust.VBOffsetOffset = demangleSigned(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001859 }
Zachary Turner03312862018-08-27 03:48:03 +00001860 TTN->ThisAdjust.VtordispOffset = demangleSigned(MangledName);
1861 TTN->ThisAdjust.StaticOffset = demangleSigned(MangledName);
Zachary Turner469f0762018-08-17 21:18:05 +00001862 }
1863
Zachary Turner03312862018-08-27 03:48:03 +00001864 if (FC & FC_NoParameterList) {
Zachary Turner29ec67b2018-08-10 21:09:05 +00001865 // This is an extern "C" function whose full signature hasn't been mangled.
1866 // This happens when we need to mangle a local symbol inside of an extern
1867 // "C" function.
Zachary Turner03312862018-08-27 03:48:03 +00001868 FSN = Arena.alloc<FunctionSignatureNode>();
Zachary Turner29ec67b2018-08-10 21:09:05 +00001869 } else {
Zachary Turner03312862018-08-27 03:48:03 +00001870 bool HasThisQuals = !(FC & (FC_Global | FC_Static));
1871 FSN = demangleFunctionType(MangledName, HasThisQuals);
Zachary Turner29ec67b2018-08-10 21:09:05 +00001872 }
Nico Weber63b97d22019-04-08 19:46:53 +00001873
1874 if (Error)
1875 return nullptr;
1876
Zachary Turner03312862018-08-27 03:48:03 +00001877 if (TTN) {
1878 *static_cast<FunctionSignatureNode *>(TTN) = *FSN;
1879 FSN = TTN;
1880 }
1881 FSN->FunctionClass = FC;
Zachary Turner38b78a72018-07-26 20:20:10 +00001882
Zachary Turner03312862018-08-27 03:48:03 +00001883 FunctionSymbolNode *Symbol = Arena.alloc<FunctionSymbolNode>();
1884 Symbol->Signature = FSN;
1885 return Symbol;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001886}
1887
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001888CustomTypeNode *Demangler::demangleCustomType(StringView &MangledName) {
1889 assert(MangledName.startsWith('?'));
1890 MangledName.popFront();
1891
1892 CustomTypeNode *CTN = Arena.alloc<CustomTypeNode>();
Nico Weberaf2ee7d2019-04-11 23:20:18 +00001893 CTN->Identifier = demangleUnqualifiedTypeName(MangledName, /*Memorize=*/true);
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00001894 if (!MangledName.consumeFront('@'))
1895 Error = true;
1896 if (Error)
1897 return nullptr;
1898 return CTN;
1899}
1900
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001901// Reads a primitive type.
Zachary Turner03312862018-08-27 03:48:03 +00001902PrimitiveTypeNode *Demangler::demanglePrimitiveType(StringView &MangledName) {
1903 if (MangledName.consumeFront("$$T"))
1904 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Nullptr);
Zachary Turner931e8792018-07-30 23:02:10 +00001905
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001906 switch (MangledName.popFront()) {
1907 case 'X':
Zachary Turner03312862018-08-27 03:48:03 +00001908 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Void);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001909 case 'D':
Zachary Turner03312862018-08-27 03:48:03 +00001910 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001911 case 'C':
Zachary Turner03312862018-08-27 03:48:03 +00001912 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Schar);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001913 case 'E':
Zachary Turner03312862018-08-27 03:48:03 +00001914 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uchar);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001915 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00001916 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Short);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001917 case 'G':
Zachary Turner03312862018-08-27 03:48:03 +00001918 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ushort);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001919 case 'H':
Zachary Turner03312862018-08-27 03:48:03 +00001920 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001921 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00001922 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001923 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001924 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Long);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001925 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001926 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ulong);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001927 case 'M':
Zachary Turner03312862018-08-27 03:48:03 +00001928 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Float);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001929 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001930 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Double);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001931 case 'O':
Zachary Turner03312862018-08-27 03:48:03 +00001932 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Ldouble);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001933 case '_': {
Zachary Turner91ecedd2018-07-20 18:07:33 +00001934 if (MangledName.empty()) {
1935 Error = true;
1936 return nullptr;
1937 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001938 switch (MangledName.popFront()) {
1939 case 'N':
Zachary Turner03312862018-08-27 03:48:03 +00001940 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Bool);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001941 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00001942 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Int64);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001943 case 'K':
Zachary Turner03312862018-08-27 03:48:03 +00001944 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Uint64);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001945 case 'W':
Zachary Turner03312862018-08-27 03:48:03 +00001946 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Wchar);
Nico Webera2ca6e72019-05-28 15:30:04 +00001947 case 'Q':
1948 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char8);
Zachary Turner931e8792018-07-30 23:02:10 +00001949 case 'S':
Zachary Turner03312862018-08-27 03:48:03 +00001950 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char16);
Zachary Turner931e8792018-07-30 23:02:10 +00001951 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001952 return Arena.alloc<PrimitiveTypeNode>(PrimitiveKind::Char32);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001953 }
1954 break;
1955 }
1956 }
Zachary Turner03312862018-08-27 03:48:03 +00001957 Error = true;
1958 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001959}
1960
Zachary Turner03312862018-08-27 03:48:03 +00001961TagTypeNode *Demangler::demangleClassType(StringView &MangledName) {
1962 TagTypeNode *TT = nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001963
1964 switch (MangledName.popFront()) {
1965 case 'T':
Zachary Turner03312862018-08-27 03:48:03 +00001966 TT = Arena.alloc<TagTypeNode>(TagKind::Union);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001967 break;
1968 case 'U':
Zachary Turner03312862018-08-27 03:48:03 +00001969 TT = Arena.alloc<TagTypeNode>(TagKind::Struct);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001970 break;
1971 case 'V':
Zachary Turner03312862018-08-27 03:48:03 +00001972 TT = Arena.alloc<TagTypeNode>(TagKind::Class);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001973 break;
1974 case 'W':
Nico Webere5b62652019-04-11 22:59:25 +00001975 if (!MangledName.consumeFront('4')) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001976 Error = true;
1977 return nullptr;
1978 }
Zachary Turner03312862018-08-27 03:48:03 +00001979 TT = Arena.alloc<TagTypeNode>(TagKind::Enum);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001980 break;
1981 default:
1982 assert(false);
1983 }
1984
Zachary Turner03312862018-08-27 03:48:03 +00001985 TT->QualifiedName = demangleFullyQualifiedTypeName(MangledName);
1986 return TT;
Zachary Turnerd742d642018-07-26 19:56:09 +00001987}
1988
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001989// <pointer-type> ::= E? <pointer-cvr-qualifiers> <ext-qualifiers> <type>
1990// # the E is required for 64-bit non-static pointers
Zachary Turner03312862018-08-27 03:48:03 +00001991PointerTypeNode *Demangler::demanglePointerType(StringView &MangledName) {
1992 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001993
Zachary Turner931e8792018-07-30 23:02:10 +00001994 std::tie(Pointer->Quals, Pointer->Affinity) =
1995 demanglePointerCVQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001996
1997 if (MangledName.consumeFront("6")) {
Zachary Turner03312862018-08-27 03:48:03 +00001998 Pointer->Pointee = demangleFunctionType(MangledName, false);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00001999 return Pointer;
2000 }
2001
Zachary Turner316109b2018-07-29 16:38:02 +00002002 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002003 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
2004
Zachary Turner316109b2018-07-29 16:38:02 +00002005 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Mangle);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002006 return Pointer;
2007}
2008
Zachary Turner03312862018-08-27 03:48:03 +00002009PointerTypeNode *Demangler::demangleMemberPointerType(StringView &MangledName) {
2010 PointerTypeNode *Pointer = Arena.alloc<PointerTypeNode>();
Zachary Turnerd742d642018-07-26 19:56:09 +00002011
Zachary Turner03312862018-08-27 03:48:03 +00002012 std::tie(Pointer->Quals, Pointer->Affinity) =
2013 demanglePointerCVQualifiers(MangledName);
2014 assert(Pointer->Affinity == PointerAffinity::Pointer);
Zachary Turnerd742d642018-07-26 19:56:09 +00002015
Zachary Turner316109b2018-07-29 16:38:02 +00002016 Qualifiers ExtQuals = demanglePointerExtQualifiers(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00002017 Pointer->Quals = Qualifiers(Pointer->Quals | ExtQuals);
2018
Nico Weber63b97d22019-04-08 19:46:53 +00002019 // isMemberPointer() only returns true if there is at least one character
2020 // after the qualifiers.
Zachary Turner38b78a72018-07-26 20:20:10 +00002021 if (MangledName.consumeFront("8")) {
Zachary Turner32a8a202018-08-29 23:56:09 +00002022 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
Zachary Turner03312862018-08-27 03:48:03 +00002023 Pointer->Pointee = demangleFunctionType(MangledName, true);
Zachary Turner38b78a72018-07-26 20:20:10 +00002024 } else {
2025 Qualifiers PointeeQuals = Q_None;
2026 bool IsMember = false;
Zachary Turner316109b2018-07-29 16:38:02 +00002027 std::tie(PointeeQuals, IsMember) = demangleQualifiers(MangledName);
Nico Weber63b97d22019-04-08 19:46:53 +00002028 assert(IsMember || Error);
Zachary Turner32a8a202018-08-29 23:56:09 +00002029 Pointer->ClassParent = demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerd742d642018-07-26 19:56:09 +00002030
Zachary Turner316109b2018-07-29 16:38:02 +00002031 Pointer->Pointee = demangleType(MangledName, QualifierMangleMode::Drop);
Nico Weber63b97d22019-04-08 19:46:53 +00002032 if (Pointer->Pointee)
2033 Pointer->Pointee->Quals = PointeeQuals;
Zachary Turner38b78a72018-07-26 20:20:10 +00002034 }
2035
Zachary Turnerd742d642018-07-26 19:56:09 +00002036 return Pointer;
2037}
2038
Zachary Turner316109b2018-07-29 16:38:02 +00002039Qualifiers Demangler::demanglePointerExtQualifiers(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002040 Qualifiers Quals = Q_None;
2041 if (MangledName.consumeFront('E'))
2042 Quals = Qualifiers(Quals | Q_Pointer64);
2043 if (MangledName.consumeFront('I'))
2044 Quals = Qualifiers(Quals | Q_Restrict);
2045 if (MangledName.consumeFront('F'))
2046 Quals = Qualifiers(Quals | Q_Unaligned);
2047
2048 return Quals;
2049}
2050
Zachary Turner03312862018-08-27 03:48:03 +00002051ArrayTypeNode *Demangler::demangleArrayType(StringView &MangledName) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002052 assert(MangledName.front() == 'Y');
2053 MangledName.popFront();
2054
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002055 uint64_t Rank = 0;
2056 bool IsNegative = false;
2057 std::tie(Rank, IsNegative) = demangleNumber(MangledName);
2058 if (IsNegative || Rank == 0) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002059 Error = true;
2060 return nullptr;
2061 }
2062
Zachary Turner03312862018-08-27 03:48:03 +00002063 ArrayTypeNode *ATy = Arena.alloc<ArrayTypeNode>();
2064 NodeList *Head = Arena.alloc<NodeList>();
2065 NodeList *Tail = Head;
2066
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002067 for (uint64_t I = 0; I < Rank; ++I) {
Zachary Turner03312862018-08-27 03:48:03 +00002068 uint64_t D = 0;
2069 std::tie(D, IsNegative) = demangleNumber(MangledName);
Nico Weber16725812019-04-03 23:27:18 +00002070 if (Error || IsNegative) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002071 Error = true;
2072 return nullptr;
2073 }
Zachary Turner03312862018-08-27 03:48:03 +00002074 Tail->N = Arena.alloc<IntegerLiteralNode>(D, IsNegative);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002075 if (I + 1 < Rank) {
Zachary Turner03312862018-08-27 03:48:03 +00002076 Tail->Next = Arena.alloc<NodeList>();
2077 Tail = Tail->Next;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002078 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002079 }
Zachary Turner03312862018-08-27 03:48:03 +00002080 ATy->Dimensions = nodeListToNodeArray(Arena, Head, Rank);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002081
2082 if (MangledName.consumeFront("$$C")) {
Zachary Turner2bbb23b2018-08-14 18:54:28 +00002083 bool IsMember = false;
2084 std::tie(ATy->Quals, IsMember) = demangleQualifiers(MangledName);
2085 if (IsMember) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002086 Error = true;
Zachary Turner2bbb23b2018-08-14 18:54:28 +00002087 return nullptr;
2088 }
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002089 }
2090
Zachary Turner316109b2018-07-29 16:38:02 +00002091 ATy->ElementType = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002092 return ATy;
2093}
2094
2095// Reads a function or a template parameters.
Zachary Turner03312862018-08-27 03:48:03 +00002096NodeArrayNode *
Zachary Turnerd30700f2018-07-31 17:16:44 +00002097Demangler::demangleFunctionParameterList(StringView &MangledName) {
Zachary Turner38b78a72018-07-26 20:20:10 +00002098 // Empty parameter list.
Zachary Turner38b78a72018-07-26 20:20:10 +00002099 if (MangledName.consumeFront('X'))
Nico Weber930994c2019-04-16 14:24:42 +00002100 return nullptr;
Zachary Turner38b78a72018-07-26 20:20:10 +00002101
Zachary Turner03312862018-08-27 03:48:03 +00002102 NodeList *Head = Arena.alloc<NodeList>();
2103 NodeList **Current = &Head;
2104 size_t Count = 0;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002105 while (!Error && !MangledName.startsWith('@') &&
2106 !MangledName.startsWith('Z')) {
Zachary Turner03312862018-08-27 03:48:03 +00002107 ++Count;
Zachary Turner23df1312018-07-26 22:13:39 +00002108
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002109 if (startsWithDigit(MangledName)) {
Zachary Turner30375de2018-07-26 22:24:01 +00002110 size_t N = MangledName[0] - '0';
Zachary Turnerd346cba2018-08-08 17:17:04 +00002111 if (N >= Backrefs.FunctionParamCount) {
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002112 Error = true;
Nico Weber930994c2019-04-16 14:24:42 +00002113 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002114 }
2115 MangledName = MangledName.dropFront();
2116
Zachary Turner03312862018-08-27 03:48:03 +00002117 *Current = Arena.alloc<NodeList>();
2118 (*Current)->N = Backrefs.FunctionParams[N];
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002119 Current = &(*Current)->Next;
2120 continue;
2121 }
2122
Zachary Turner23df1312018-07-26 22:13:39 +00002123 size_t OldSize = MangledName.size();
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002124
Zachary Turner03312862018-08-27 03:48:03 +00002125 *Current = Arena.alloc<NodeList>();
2126 TypeNode *TN = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turner8fb9a712018-12-14 18:10:13 +00002127 if (!TN || Error)
2128 return nullptr;
Zachary Turner03312862018-08-27 03:48:03 +00002129
2130 (*Current)->N = TN;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002131
Zachary Turner23df1312018-07-26 22:13:39 +00002132 size_t CharsConsumed = OldSize - MangledName.size();
2133 assert(CharsConsumed != 0);
2134
2135 // Single-letter types are ignored for backreferences because memorizing
2136 // them doesn't save anything.
Zachary Turnerd346cba2018-08-08 17:17:04 +00002137 if (Backrefs.FunctionParamCount <= 9 && CharsConsumed > 1)
Zachary Turner03312862018-08-27 03:48:03 +00002138 Backrefs.FunctionParams[Backrefs.FunctionParamCount++] = TN;
Zachary Turner23df1312018-07-26 22:13:39 +00002139
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002140 Current = &(*Current)->Next;
2141 }
2142
Zachary Turner38b78a72018-07-26 20:20:10 +00002143 if (Error)
Nico Weber930994c2019-04-16 14:24:42 +00002144 return nullptr;
Zachary Turner38b78a72018-07-26 20:20:10 +00002145
Zachary Turner03312862018-08-27 03:48:03 +00002146 NodeArrayNode *NA = nodeListToNodeArray(Arena, Head, Count);
Zachary Turner38b78a72018-07-26 20:20:10 +00002147 // A non-empty parameter list is terminated by either 'Z' (variadic) parameter
2148 // list or '@' (non variadic). Careful not to consume "@Z", as in that case
2149 // the following Z could be a throw specifier.
2150 if (MangledName.consumeFront('@'))
Zachary Turner03312862018-08-27 03:48:03 +00002151 return NA;
Zachary Turner38b78a72018-07-26 20:20:10 +00002152
2153 if (MangledName.consumeFront('Z')) {
Zachary Turner03312862018-08-27 03:48:03 +00002154 // This is a variadic parameter list. We probably need a variadic node to
2155 // append to the end.
2156 return NA;
Zachary Turner38b78a72018-07-26 20:20:10 +00002157 }
2158
2159 Error = true;
Nico Weber930994c2019-04-16 14:24:42 +00002160 return nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002161}
2162
Zachary Turner03312862018-08-27 03:48:03 +00002163NodeArrayNode *
Zachary Turnerd30700f2018-07-31 17:16:44 +00002164Demangler::demangleTemplateParameterList(StringView &MangledName) {
Zachary Turner03312862018-08-27 03:48:03 +00002165 NodeList *Head;
2166 NodeList **Current = &Head;
2167 size_t Count = 0;
2168
Zachary Turner23df1312018-07-26 22:13:39 +00002169 while (!Error && !MangledName.startsWith('@')) {
Zachary Turner32a8a202018-08-29 23:56:09 +00002170 if (MangledName.consumeFront("$S") || MangledName.consumeFront("$$V") ||
Zachary Turner78ab3cb2018-08-30 20:53:29 +00002171 MangledName.consumeFront("$$$V") || MangledName.consumeFront("$$Z")) {
2172 // parameter pack separator
Zachary Turner32a8a202018-08-29 23:56:09 +00002173 continue;
2174 }
2175
Zachary Turner03312862018-08-27 03:48:03 +00002176 ++Count;
Zachary Turner32a8a202018-08-29 23:56:09 +00002177
Zachary Turner23df1312018-07-26 22:13:39 +00002178 // Template parameter lists don't participate in back-referencing.
Zachary Turner03312862018-08-27 03:48:03 +00002179 *Current = Arena.alloc<NodeList>();
Zachary Turner931e8792018-07-30 23:02:10 +00002180
Zachary Turner03312862018-08-27 03:48:03 +00002181 NodeList &TP = **Current;
Zachary Turner66555a72018-08-20 19:15:35 +00002182
Zachary Turner03312862018-08-27 03:48:03 +00002183 TemplateParameterReferenceNode *TPRN = nullptr;
Zachary Turner32a8a202018-08-29 23:56:09 +00002184 if (MangledName.consumeFront("$$Y")) {
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002185 // Template alias
Zachary Turner03312862018-08-27 03:48:03 +00002186 TP.N = demangleFullyQualifiedTypeName(MangledName);
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002187 } else if (MangledName.consumeFront("$$B")) {
2188 // Array
Zachary Turner03312862018-08-27 03:48:03 +00002189 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turner073620b2018-08-10 19:57:36 +00002190 } else if (MangledName.consumeFront("$$C")) {
2191 // Type has qualifiers.
Zachary Turner03312862018-08-27 03:48:03 +00002192 TP.N = demangleType(MangledName, QualifierMangleMode::Mangle);
Zachary Turner66555a72018-08-20 19:15:35 +00002193 } else if (MangledName.startsWith("$1") || MangledName.startsWith("$H") ||
2194 MangledName.startsWith("$I") || MangledName.startsWith("$J")) {
Zachary Turner03312862018-08-27 03:48:03 +00002195 // Pointer to member
2196 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2197 TPRN->IsMemberPointer = true;
2198
Zachary Turner66555a72018-08-20 19:15:35 +00002199 MangledName = MangledName.dropFront();
2200 // 1 - single inheritance <name>
2201 // H - multiple inheritance <name> <number>
2202 // I - virtual inheritance <name> <number> <number> <number>
2203 // J - unspecified inheritance <name> <number> <number> <number>
2204 char InheritanceSpecifier = MangledName.popFront();
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00002205 SymbolNode *S = nullptr;
2206 if (MangledName.startsWith('?')) {
2207 S = parse(MangledName);
Nico Weber09fb2022019-05-22 15:53:23 +00002208 if (Error || !S->Name) {
2209 Error = true;
Nico Weberf2d8f092019-04-11 22:23:35 +00002210 return nullptr;
Nico Weber09fb2022019-05-22 15:53:23 +00002211 }
Zachary Turnerb2fef1a2018-08-29 04:12:44 +00002212 memorizeIdentifier(S->Name->getUnqualifiedIdentifier());
2213 }
2214
Zachary Turner66555a72018-08-20 19:15:35 +00002215 switch (InheritanceSpecifier) {
2216 case 'J':
Zachary Turner03312862018-08-27 03:48:03 +00002217 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2218 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002219 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002220 case 'I':
Zachary Turner03312862018-08-27 03:48:03 +00002221 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2222 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002223 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002224 case 'H':
Zachary Turner03312862018-08-27 03:48:03 +00002225 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2226 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002227 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002228 case '1':
2229 break;
2230 default:
2231 Error = true;
2232 break;
2233 }
Zachary Turner03312862018-08-27 03:48:03 +00002234 TPRN->Affinity = PointerAffinity::Pointer;
2235 TPRN->Symbol = S;
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002236 } else if (MangledName.startsWith("$E?")) {
2237 MangledName.consumeFront("$E");
2238 // Reference to symbol
Zachary Turner03312862018-08-27 03:48:03 +00002239 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2240 TPRN->Symbol = parse(MangledName);
2241 TPRN->Affinity = PointerAffinity::Reference;
Zachary Turner66555a72018-08-20 19:15:35 +00002242 } else if (MangledName.startsWith("$F") || MangledName.startsWith("$G")) {
Zachary Turner03312862018-08-27 03:48:03 +00002243 TP.N = TPRN = Arena.alloc<TemplateParameterReferenceNode>();
2244
Zachary Turner66555a72018-08-20 19:15:35 +00002245 // Data member pointer.
2246 MangledName = MangledName.dropFront();
2247 char InheritanceSpecifier = MangledName.popFront();
2248
2249 switch (InheritanceSpecifier) {
2250 case 'G':
Zachary Turner03312862018-08-27 03:48:03 +00002251 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2252 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002253 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002254 case 'F':
Zachary Turner03312862018-08-27 03:48:03 +00002255 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2256 demangleSigned(MangledName);
2257 TPRN->ThunkOffsets[TPRN->ThunkOffsetCount++] =
2258 demangleSigned(MangledName);
Erik Pilkington5094e5e2019-01-17 20:37:51 +00002259 DEMANGLE_FALLTHROUGH;
Zachary Turner66555a72018-08-20 19:15:35 +00002260 case '0':
2261 break;
2262 default:
2263 Error = true;
2264 break;
2265 }
Zachary Turner03312862018-08-27 03:48:03 +00002266 TPRN->IsMemberPointer = true;
Zachary Turner66555a72018-08-20 19:15:35 +00002267
Zachary Turnerdbefc6c2018-08-10 14:31:04 +00002268 } else if (MangledName.consumeFront("$0")) {
2269 // Integral non-type template parameter
2270 bool IsNegative = false;
2271 uint64_t Value = 0;
2272 std::tie(Value, IsNegative) = demangleNumber(MangledName);
2273
Zachary Turner03312862018-08-27 03:48:03 +00002274 TP.N = Arena.alloc<IntegerLiteralNode>(Value, IsNegative);
Zachary Turnerd30700f2018-07-31 17:16:44 +00002275 } else {
Zachary Turner03312862018-08-27 03:48:03 +00002276 TP.N = demangleType(MangledName, QualifierMangleMode::Drop);
Zachary Turnerd30700f2018-07-31 17:16:44 +00002277 }
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002278 if (Error)
2279 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002280
Zachary Turner66555a72018-08-20 19:15:35 +00002281 Current = &TP.Next;
Zachary Turner23df1312018-07-26 22:13:39 +00002282 }
2283
2284 if (Error)
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002285 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002286
2287 // Template parameter lists cannot be variadic, so it can only be terminated
2288 // by @.
2289 if (MangledName.consumeFront('@'))
Zachary Turner03312862018-08-27 03:48:03 +00002290 return nodeListToNodeArray(Arena, Head, Count);
Zachary Turner23df1312018-07-26 22:13:39 +00002291 Error = true;
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002292 return nullptr;
Zachary Turner23df1312018-07-26 22:13:39 +00002293}
2294
Zachary Turner3a758e22018-08-01 18:33:04 +00002295void Demangler::dumpBackReferences() {
Zachary Turner5ae08b82018-08-01 18:44:12 +00002296 std::printf("%d function parameter backreferences\n",
Zachary Turnerd346cba2018-08-08 17:17:04 +00002297 (int)Backrefs.FunctionParamCount);
Zachary Turner3a758e22018-08-01 18:33:04 +00002298
2299 // Create an output stream so we can render each type.
Nico Weber1359d652018-09-15 18:24:20 +00002300 OutputStream OS;
Nico Weber6808bc02018-11-11 10:04:00 +00002301 if (!initializeOutputStream(nullptr, nullptr, OS, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00002302 std::terminate();
Zachary Turnerd346cba2018-08-08 17:17:04 +00002303 for (size_t I = 0; I < Backrefs.FunctionParamCount; ++I) {
Zachary Turner3a758e22018-08-01 18:33:04 +00002304 OS.setCurrentPosition(0);
2305
Zachary Turner03312862018-08-27 03:48:03 +00002306 TypeNode *T = Backrefs.FunctionParams[I];
Zachary Turner38d2edd2018-08-29 03:59:17 +00002307 T->output(OS, OF_Default);
Zachary Turner3a758e22018-08-01 18:33:04 +00002308
Zachary Turner7563ebe2018-08-02 17:08:24 +00002309 std::printf(" [%d] - %.*s\n", (int)I, (int)OS.getCurrentPosition(),
Zachary Turner5ae08b82018-08-01 18:44:12 +00002310 OS.getBuffer());
Zachary Turner3a758e22018-08-01 18:33:04 +00002311 }
2312 std::free(OS.getBuffer());
2313
Zachary Turnerd346cba2018-08-08 17:17:04 +00002314 if (Backrefs.FunctionParamCount > 0)
Zachary Turner5ae08b82018-08-01 18:44:12 +00002315 std::printf("\n");
Zachary Turnerd346cba2018-08-08 17:17:04 +00002316 std::printf("%d name backreferences\n", (int)Backrefs.NamesCount);
2317 for (size_t I = 0; I < Backrefs.NamesCount; ++I) {
Zachary Turner03312862018-08-27 03:48:03 +00002318 std::printf(" [%d] - %.*s\n", (int)I, (int)Backrefs.Names[I]->Name.size(),
2319 Backrefs.Names[I]->Name.begin());
Zachary Turner3a758e22018-08-01 18:33:04 +00002320 }
Zachary Turnerd346cba2018-08-08 17:17:04 +00002321 if (Backrefs.NamesCount > 0)
Zachary Turner5ae08b82018-08-01 18:44:12 +00002322 std::printf("\n");
Zachary Turner3a758e22018-08-01 18:33:04 +00002323}
2324
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002325char *llvm::microsoftDemangle(const char *MangledName, char *Buf, size_t *N,
Zachary Turner3a758e22018-08-01 18:33:04 +00002326 int *Status, MSDemangleFlags Flags) {
Nico Weber1359d652018-09-15 18:24:20 +00002327 int InternalStatus = demangle_success;
Zachary Turner316109b2018-07-29 16:38:02 +00002328 Demangler D;
Nico Weber1359d652018-09-15 18:24:20 +00002329 OutputStream S;
2330
Zachary Turner316109b2018-07-29 16:38:02 +00002331 StringView Name{MangledName};
Nico Weber1359d652018-09-15 18:24:20 +00002332 SymbolNode *AST = D.parse(Name);
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002333
Zachary Turner3a758e22018-08-01 18:33:04 +00002334 if (Flags & MSDF_DumpBackrefs)
2335 D.dumpBackReferences();
Nico Weber1359d652018-09-15 18:24:20 +00002336
2337 if (D.Error)
2338 InternalStatus = demangle_invalid_mangled_name;
Nico Weber6808bc02018-11-11 10:04:00 +00002339 else if (!initializeOutputStream(Buf, N, S, 1024))
Nico Weber1359d652018-09-15 18:24:20 +00002340 InternalStatus = demangle_memory_alloc_failure;
2341 else {
2342 AST->output(S, OF_Default);
2343 S += '\0';
2344 if (N != nullptr)
2345 *N = S.getCurrentPosition();
2346 Buf = S.getBuffer();
Zachary Turner54d4ffe2018-08-01 18:32:28 +00002347 }
2348
Nico Weber1359d652018-09-15 18:24:20 +00002349 if (Status)
2350 *Status = InternalStatus;
2351 return InternalStatus == demangle_success ? Buf : nullptr;
Zachary Turnerf435a7e2018-07-20 17:27:48 +00002352}