Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 1 | //===----------------- ItaniumManglingCanonicalizer.cpp -------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is dual licensed under the MIT and the University of Illinois Open |
| 6 | // Source Licenses. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
| 10 | #include "llvm/Support/ItaniumManglingCanonicalizer.h" |
| 11 | |
| 12 | #include "llvm/ADT/FoldingSet.h" |
| 13 | #include "llvm/ADT/StringRef.h" |
| 14 | #include "llvm/Demangle/ItaniumDemangle.h" |
| 15 | #include "llvm/Support/Allocator.h" |
| 16 | |
| 17 | #include "llvm/ADT/DenseMap.h" |
| 18 | #include "llvm/ADT/FoldingSet.h" |
| 19 | #include "llvm/ADT/StringRef.h" |
| 20 | |
| 21 | using namespace llvm; |
| 22 | using llvm::itanium_demangle::ForwardTemplateReference; |
| 23 | using llvm::itanium_demangle::Node; |
| 24 | using llvm::itanium_demangle::NodeKind; |
| 25 | |
| 26 | namespace { |
| 27 | struct FoldingSetNodeIDBuilder { |
| 28 | llvm::FoldingSetNodeID &ID; |
| 29 | void operator()(const Node *P) { ID.AddPointer(P); } |
| 30 | void operator()(StringView Str) { |
| 31 | ID.AddString(llvm::StringRef(Str.begin(), Str.size())); |
| 32 | } |
| 33 | template<typename T> |
| 34 | typename std::enable_if<std::is_integral<T>::value || |
| 35 | std::is_enum<T>::value>::type |
| 36 | operator()(T V) { |
| 37 | ID.AddInteger((unsigned long long)V); |
| 38 | } |
| 39 | void operator()(itanium_demangle::NodeOrString NS) { |
| 40 | if (NS.isNode()) { |
| 41 | ID.AddInteger(0); |
| 42 | (*this)(NS.asNode()); |
| 43 | } else if (NS.isString()) { |
| 44 | ID.AddInteger(1); |
| 45 | (*this)(NS.asString()); |
| 46 | } else { |
| 47 | ID.AddInteger(2); |
| 48 | } |
| 49 | } |
| 50 | void operator()(itanium_demangle::NodeArray A) { |
| 51 | ID.AddInteger(A.size()); |
| 52 | for (const Node *N : A) |
| 53 | (*this)(N); |
| 54 | } |
| 55 | }; |
| 56 | |
| 57 | template<typename ...T> |
| 58 | void profileCtor(llvm::FoldingSetNodeID &ID, Node::Kind K, T ...V) { |
| 59 | FoldingSetNodeIDBuilder Builder = {ID}; |
| 60 | Builder(K); |
| 61 | int VisitInOrder[] = { |
| 62 | (Builder(V), 0) ..., |
| 63 | 0 // Avoid empty array if there are no arguments. |
| 64 | }; |
| 65 | (void)VisitInOrder; |
| 66 | } |
| 67 | |
| 68 | // FIXME: Convert this to a generic lambda when possible. |
| 69 | template<typename NodeT> struct ProfileSpecificNode { |
| 70 | FoldingSetNodeID &ID; |
| 71 | template<typename ...T> void operator()(T ...V) { |
| 72 | profileCtor(ID, NodeKind<NodeT>::Kind, V...); |
| 73 | } |
| 74 | }; |
| 75 | |
| 76 | struct ProfileNode { |
| 77 | FoldingSetNodeID &ID; |
| 78 | template<typename NodeT> void operator()(const NodeT *N) { |
| 79 | N->match(ProfileSpecificNode<NodeT>{ID}); |
| 80 | } |
| 81 | }; |
| 82 | |
| 83 | template<> void ProfileNode::operator()(const ForwardTemplateReference *N) { |
| 84 | llvm_unreachable("should never canonicalize a ForwardTemplateReference"); |
Simon Pilgrim | 9894733 | 2018-08-25 16:49:35 +0000 | [diff] [blame] | 85 | } |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 86 | |
| 87 | void profileNode(llvm::FoldingSetNodeID &ID, const Node *N) { |
| 88 | N->visit(ProfileNode{ID}); |
| 89 | } |
| 90 | |
| 91 | class FoldingNodeAllocator { |
| 92 | class alignas(alignof(Node *)) NodeHeader : public llvm::FoldingSetNode { |
| 93 | public: |
| 94 | // 'Node' in this context names the injected-class-name of the base class. |
| 95 | itanium_demangle::Node *getNode() { |
| 96 | return reinterpret_cast<itanium_demangle::Node *>(this + 1); |
| 97 | } |
| 98 | void Profile(llvm::FoldingSetNodeID &ID) { profileNode(ID, getNode()); } |
| 99 | }; |
| 100 | |
| 101 | BumpPtrAllocator RawAlloc; |
| 102 | llvm::FoldingSet<NodeHeader> Nodes; |
| 103 | |
| 104 | public: |
| 105 | void reset() {} |
| 106 | |
Chandler Carruth | d38d950 | 2018-08-26 09:17:49 +0000 | [diff] [blame^] | 107 | template <typename T, typename... Args> |
| 108 | std::pair<Node *, bool> getOrCreateNode(bool CreateNewNodes, Args &&... As) { |
| 109 | // FIXME: Don't canonicalize forward template references for now, because |
| 110 | // they contain state (the resolved template node) that's not known at their |
| 111 | // point of creation. |
| 112 | if (std::is_same<T, ForwardTemplateReference>::value) { |
| 113 | // Note that we don't use if-constexpr here and so we must still write |
| 114 | // this code in a generic form. |
| 115 | return {new (RawAlloc.Allocate(sizeof(T), alignof(T))) |
| 116 | T(std::forward<Args>(As)...), |
| 117 | true}; |
| 118 | } |
| 119 | |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 120 | llvm::FoldingSetNodeID ID; |
| 121 | profileCtor(ID, NodeKind<T>::Kind, As...); |
| 122 | |
| 123 | void *InsertPos; |
| 124 | if (NodeHeader *Existing = Nodes.FindNodeOrInsertPos(ID, InsertPos)) |
| 125 | return {static_cast<T*>(Existing->getNode()), false}; |
| 126 | |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 127 | if (!CreateNewNodes) |
| 128 | return {nullptr, true}; |
| 129 | |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 130 | static_assert(alignof(T) <= alignof(NodeHeader), |
| 131 | "underaligned node header for specific node kind"); |
| 132 | void *Storage = |
| 133 | RawAlloc.Allocate(sizeof(NodeHeader) + sizeof(T), alignof(NodeHeader)); |
| 134 | NodeHeader *New = new (Storage) NodeHeader; |
| 135 | T *Result = new (New->getNode()) T(std::forward<Args>(As)...); |
| 136 | Nodes.InsertNode(New, InsertPos); |
| 137 | return {Result, true}; |
| 138 | } |
| 139 | |
| 140 | template<typename T, typename... Args> |
| 141 | Node *makeNode(Args &&...As) { |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 142 | return getOrCreateNode<T>(true, std::forward<Args>(As)...).first; |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 143 | } |
| 144 | |
| 145 | void *allocateNodeArray(size_t sz) { |
| 146 | return RawAlloc.Allocate(sizeof(Node *) * sz, alignof(Node *)); |
| 147 | } |
| 148 | }; |
| 149 | |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 150 | class CanonicalizerAllocator : public FoldingNodeAllocator { |
| 151 | Node *MostRecentlyCreated = nullptr; |
| 152 | Node *TrackedNode = nullptr; |
| 153 | bool TrackedNodeIsUsed = false; |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 154 | bool CreateNewNodes = true; |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 155 | llvm::SmallDenseMap<Node*, Node*, 32> Remappings; |
| 156 | |
| 157 | template<typename T, typename ...Args> Node *makeNodeSimple(Args &&...As) { |
| 158 | std::pair<Node *, bool> Result = |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 159 | getOrCreateNode<T>(CreateNewNodes, std::forward<Args>(As)...); |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 160 | if (Result.second) { |
| 161 | // Node is new. Make a note of that. |
| 162 | MostRecentlyCreated = Result.first; |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 163 | } else if (Result.first) { |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 164 | // Node is pre-existing; check if it's in our remapping table. |
| 165 | if (auto *N = Remappings.lookup(Result.first)) { |
| 166 | Result.first = N; |
| 167 | assert(Remappings.find(Result.first) == Remappings.end() && |
| 168 | "should never need multiple remap steps"); |
| 169 | } |
| 170 | if (Result.first == TrackedNode) |
| 171 | TrackedNodeIsUsed = true; |
| 172 | } |
| 173 | return Result.first; |
| 174 | } |
| 175 | |
| 176 | /// Helper to allow makeNode to be partially-specialized on T. |
| 177 | template<typename T> struct MakeNodeImpl { |
| 178 | CanonicalizerAllocator &Self; |
| 179 | template<typename ...Args> Node *make(Args &&...As) { |
| 180 | return Self.makeNodeSimple<T>(std::forward<Args>(As)...); |
| 181 | } |
| 182 | }; |
| 183 | |
| 184 | public: |
| 185 | template<typename T, typename ...Args> Node *makeNode(Args &&...As) { |
| 186 | return MakeNodeImpl<T>{*this}.make(std::forward<Args>(As)...); |
| 187 | } |
| 188 | |
| 189 | void reset() { MostRecentlyCreated = nullptr; } |
| 190 | |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 191 | void setCreateNewNodes(bool CNN) { CreateNewNodes = CNN; } |
| 192 | |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 193 | void addRemapping(Node *A, Node *B) { |
| 194 | // Note, we don't need to check whether B is also remapped, because if it |
| 195 | // was we would have already remapped it when building it. |
| 196 | Remappings.insert(std::make_pair(A, B)); |
| 197 | } |
| 198 | |
| 199 | bool isMostRecentlyCreated(Node *N) const { return MostRecentlyCreated == N; } |
| 200 | |
| 201 | void trackUsesOf(Node *N) { |
| 202 | TrackedNode = N; |
| 203 | TrackedNodeIsUsed = false; |
| 204 | } |
| 205 | bool trackedNodeIsUsed() const { return TrackedNodeIsUsed; } |
| 206 | }; |
| 207 | |
| 208 | /// Convert St3foo to NSt3fooE so that equivalences naming one also affect the |
| 209 | /// other. |
| 210 | template<> |
| 211 | struct CanonicalizerAllocator::MakeNodeImpl< |
| 212 | itanium_demangle::StdQualifiedName> { |
| 213 | CanonicalizerAllocator &Self; |
| 214 | Node *make(Node *Child) { |
| 215 | Node *StdNamespace = Self.makeNode<itanium_demangle::NameType>("std"); |
| 216 | if (!StdNamespace) |
| 217 | return nullptr; |
| 218 | return Self.makeNode<itanium_demangle::NestedName>(StdNamespace, Child); |
| 219 | } |
| 220 | }; |
| 221 | |
| 222 | // FIXME: Also expand built-in substitutions? |
| 223 | |
| 224 | using CanonicalizingDemangler = itanium_demangle::Db<CanonicalizerAllocator>; |
| 225 | } |
| 226 | |
| 227 | struct ItaniumManglingCanonicalizer::Impl { |
| 228 | CanonicalizingDemangler Demangler = {nullptr, nullptr}; |
| 229 | }; |
| 230 | |
| 231 | ItaniumManglingCanonicalizer::ItaniumManglingCanonicalizer() : P(new Impl) {} |
| 232 | ItaniumManglingCanonicalizer::~ItaniumManglingCanonicalizer() { delete P; } |
| 233 | |
| 234 | ItaniumManglingCanonicalizer::EquivalenceError |
| 235 | ItaniumManglingCanonicalizer::addEquivalence(FragmentKind Kind, StringRef First, |
| 236 | StringRef Second) { |
| 237 | auto &Alloc = P->Demangler.ASTAllocator; |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 238 | Alloc.setCreateNewNodes(true); |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 239 | |
| 240 | auto Parse = [&](StringRef Str) { |
| 241 | P->Demangler.reset(Str.begin(), Str.end()); |
| 242 | Node *N = nullptr; |
| 243 | switch (Kind) { |
| 244 | // A <name>, with minor extensions to allow arbitrary namespace and |
| 245 | // template names that can't easily be written as <name>s. |
| 246 | case FragmentKind::Name: |
| 247 | // Very special case: allow "St" as a shorthand for "3std". It's not |
| 248 | // valid as a <name> mangling, but is nonetheless the most natural |
| 249 | // way to name the 'std' namespace. |
| 250 | if (Str.size() == 2 && P->Demangler.consumeIf("St")) |
| 251 | N = P->Demangler.make<itanium_demangle::NameType>("std"); |
| 252 | // We permit substitutions to name templates without their template |
| 253 | // arguments. This mostly just falls out, as almost all template names |
| 254 | // are valid as <name>s, but we also want to parse <substitution>s as |
| 255 | // <name>s, even though they're not. |
| 256 | else if (Str.startswith("S")) |
| 257 | // Parse the substitution and optional following template arguments. |
| 258 | N = P->Demangler.parseType(); |
| 259 | else |
| 260 | N = P->Demangler.parseName(); |
| 261 | break; |
| 262 | |
| 263 | // A <type>. |
| 264 | case FragmentKind::Type: |
| 265 | N = P->Demangler.parseType(); |
| 266 | break; |
| 267 | |
| 268 | // An <encoding>. |
| 269 | case FragmentKind::Encoding: |
| 270 | N = P->Demangler.parseEncoding(); |
| 271 | break; |
| 272 | } |
| 273 | |
| 274 | // If we have trailing junk, the mangling is invalid. |
| 275 | if (P->Demangler.numLeft() != 0) |
| 276 | N = nullptr; |
| 277 | |
| 278 | // If any node was created after N, then we cannot safely remap it because |
| 279 | // it might already be in use by another node. |
| 280 | return std::make_pair(N, Alloc.isMostRecentlyCreated(N)); |
| 281 | }; |
| 282 | |
| 283 | Node *FirstNode, *SecondNode; |
| 284 | bool FirstIsNew, SecondIsNew; |
| 285 | |
| 286 | std::tie(FirstNode, FirstIsNew) = Parse(First); |
| 287 | if (!FirstNode) |
| 288 | return EquivalenceError::InvalidFirstMangling; |
| 289 | |
| 290 | Alloc.trackUsesOf(FirstNode); |
| 291 | std::tie(SecondNode, SecondIsNew) = Parse(Second); |
| 292 | if (!SecondNode) |
| 293 | return EquivalenceError::InvalidSecondMangling; |
| 294 | |
| 295 | // If they're already equivalent, there's nothing to do. |
| 296 | if (FirstNode == SecondNode) |
| 297 | return EquivalenceError::Success; |
| 298 | |
| 299 | if (FirstIsNew && !Alloc.trackedNodeIsUsed()) |
| 300 | Alloc.addRemapping(FirstNode, SecondNode); |
| 301 | else if (SecondIsNew) |
| 302 | Alloc.addRemapping(SecondNode, FirstNode); |
| 303 | else |
| 304 | return EquivalenceError::ManglingAlreadyUsed; |
| 305 | |
| 306 | return EquivalenceError::Success; |
| 307 | } |
| 308 | |
| 309 | ItaniumManglingCanonicalizer::Key |
| 310 | ItaniumManglingCanonicalizer::canonicalize(StringRef Mangling) { |
Richard Smith | 9c2e4f3 | 2018-08-24 23:26:05 +0000 | [diff] [blame] | 311 | P->Demangler.ASTAllocator.setCreateNewNodes(true); |
| 312 | P->Demangler.reset(Mangling.begin(), Mangling.end()); |
| 313 | return reinterpret_cast<Key>(P->Demangler.parse()); |
| 314 | } |
| 315 | |
| 316 | ItaniumManglingCanonicalizer::Key |
| 317 | ItaniumManglingCanonicalizer::lookup(StringRef Mangling) { |
| 318 | P->Demangler.ASTAllocator.setCreateNewNodes(false); |
Richard Smith | 2ae8468 | 2018-08-24 22:31:51 +0000 | [diff] [blame] | 319 | P->Demangler.reset(Mangling.begin(), Mangling.end()); |
| 320 | return reinterpret_cast<Key>(P->Demangler.parse()); |
| 321 | } |