| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 1 | //===- Strings.cpp -------------------------------------------------------===// |
| 2 | // |
| 3 | // The LLVM Linker |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
| 10 | #include "Strings.h" |
| 11 | #include "Error.h" |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 12 | #include "llvm/ADT/ArrayRef.h" |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 13 | #include "llvm/ADT/StringRef.h" |
| 14 | #include "llvm/ADT/Twine.h" |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 15 | #include "llvm/Config/config.h" |
| Rafael Espindola | d194213 | 2016-09-06 19:17:14 +0000 | [diff] [blame] | 16 | #include "llvm/Demangle/Demangle.h" |
| Rui Ueyama | fbbde54 | 2016-06-29 09:08:02 +0000 | [diff] [blame] | 17 | #include <algorithm> |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 18 | |
| 19 | using namespace llvm; |
| 20 | using namespace lld; |
| 21 | using namespace lld::elf; |
| 22 | |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 23 | bool elf::hasWildcard(StringRef S) { |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 24 | return S.find_first_of("?*[") != StringRef::npos; |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 25 | } |
| 26 | |
| Rui Ueyama | dad2b88 | 2016-09-02 22:15:08 +0000 | [diff] [blame] | 27 | // Converts a glob pattern to a regular expression. |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 28 | static std::string toRegex(StringRef S) { |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 29 | std::string T; |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 30 | bool InBracket = false; |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 31 | while (!S.empty()) { |
| 32 | char C = S.front(); |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 33 | if (InBracket) { |
| 34 | InBracket = C != ']'; |
| 35 | T += C; |
| 36 | S = S.drop_front(); |
| 37 | continue; |
| 38 | } |
| 39 | |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 40 | if (C == '*') |
| 41 | T += ".*"; |
| 42 | else if (C == '?') |
| 43 | T += '.'; |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 44 | else if (StringRef(".+^${}()|/\\").find_first_of(C) != StringRef::npos) |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 45 | T += std::string("\\") + C; |
| 46 | else |
| 47 | T += C; |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 48 | |
| 49 | InBracket = C == '['; |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 50 | S = S.substr(1); |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 51 | } |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 52 | return T; |
| 53 | } |
| 54 | |
| Rui Ueyama | dad2b88 | 2016-09-02 22:15:08 +0000 | [diff] [blame] | 55 | // Converts multiple glob patterns to a regular expression. |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 56 | Regex elf::compileGlobPatterns(ArrayRef<StringRef> V) { |
| 57 | std::string T = "^(" + toRegex(V[0]); |
| 58 | for (StringRef S : V.slice(1)) |
| 59 | T += "|" + toRegex(S); |
| 60 | return Regex(T + ")$"); |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 61 | } |
| 62 | |
| 63 | // Converts a hex string (e.g. "deadbeef") to a vector. |
| 64 | std::vector<uint8_t> elf::parseHex(StringRef S) { |
| 65 | std::vector<uint8_t> Hex; |
| 66 | while (!S.empty()) { |
| 67 | StringRef B = S.substr(0, 2); |
| 68 | S = S.substr(2); |
| 69 | uint8_t H; |
| 70 | if (B.getAsInteger(16, H)) { |
| 71 | error("not a hexadecimal value: " + B); |
| 72 | return {}; |
| 73 | } |
| 74 | Hex.push_back(H); |
| 75 | } |
| 76 | return Hex; |
| 77 | } |
| Rui Ueyama | fbbde54 | 2016-06-29 09:08:02 +0000 | [diff] [blame] | 78 | |
// Returns true if C is an ASCII letter or an underscore, i.e. a character
// that may begin a C identifier.
static bool isAlpha(char C) {
  if (C == '_')
    return true;
  const bool IsLower = 'a' <= C && C <= 'z';
  const bool IsUpper = 'A' <= C && C <= 'Z';
  return IsLower || IsUpper;
}
| 82 | |
| 83 | static bool isAlnum(char C) { return isAlpha(C) || ('0' <= C && C <= '9'); } |
| 84 | |
| 85 | // Returns true if S is valid as a C language identifier. |
| 86 | bool elf::isValidCIdentifier(StringRef S) { |
| 87 | return !S.empty() && isAlpha(S[0]) && |
| 88 | std::all_of(S.begin() + 1, S.end(), isAlnum); |
| 89 | } |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 90 | |
| 91 | // Returns the demangled C++ symbol name for Name. |
| 92 | std::string elf::demangle(StringRef Name) { |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 93 | // __cxa_demangle can be used to demangle strings other than symbol |
| 94 | // names which do not necessarily start with "_Z". Name can be |
| 95 | // either a C or C++ symbol. Don't call __cxa_demangle if the name |
| 96 | // does not look like a C++ symbol name to avoid getting unexpected |
| 97 | // result for a C symbol that happens to match a mangled type name. |
| 98 | if (!Name.startswith("_Z")) |
| 99 | return Name; |
| 100 | |
| Rafael Espindola | d194213 | 2016-09-06 19:17:14 +0000 | [diff] [blame] | 101 | char *Buf = itaniumDemangle(Name.str().c_str(), nullptr, nullptr, nullptr); |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 102 | if (!Buf) |
| 103 | return Name; |
| 104 | std::string S(Buf); |
| 105 | free(Buf); |
| 106 | return S; |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 107 | } |