| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 1 | //===- Strings.cpp -------------------------------------------------------===// |
| 2 | // |
| 3 | // The LLVM Linker |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | |
| 10 | #include "Strings.h" |
| 11 | #include "Error.h" |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 12 | #include "llvm/ADT/ArrayRef.h" |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 13 | #include "llvm/ADT/StringRef.h" |
| 14 | #include "llvm/ADT/Twine.h" |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 15 | #include "llvm/Config/config.h" |
| Rafael Espindola | d194213 | 2016-09-06 19:17:14 +0000 | [diff] [blame] | 16 | #include "llvm/Demangle/Demangle.h" |
| Rui Ueyama | fbbde54 | 2016-06-29 09:08:02 +0000 | [diff] [blame] | 17 | #include <algorithm> |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 18 | |
| 19 | using namespace llvm; |
| 20 | using namespace lld; |
| 21 | using namespace lld::elf; |
| 22 | |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 23 | bool elf::hasWildcard(StringRef S) { |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 24 | return S.find_first_of("?*[") != StringRef::npos; |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 25 | } |
| 26 | |
| George Rimar | cd574a5 | 2016-09-09 14:35:36 +0000 | [diff] [blame^] | 27 | StringRef elf::unquote(StringRef S) { |
| 28 | if (!S.startswith("\"")) |
| 29 | return S; |
| 30 | return S.substr(1, S.size() - 2); |
| 31 | } |
| 32 | |
| Rui Ueyama | dad2b88 | 2016-09-02 22:15:08 +0000 | [diff] [blame] | 33 | // Converts a glob pattern to a regular expression. |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 34 | static std::string toRegex(StringRef S) { |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 35 | std::string T; |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 36 | bool InBracket = false; |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 37 | while (!S.empty()) { |
| 38 | char C = S.front(); |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 39 | if (InBracket) { |
| 40 | InBracket = C != ']'; |
| 41 | T += C; |
| 42 | S = S.drop_front(); |
| 43 | continue; |
| 44 | } |
| 45 | |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 46 | if (C == '*') |
| 47 | T += ".*"; |
| 48 | else if (C == '?') |
| 49 | T += '.'; |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 50 | else if (StringRef(".+^${}()|/\\").find_first_of(C) != StringRef::npos) |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 51 | T += std::string("\\") + C; |
| 52 | else |
| 53 | T += C; |
| George Rimar | 51da9c7 | 2016-09-07 10:19:44 +0000 | [diff] [blame] | 54 | |
| 55 | InBracket = C == '['; |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 56 | S = S.substr(1); |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 57 | } |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 58 | return T; |
| 59 | } |
| 60 | |
| Rui Ueyama | dad2b88 | 2016-09-02 22:15:08 +0000 | [diff] [blame] | 61 | // Converts multiple glob patterns to a regular expression. |
| George Rimar | c91930a | 2016-09-02 21:17:20 +0000 | [diff] [blame] | 62 | Regex elf::compileGlobPatterns(ArrayRef<StringRef> V) { |
| 63 | std::string T = "^(" + toRegex(V[0]); |
| 64 | for (StringRef S : V.slice(1)) |
| 65 | T += "|" + toRegex(S); |
| 66 | return Regex(T + ")$"); |
| Rui Ueyama | 93c9af4 | 2016-06-29 08:01:32 +0000 | [diff] [blame] | 67 | } |
| 68 | |
| 69 | // Converts a hex string (e.g. "deadbeef") to a vector. |
| 70 | std::vector<uint8_t> elf::parseHex(StringRef S) { |
| 71 | std::vector<uint8_t> Hex; |
| 72 | while (!S.empty()) { |
| 73 | StringRef B = S.substr(0, 2); |
| 74 | S = S.substr(2); |
| 75 | uint8_t H; |
| 76 | if (B.getAsInteger(16, H)) { |
| 77 | error("not a hexadecimal value: " + B); |
| 78 | return {}; |
| 79 | } |
| 80 | Hex.push_back(H); |
| 81 | } |
| 82 | return Hex; |
| 83 | } |
| Rui Ueyama | fbbde54 | 2016-06-29 09:08:02 +0000 | [diff] [blame] | 84 | |
// Returns true if C is an ASCII letter or an underscore.
static bool isAlpha(char C) {
  if (C == '_')
    return true;
  const bool IsLower = 'a' <= C && C <= 'z';
  const bool IsUpper = 'A' <= C && C <= 'Z';
  return IsLower || IsUpper;
}
| 88 | |
| 89 | static bool isAlnum(char C) { return isAlpha(C) || ('0' <= C && C <= '9'); } |
| 90 | |
| 91 | // Returns true if S is valid as a C language identifier. |
| 92 | bool elf::isValidCIdentifier(StringRef S) { |
| 93 | return !S.empty() && isAlpha(S[0]) && |
| 94 | std::all_of(S.begin() + 1, S.end(), isAlnum); |
| 95 | } |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 96 | |
| 97 | // Returns the demangled C++ symbol name for Name. |
| 98 | std::string elf::demangle(StringRef Name) { |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 99 | // __cxa_demangle can be used to demangle strings other than symbol |
| 100 | // names which do not necessarily start with "_Z". Name can be |
| 101 | // either a C or C++ symbol. Don't call __cxa_demangle if the name |
| 102 | // does not look like a C++ symbol name to avoid getting unexpected |
| 103 | // result for a C symbol that happens to match a mangled type name. |
| 104 | if (!Name.startswith("_Z")) |
| 105 | return Name; |
| 106 | |
| Rafael Espindola | d194213 | 2016-09-06 19:17:14 +0000 | [diff] [blame] | 107 | char *Buf = itaniumDemangle(Name.str().c_str(), nullptr, nullptr, nullptr); |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 108 | if (!Buf) |
| 109 | return Name; |
| 110 | std::string S(Buf); |
| 111 | free(Buf); |
| 112 | return S; |
| Rui Ueyama | f4d9338 | 2016-07-07 23:04:15 +0000 | [diff] [blame] | 113 | } |