Chris Lattner | 1587e6d | 2007-12-17 08:22:46 +0000 | [diff] [blame] | 1 | //===--- HeaderMap.cpp - A file that acts like dir of symlinks ------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
Chris Lattner | 5b12ab8 | 2007-12-29 19:59:25 +0000 | [diff] [blame] | 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
Chris Lattner | 1587e6d | 2007-12-17 08:22:46 +0000 | [diff] [blame] | 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // |
| 10 | // This file implements the HeaderMap interface. |
| 11 | // |
| 12 | //===----------------------------------------------------------------------===// |
| 13 | |
| 14 | #include "clang/Lex/HeaderMap.h" |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 15 | #include "clang/Lex/HeaderMapTypes.h" |
Jordan Rose | 4938f27 | 2013-02-09 10:09:43 +0000 | [diff] [blame] | 16 | #include "clang/Basic/CharInfo.h" |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 17 | #include "clang/Basic/FileManager.h" |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 18 | #include "llvm/ADT/SmallString.h" |
Michael J. Spencer | 8aaf499 | 2010-11-29 18:12:39 +0000 | [diff] [blame] | 19 | #include "llvm/Support/DataTypes.h" |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 20 | #include "llvm/Support/MathExtras.h" |
| 21 | #include "llvm/Support/MemoryBuffer.h" |
Duncan P. N. Exon Smith | dfe8530 | 2016-02-20 21:00:58 +0000 | [diff] [blame] | 22 | #include "llvm/Support/SwapByteOrder.h" |
Chris Lattner | c25d8a7 | 2009-03-02 22:20:04 +0000 | [diff] [blame] | 23 | #include <cstdio> |
Ahmed Charles | dfca6f9 | 2014-03-09 11:36:40 +0000 | [diff] [blame] | 24 | #include <memory> |
Chris Lattner | 1587e6d | 2007-12-17 08:22:46 +0000 | [diff] [blame] | 25 | using namespace clang; |
| 26 | |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 27 | /// HashHMapKey - This is the 'well known' hash function required by the file |
| 28 | /// format, used to look up keys in the hash table. The hash table uses simple |
| 29 | /// linear probing based on this function. |
Chris Lattner | 0e62c1c | 2011-07-23 10:55:15 +0000 | [diff] [blame] | 30 | static inline unsigned HashHMapKey(StringRef Str) { |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 31 | unsigned Result = 0; |
Chris Lattner | d081f8c | 2010-01-10 01:35:12 +0000 | [diff] [blame] | 32 | const char *S = Str.begin(), *End = Str.end(); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 33 | |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 34 | for (; S != End; S++) |
Jordan Rose | 4938f27 | 2013-02-09 10:09:43 +0000 | [diff] [blame] | 35 | Result += toLowercase(*S) * 13; |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 36 | return Result; |
| 37 | } |
| 38 | |
| 39 | |
| 40 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 41 | //===----------------------------------------------------------------------===// |
| 42 | // Verification and Construction |
| 43 | //===----------------------------------------------------------------------===// |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 44 | |
| 45 | /// HeaderMap::Create - This attempts to load the specified file as a header |
| 46 | /// map. If it doesn't look like a HeaderMap, it gives up and returns null. |
| 47 | /// If it looks like a HeaderMap but is obviously corrupted, it puts a reason |
| 48 | /// into the string error argument and returns null. |
Chris Lattner | 5159f61 | 2010-11-23 08:35:12 +0000 | [diff] [blame] | 49 | const HeaderMap *HeaderMap::Create(const FileEntry *FE, FileManager &FM) { |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 50 | // If the file is too small to be a header map, ignore it. |
| 51 | unsigned FileSize = FE->getSize(); |
Craig Topper | d2d442c | 2014-05-17 23:10:59 +0000 | [diff] [blame] | 52 | if (FileSize <= sizeof(HMapHeader)) return nullptr; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 53 | |
Benjamin Kramer | a885796 | 2014-10-26 22:44:13 +0000 | [diff] [blame] | 54 | auto FileBuffer = FM.getBufferForFile(FE); |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 55 | if (!FileBuffer || !*FileBuffer) |
| 56 | return nullptr; |
| 57 | bool NeedsByteSwap; |
| 58 | if (!checkHeader(**FileBuffer, NeedsByteSwap)) |
| 59 | return nullptr; |
| 60 | return new HeaderMap(std::move(*FileBuffer), NeedsByteSwap); |
| 61 | } |
| 62 | |
| 63 | bool HeaderMapImpl::checkHeader(const llvm::MemoryBuffer &File, |
| 64 | bool &NeedsByteSwap) { |
| 65 | if (File.getBufferSize() <= sizeof(HMapHeader)) |
| 66 | return false; |
| 67 | const char *FileStart = File.getBufferStart(); |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 68 | |
| 69 | // We know the file is at least as big as the header, check it now. |
| 70 | const HMapHeader *Header = reinterpret_cast<const HMapHeader*>(FileStart); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 71 | |
Chris Lattner | d39b8c0 | 2007-12-17 18:59:44 +0000 | [diff] [blame] | 72 | // Sniff it to see if it's a headermap by checking the magic number and |
| 73 | // version. |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 74 | if (Header->Magic == HMAP_HeaderMagicNumber && |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 75 | Header->Version == HMAP_HeaderVersion) |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 76 | NeedsByteSwap = false; |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 77 | else if (Header->Magic == llvm::ByteSwap_32(HMAP_HeaderMagicNumber) && |
| 78 | Header->Version == llvm::ByteSwap_16(HMAP_HeaderVersion)) |
Chris Lattner | 4ffe46c | 2007-12-17 18:34:53 +0000 | [diff] [blame] | 79 | NeedsByteSwap = true; // Mixed endianness headermap. |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 80 | else |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 81 | return false; // Not a header map. |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 82 | |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 83 | if (Header->Reserved != 0) |
| 84 | return false; |
Chris Lattner | 79764a6 | 2007-12-17 18:44:09 +0000 | [diff] [blame] | 85 | |
Duncan P. N. Exon Smith | 8d6a31c02 | 2016-02-20 21:24:31 +0000 | [diff] [blame] | 86 | // Check the number of buckets. It should be a power of two, and there |
| 87 | // should be enough space in the file for all of them. |
Duncan P. N. Exon Smith | dfe8530 | 2016-02-20 21:00:58 +0000 | [diff] [blame] | 88 | auto NumBuckets = NeedsByteSwap |
| 89 | ? llvm::sys::getSwappedBytes(Header->NumBuckets) |
| 90 | : Header->NumBuckets; |
Duncan P. N. Exon Smith | dfe8530 | 2016-02-20 21:00:58 +0000 | [diff] [blame] | 91 | if (NumBuckets & (NumBuckets - 1)) |
| 92 | return false; |
Duncan P. N. Exon Smith | 8d6a31c02 | 2016-02-20 21:24:31 +0000 | [diff] [blame] | 93 | if (File.getBufferSize() < |
| 94 | sizeof(HMapHeader) + sizeof(HMapBucket) * NumBuckets) |
| 95 | return false; |
Duncan P. N. Exon Smith | dfe8530 | 2016-02-20 21:00:58 +0000 | [diff] [blame] | 96 | |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 97 | // Okay, everything looks good. |
| 98 | return true; |
Chris Lattner | 79764a6 | 2007-12-17 18:44:09 +0000 | [diff] [blame] | 99 | } |
| 100 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 101 | //===----------------------------------------------------------------------===// |
| 102 | // Utility Methods |
| 103 | //===----------------------------------------------------------------------===// |
| 104 | |
Chris Lattner | 79764a6 | 2007-12-17 18:44:09 +0000 | [diff] [blame] | 105 | |
| 106 | /// getFileName - Return the filename of the headermap. |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 107 | const char *HeaderMapImpl::getFileName() const { |
Chris Lattner | 79764a6 | 2007-12-17 18:44:09 +0000 | [diff] [blame] | 108 | return FileBuffer->getBufferIdentifier(); |
Chris Lattner | 1587e6d | 2007-12-17 08:22:46 +0000 | [diff] [blame] | 109 | } |
| 110 | |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 111 | unsigned HeaderMapImpl::getEndianAdjustedWord(unsigned X) const { |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 112 | if (!NeedsBSwap) return X; |
| 113 | return llvm::ByteSwap_32(X); |
| 114 | } |
| 115 | |
| 116 | /// getHeader - Return a reference to the file header, in unbyte-swapped form. |
| 117 | /// This method cannot fail. |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 118 | const HMapHeader &HeaderMapImpl::getHeader() const { |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 119 | // We know the file is at least as big as the header. Return it. |
| 120 | return *reinterpret_cast<const HMapHeader*>(FileBuffer->getBufferStart()); |
| 121 | } |
| 122 | |
| 123 | /// getBucket - Return the specified hash table bucket from the header map, |
| 124 | /// bswap'ing its fields as appropriate. If the bucket number is not valid, |
| 125 | /// this return a bucket with an empty key (0). |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 126 | HMapBucket HeaderMapImpl::getBucket(unsigned BucketNo) const { |
Duncan P. N. Exon Smith | 8d6a31c02 | 2016-02-20 21:24:31 +0000 | [diff] [blame] | 127 | assert(FileBuffer->getBufferSize() >= |
| 128 | sizeof(HMapHeader) + sizeof(HMapBucket) * BucketNo && |
| 129 | "Expected bucket to be in range"); |
| 130 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 131 | HMapBucket Result; |
| 132 | Result.Key = HMAP_EmptyBucketKey; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 133 | |
| 134 | const HMapBucket *BucketArray = |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 135 | reinterpret_cast<const HMapBucket*>(FileBuffer->getBufferStart() + |
| 136 | sizeof(HMapHeader)); |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 137 | const HMapBucket *BucketPtr = BucketArray+BucketNo; |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 138 | |
Duncan P. N. Exon Smith | 8d6a31c02 | 2016-02-20 21:24:31 +0000 | [diff] [blame] | 139 | // Load the values, bswapping as needed. |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 140 | Result.Key = getEndianAdjustedWord(BucketPtr->Key); |
| 141 | Result.Prefix = getEndianAdjustedWord(BucketPtr->Prefix); |
| 142 | Result.Suffix = getEndianAdjustedWord(BucketPtr->Suffix); |
| 143 | return Result; |
| 144 | } |
| 145 | |
| 146 | /// getString - Look up the specified string in the string table. If the string |
| 147 | /// index is not valid, it returns an empty string. |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 148 | const char *HeaderMapImpl::getString(unsigned StrTabIdx) const { |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 149 | // Add the start of the string table to the idx. |
| 150 | StrTabIdx += getEndianAdjustedWord(getHeader().StringsOffset); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 151 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 152 | // Check for invalid index. |
| 153 | if (StrTabIdx >= FileBuffer->getBufferSize()) |
Craig Topper | d2d442c | 2014-05-17 23:10:59 +0000 | [diff] [blame] | 154 | return nullptr; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 155 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 156 | // Otherwise, we have a valid pointer into the file. Just return it. We know |
| 157 | // that the "string" can not overrun the end of the file, because the buffer |
| 158 | // is nul terminated by virtue of being a MemoryBuffer. |
| 159 | return FileBuffer->getBufferStart()+StrTabIdx; |
| 160 | } |
| 161 | |
| 162 | //===----------------------------------------------------------------------===// |
| 163 | // The Main Drivers |
| 164 | //===----------------------------------------------------------------------===// |
| 165 | |
| 166 | /// dump - Print the contents of this headermap to stderr. |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 167 | LLVM_DUMP_METHOD void HeaderMapImpl::dump() const { |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 168 | const HMapHeader &Hdr = getHeader(); |
| 169 | unsigned NumBuckets = getEndianAdjustedWord(Hdr.NumBuckets); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 170 | |
| 171 | fprintf(stderr, "Header Map %s:\n %d buckets, %d entries\n", |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 172 | getFileName(), NumBuckets, |
| 173 | getEndianAdjustedWord(Hdr.NumEntries)); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 174 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 175 | for (unsigned i = 0; i != NumBuckets; ++i) { |
| 176 | HMapBucket B = getBucket(i); |
| 177 | if (B.Key == HMAP_EmptyBucketKey) continue; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 178 | |
Chris Lattner | 9f9a619 | 2007-12-17 21:06:11 +0000 | [diff] [blame] | 179 | const char *Key = getString(B.Key); |
| 180 | const char *Prefix = getString(B.Prefix); |
| 181 | const char *Suffix = getString(B.Suffix); |
| 182 | fprintf(stderr, " %d. %s -> '%s' '%s'\n", i, Key, Prefix, Suffix); |
| 183 | } |
| 184 | } |
| 185 | |
Chris Lattner | 1587e6d | 2007-12-17 08:22:46 +0000 | [diff] [blame] | 186 | /// LookupFile - Check to see if the specified relative filename is located in |
| 187 | /// this HeaderMap. If so, open it and return its FileEntry. |
Chandler Carruth | 3cc331a | 2011-03-16 18:34:36 +0000 | [diff] [blame] | 188 | const FileEntry *HeaderMap::LookupFile( |
Chris Lattner | 0e62c1c | 2011-07-23 10:55:15 +0000 | [diff] [blame] | 189 | StringRef Filename, FileManager &FM) const { |
Argyrios Kyrtzidis | 75fa9ed | 2014-02-14 14:58:28 +0000 | [diff] [blame] | 190 | |
| 191 | SmallString<1024> Path; |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 192 | StringRef Dest = HeaderMapImpl::lookupFilename(Filename, Path); |
Argyrios Kyrtzidis | 75fa9ed | 2014-02-14 14:58:28 +0000 | [diff] [blame] | 193 | if (Dest.empty()) |
Craig Topper | d2d442c | 2014-05-17 23:10:59 +0000 | [diff] [blame] | 194 | return nullptr; |
Argyrios Kyrtzidis | 75fa9ed | 2014-02-14 14:58:28 +0000 | [diff] [blame] | 195 | |
| 196 | return FM.getFile(Dest); |
| 197 | } |
| 198 | |
Duncan P. N. Exon Smith | 9ab99ee | 2016-02-20 20:39:51 +0000 | [diff] [blame] | 199 | StringRef HeaderMapImpl::lookupFilename(StringRef Filename, |
| 200 | SmallVectorImpl<char> &DestPath) const { |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 201 | const HMapHeader &Hdr = getHeader(); |
| 202 | unsigned NumBuckets = getEndianAdjustedWord(Hdr.NumBuckets); |
| 203 | |
Duncan P. N. Exon Smith | dfe8530 | 2016-02-20 21:00:58 +0000 | [diff] [blame] | 204 | // Don't probe infinitely. This should be checked before constructing. |
| 205 | assert(!(NumBuckets & (NumBuckets - 1)) && "Expected power of 2"); |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 206 | |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 207 | // Linearly probe the hash table. |
Chris Lattner | d081f8c | 2010-01-10 01:35:12 +0000 | [diff] [blame] | 208 | for (unsigned Bucket = HashHMapKey(Filename);; ++Bucket) { |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 209 | HMapBucket B = getBucket(Bucket & (NumBuckets-1)); |
Argyrios Kyrtzidis | 75fa9ed | 2014-02-14 14:58:28 +0000 | [diff] [blame] | 210 | if (B.Key == HMAP_EmptyBucketKey) return StringRef(); // Hash miss. |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 211 | |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 212 | // See if the key matches. If not, probe on. |
Benjamin Kramer | 307c2c7 | 2010-01-10 09:51:00 +0000 | [diff] [blame] | 213 | if (!Filename.equals_lower(getString(B.Key))) |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 214 | continue; |
Mike Stump | 11289f4 | 2009-09-09 15:08:12 +0000 | [diff] [blame] | 215 | |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 216 | // If so, we have a match in the hash table. Construct the destination |
| 217 | // path. |
Argyrios Kyrtzidis | 75fa9ed | 2014-02-14 14:58:28 +0000 | [diff] [blame] | 218 | StringRef Prefix = getString(B.Prefix); |
| 219 | StringRef Suffix = getString(B.Suffix); |
| 220 | DestPath.clear(); |
| 221 | DestPath.append(Prefix.begin(), Prefix.end()); |
| 222 | DestPath.append(Suffix.begin(), Suffix.end()); |
| 223 | return StringRef(DestPath.begin(), DestPath.size()); |
Chris Lattner | 619e18c | 2007-12-17 21:38:04 +0000 | [diff] [blame] | 224 | } |
Chris Lattner | 1587e6d | 2007-12-17 08:22:46 +0000 | [diff] [blame] | 225 | } |