| //===- NameHashTable.cpp - PDB Name Hash Table ------------------*- C++ -*-===// |
| // |
| // The LLVM Compiler Infrastructure |
| // |
| // This file is distributed under the University of Illinois Open Source |
| // License. See LICENSE.TXT for details. |
| // |
| //===----------------------------------------------------------------------===// |
| |
| #include "llvm/DebugInfo/PDB/Raw/NameHashTable.h" |
| |
| #include "llvm/ADT/ArrayRef.h" |
| #include "llvm/DebugInfo/PDB/Raw/ByteStream.h" |
| #include "llvm/DebugInfo/PDB/Raw/RawError.h" |
| #include "llvm/DebugInfo/PDB/Raw/StreamReader.h" |
| #include "llvm/Support/Endian.h" |
| |
| using namespace llvm; |
| using namespace llvm::support; |
| using namespace llvm::pdb; |
| |
| static inline uint32_t HashStringV1(StringRef Str) { |
| uint32_t Result = 0; |
| uint32_t Size = Str.size(); |
| |
| ArrayRef<ulittle32_t> Longs(reinterpret_cast<const ulittle32_t *>(Str.data()), |
| Size / 4); |
| |
| for (auto Value : Longs) |
| Result ^= Value; |
| |
| const uint8_t *Remainder = reinterpret_cast<const uint8_t *>(Longs.end()); |
| uint32_t RemainderSize = Size - Longs.size() * 4; |
| |
| // Maximum of 3 bytes left. Hash a 2 byte word if possible, then hash the |
| // possibly remaining 1 byte. |
| if (RemainderSize >= 2) { |
| uint16_t Value = *reinterpret_cast<const ulittle16_t *>(Remainder); |
| Result ^= static_cast<uint32_t>(Value); |
| Remainder += 2; |
| RemainderSize -= 2; |
| } |
| |
| // hash possible odd byte |
| if (RemainderSize == 1) { |
| Result ^= *(Remainder++); |
| } |
| |
| const uint32_t toLowerMask = 0x20202020; |
| Result |= toLowerMask; |
| Result ^= (Result >> 11); |
| |
| return Result ^ (Result >> 16); |
| } |
| |
| static inline uint32_t HashStringV2(StringRef Str) { |
| uint32_t Hash = 0xb170a1bf; |
| |
| ArrayRef<char> Buffer(Str.begin(), Str.end()); |
| |
| ArrayRef<ulittle32_t> Items( |
| reinterpret_cast<const ulittle32_t *>(Buffer.data()), |
| Buffer.size() / sizeof(ulittle32_t)); |
| for (ulittle32_t Item : Items) { |
| Hash += Item; |
| Hash += (Hash << 10); |
| Hash ^= (Hash >> 6); |
| } |
| Buffer = Buffer.slice(Items.size() * sizeof(ulittle32_t)); |
| for (uint8_t Item : Buffer) { |
| Hash += Item; |
| Hash += (Hash << 10); |
| Hash ^= (Hash >> 6); |
| } |
| |
| return Hash * 1664525L + 1013904223L; |
| } |
| |
| NameHashTable::NameHashTable() : Signature(0), HashVersion(0), NameCount(0) {} |
| |
| Error NameHashTable::load(StreamReader &Stream) { |
| struct Header { |
| support::ulittle32_t Signature; |
| support::ulittle32_t HashVersion; |
| support::ulittle32_t ByteSize; |
| }; |
| |
| Header H; |
| if (auto EC = Stream.readObject(&H)) |
| return EC; |
| |
| if (H.Signature != 0xEFFEEFFE) |
| return make_error<RawError>(raw_error_code::corrupt_file, |
| "Invalid hash table signature"); |
| if (H.HashVersion != 1 && H.HashVersion != 2) |
| return make_error<RawError>(raw_error_code::corrupt_file, |
| "Unsupported hash version"); |
| |
| Signature = H.Signature; |
| HashVersion = H.HashVersion; |
| if (auto EC = NamesBuffer.initialize(Stream, H.ByteSize)) |
| return make_error<RawError>(raw_error_code::corrupt_file, |
| "Invalid hash table byte length"); |
| |
| support::ulittle32_t HashCount; |
| if (auto EC = Stream.readObject(&HashCount)) |
| return EC; |
| |
| std::vector<support::ulittle32_t> BucketArray(HashCount); |
| if (auto EC = Stream.readArray<support::ulittle32_t>(BucketArray)) |
| return make_error<RawError>(raw_error_code::corrupt_file, |
| "Could not read bucket array"); |
| IDs.assign(BucketArray.begin(), BucketArray.end()); |
| |
| if (Stream.bytesRemaining() < sizeof(support::ulittle32_t)) |
| return make_error<RawError>(raw_error_code::corrupt_file, |
| "Missing name count"); |
| |
| if (auto EC = Stream.readInteger(NameCount)) |
| return EC; |
| return Error::success(); |
| } |
| |
| StringRef NameHashTable::getStringForID(uint32_t ID) const { |
| if (ID == IDs[0]) |
| return StringRef(); |
| |
| return StringRef(NamesBuffer.str().begin() + ID); |
| } |
| |
| uint32_t NameHashTable::getIDForString(StringRef Str) const { |
| uint32_t Hash = (HashVersion == 1) ? HashStringV1(Str) : HashStringV2(Str); |
| size_t Count = IDs.size(); |
| uint32_t Start = Hash % Count; |
| for (size_t I = 0; I < Count; ++I) { |
| // The hash is just a starting point for the search, but if it |
| // doesn't work we should find the string no matter what, because |
| // we iterate the entire array. |
| uint32_t Index = (Start + I) % Count; |
| |
| uint32_t ID = IDs[Index]; |
| StringRef S = getStringForID(ID); |
| if (S == Str) |
| return ID; |
| } |
| // IDs[0] contains the ID of the "invalid" entry. |
| return IDs[0]; |
| } |
| |
| ArrayRef<uint32_t> NameHashTable::name_ids() const { |
| return ArrayRef<uint32_t>(IDs).slice(1, NameCount); |
| } |