153 lines
4.6 KiB
C++
153 lines
4.6 KiB
C++
//===- NameHashTable.cpp - PDB Name Hash Table ------------------*- C++ -*-===//
|
|
//
|
|
// The LLVM Compiler Infrastructure
|
|
//
|
|
// This file is distributed under the University of Illinois Open Source
|
|
// License. See LICENSE.TXT for details.
|
|
//
|
|
//===----------------------------------------------------------------------===//
|
|
|
|
#include "llvm/DebugInfo/PDB/Raw/NameHashTable.h"

#include "llvm/ADT/ArrayRef.h"
#include "llvm/DebugInfo/PDB/Raw/ByteStream.h"
#include "llvm/DebugInfo/PDB/Raw/RawError.h"
#include "llvm/DebugInfo/PDB/Raw/StreamReader.h"
#include "llvm/Support/Endian.h"
#include "llvm/Support/Error.h"

#include <utility>
|
|
|
|
using namespace llvm;
|
|
using namespace llvm::support;
|
|
using namespace llvm::pdb;
|
|
|
|
/// Computes the version 1 string hash of \p Str.
///
/// The bytes of the string are XOR-folded into a 32-bit accumulator: first as
/// little-endian 32-bit words, then as one little-endian 16-bit word if at
/// least two bytes are left, then as a single byte if one is left. The
/// accumulator is finally OR'ed with 0x20202020 and mixed with two
/// shift-and-xor steps.
static inline uint32_t HashStringV1(StringRef Str) {
  const uint32_t Length = Str.size();
  const uint32_t NumWords = Length / 4;

  // Fold in every complete 4-byte word.
  const ulittle32_t *Words = reinterpret_cast<const ulittle32_t *>(Str.data());
  uint32_t Acc = 0;
  for (uint32_t I = 0; I != NumWords; ++I)
    Acc ^= Words[I];

  // Between 0 and 3 bytes are left past the last complete word.
  const uint8_t *Tail = reinterpret_cast<const uint8_t *>(Words + NumWords);
  uint32_t TailSize = Length - NumWords * 4;

  // Take a 2-byte word first when one is available...
  if (TailSize >= 2) {
    const uint16_t Half = *reinterpret_cast<const ulittle16_t *>(Tail);
    Acc ^= static_cast<uint32_t>(Half);
    Tail += 2;
    TailSize -= 2;
  }

  // ...then the odd byte, if any.
  if (TailSize == 1)
    Acc ^= *Tail;

  // Set bit 0x20 in each of the four bytes (the "to lower" mask).
  const uint32_t LowerCaseBits = 0x20202020;
  Acc |= LowerCaseBits;
  Acc ^= (Acc >> 11);

  return Acc ^ (Acc >> 16);
}
|
|
|
|
/// Computes the version 2 string hash of \p Str.
///
/// Starting from the seed 0xb170a1bf, every complete little-endian 32-bit
/// word of the string is run through a mixing round, followed by each of the
/// remaining bytes (as unsigned 8-bit values). The state is then passed
/// through a final multiply-and-add step.
static inline uint32_t HashStringV2(StringRef Str) {
  uint32_t State = 0xb170a1bf;

  // One mixing round; used for both the word-wise and the byte-wise pass.
  auto Mix = [&State](uint32_t Input) {
    State += Input;
    State += (State << 10);
    State ^= (State >> 6);
  };

  const size_t WordSize = sizeof(ulittle32_t);
  const size_t Length = Str.size();
  const size_t NumWords = Length / WordSize;

  const ulittle32_t *Words = reinterpret_cast<const ulittle32_t *>(Str.data());
  for (size_t I = 0; I != NumWords; ++I)
    Mix(Words[I]);

  // Bytes that do not fill a whole word are mixed in one at a time.
  for (size_t I = NumWords * WordSize; I != Length; ++I)
    Mix(static_cast<uint8_t>(Str[I]));

  return State * 1664525L + 1013904223L;
}
|
|
|
|
/// Creates a table whose signature, hash version and name count are all zero.
NameHashTable::NameHashTable()
    : Signature(0),
      HashVersion(0),
      NameCount(0) {
}
|
|
|
|
/// Reads the name hash table from \p Stream.
///
/// The data is consumed in this order: a header of three little-endian 32-bit
/// fields (signature, hash version, byte size of the names buffer), the names
/// buffer, a 32-bit bucket count, that many 32-bit bucket entries, and a
/// 32-bit name count.
///
/// \returns Error::success() when everything was read. A RawError carrying
/// raw_error_code::corrupt_file is returned for a wrong signature, an
/// unsupported hash version, or a table that is shorter than its own counts
/// claim. When a lower-level read fails, its error is either returned as-is
/// or joined with the RawError describing the context; it is never dropped.
Error NameHashTable::load(StreamReader &Stream) {
  struct Header {
    support::ulittle32_t Signature;
    support::ulittle32_t HashVersion;
    support::ulittle32_t ByteSize;
  };

  Header H;
  if (auto EC = Stream.readObject(&H))
    return EC;

  if (H.Signature != 0xEFFEEFFE)
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Invalid hash table signature");
  if (H.HashVersion != 1 && H.HashVersion != 2)
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Unsupported hash version");

  Signature = H.Signature;
  HashVersion = H.HashVersion;

  // An Error in the failure state must be handled before it is destroyed, so
  // the underlying error is joined with the diagnostic instead of being
  // silently discarded.
  if (auto EC = NamesBuffer.initialize(Stream, H.ByteSize))
    return joinErrors(std::move(EC),
                      make_error<RawError>(raw_error_code::corrupt_file,
                                           "Invalid hash table byte length"));

  support::ulittle32_t HashCount;
  if (auto EC = Stream.readObject(&HashCount))
    return EC;

  // The bucket count comes straight from the file. Reject a count that cannot
  // possibly fit in what is left of the stream before allocating storage for
  // it, so a corrupt file cannot trigger an enormous allocation.
  const uint32_t NumBuckets = HashCount;
  if (NumBuckets > Stream.bytesRemaining() / sizeof(support::ulittle32_t))
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Could not read bucket array");

  std::vector<support::ulittle32_t> BucketArray(NumBuckets);
  if (auto EC = Stream.readArray<support::ulittle32_t>(BucketArray))
    return joinErrors(std::move(EC),
                      make_error<RawError>(raw_error_code::corrupt_file,
                                           "Could not read bucket array"));
  IDs.assign(BucketArray.begin(), BucketArray.end());

  if (Stream.bytesRemaining() < sizeof(support::ulittle32_t))
    return make_error<RawError>(raw_error_code::corrupt_file,
                                "Missing name count");

  if (auto EC = Stream.readInteger(NameCount))
    return EC;
  return Error::success();
}
|
|
|
|
/// Returns the string that starts at byte offset \p ID of the names buffer.
///
/// An empty StringRef is returned when \p ID equals IDs[0], which this class
/// treats as the ID of the "invalid" entry, and also when \p ID does not fall
/// inside the names buffer.
StringRef NameHashTable::getStringForID(uint32_t ID) const {
  // Only consult the sentinel when there is one; IDs may be empty.
  if (!IDs.empty() && ID == IDs[0])
    return StringRef();

  // IDs originate from the file being parsed, so they are not trusted: an
  // offset past the end of the buffer yields no string instead of an
  // out-of-bounds read.
  StringRef Names = NamesBuffer.str();
  if (ID >= Names.size())
    return StringRef();

  // The string runs up to the next NUL byte. If the buffer ends without one,
  // stop at the end of the buffer (find() returns npos, which substr() clamps).
  StringRef Tail = Names.substr(ID);
  return Tail.substr(0, Tail.find('\0'));
}
|
|
|
|
/// Looks up the ID under which \p Str is stored.
///
/// The string is hashed with the function selected by HashVersion (version 1
/// when it equals 1, version 2 otherwise) and the ID array is probed linearly,
/// wrapping around, starting at the hashed position.
///
/// \returns the matching ID, or IDs[0] (the ID of the "invalid" entry) when no
/// entry matches. If the table holds no IDs at all, 0 is returned because
/// there is no sentinel entry to report.
uint32_t NameHashTable::getIDForString(StringRef Str) const {
  const size_t Count = IDs.size();
  // Without any entries both the modulo below and the IDs[0] fallback would
  // be invalid, so bail out early.
  if (Count == 0)
    return 0;

  const uint32_t Hash =
      (HashVersion == 1) ? HashStringV1(Str) : HashStringV2(Str);
  const uint32_t Start = Hash % Count;
  for (size_t I = 0; I < Count; ++I) {
    // The hash is just a starting point for the search, but if it
    // doesn't work we should find the string no matter what, because
    // we iterate the entire array.
    const uint32_t Index = (Start + I) % Count;

    const uint32_t ID = IDs[Index];
    if (getStringForID(ID) == Str)
      return ID;
  }
  // IDs[0] contains the ID of the "invalid" entry.
  return IDs[0];
}
|
|
|
|
/// Returns a view of the IDs that follow the first entry of the ID array.
///
/// The view starts at index 1 and holds NameCount elements. NameCount is read
/// from the file, so it is clamped to the number of entries actually present
/// after index 0; an empty ID array yields an empty view.
ArrayRef<uint32_t> NameHashTable::name_ids() const {
  ArrayRef<uint32_t> All(IDs);
  if (All.empty())
    return ArrayRef<uint32_t>();

  // Never let the slice extend past the end of the array.
  const size_t Available = All.size() - 1;
  const size_t Wanted = NameCount;
  return All.slice(1, Wanted < Available ? Wanted : Available);
}
|