diff options
-rw-r--r-- | llvm/include/llvm/DebugInfo/PDB/Raw/ByteStream.h | 1 | ||||
-rw-r--r-- | llvm/include/llvm/DebugInfo/PDB/Raw/DbiStream.h | 2 | ||||
-rw-r--r-- | llvm/include/llvm/DebugInfo/PDB/Raw/NameHashTable.h | 48 | ||||
-rw-r--r-- | llvm/include/llvm/DebugInfo/PDB/Raw/StreamReader.h | 5 | ||||
-rw-r--r-- | llvm/lib/DebugInfo/PDB/CMakeLists.txt | 1 | ||||
-rw-r--r-- | llvm/lib/DebugInfo/PDB/Raw/ByteStream.cpp | 5 | ||||
-rw-r--r-- | llvm/lib/DebugInfo/PDB/Raw/DbiStream.cpp | 4 | ||||
-rw-r--r-- | llvm/lib/DebugInfo/PDB/Raw/NameHashTable.cpp | 141 | ||||
-rw-r--r-- | llvm/test/DebugInfo/PDB/pdbdump-headers.test | 15 | ||||
-rw-r--r-- | llvm/tools/llvm-pdbdump/llvm-pdbdump.cpp | 34 |
10 files changed, 231 insertions, 25 deletions
diff --git a/llvm/include/llvm/DebugInfo/PDB/Raw/ByteStream.h b/llvm/include/llvm/DebugInfo/PDB/Raw/ByteStream.h index eacd4c417da..e9209f91b64 100644 --- a/llvm/include/llvm/DebugInfo/PDB/Raw/ByteStream.h +++ b/llvm/include/llvm/DebugInfo/PDB/Raw/ByteStream.h @@ -38,6 +38,7 @@ public: uint32_t getLength() const override; ArrayRef<uint8_t> data() const { return Data; } + StringRef str() const; private: MutableArrayRef<uint8_t> Data; diff --git a/llvm/include/llvm/DebugInfo/PDB/Raw/DbiStream.h b/llvm/include/llvm/DebugInfo/PDB/Raw/DbiStream.h index 1e21be963e0..e94c4a80f3a 100644 --- a/llvm/include/llvm/DebugInfo/PDB/Raw/DbiStream.h +++ b/llvm/include/llvm/DebugInfo/PDB/Raw/DbiStream.h @@ -14,6 +14,7 @@ #include "llvm/DebugInfo/PDB/Raw/ByteStream.h" #include "llvm/DebugInfo/PDB/Raw/MappedBlockStream.h" #include "llvm/DebugInfo/PDB/Raw/ModInfo.h" +#include "llvm/DebugInfo/PDB/Raw/NameHashTable.h" #include "llvm/DebugInfo/PDB/Raw/RawConstants.h" #include "llvm/Support/Endian.h" @@ -54,6 +55,7 @@ private: MappedBlockStream Stream; std::vector<ModuleInfoEx> ModuleInfos; + NameHashTable ECNames; ByteStream ModInfoSubstream; ByteStream SecContrSubstream; diff --git a/llvm/include/llvm/DebugInfo/PDB/Raw/NameHashTable.h b/llvm/include/llvm/DebugInfo/PDB/Raw/NameHashTable.h new file mode 100644 index 00000000000..22807856be0 --- /dev/null +++ b/llvm/include/llvm/DebugInfo/PDB/Raw/NameHashTable.h @@ -0,0 +1,48 @@ +//===- NameHashTable.h - PDB Name Hash Table --------------------*- C++ -*-===// +// +// The LLVM Compiler Infrastructure +// +// This file is distributed under the University of Illinois Open Source +// License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// + +#ifndef LLVM_DEBUGINFO_PDB_RAW_NAMEHASHTABLE_H +#define LLVM_DEBUGINFO_PDB_RAW_NAMEHASHTABLE_H + +#include "llvm/ADT/StringMap.h" +#include "llvm/ADT/StringRef.h" +#include "llvm/DebugInfo/PDB/Raw/ByteStream.h" + +#include <stdint.h> +#include <utility> + +namespace llvm { +namespace pdb { +class StreamReader; +class NameHashTable { +public: + NameHashTable(); + + std::error_code load(StreamReader &Stream); + + uint32_t getNameCount() const { return NameCount; } + uint32_t getHashVersion() const { return HashVersion; } + uint32_t getSignature() const { return Signature; } + + StringRef getStringForID(uint32_t ID) const; + uint32_t getIDForString(StringRef Str) const; + + ArrayRef<uint32_t> name_ids() const; + +private: + ByteStream NamesBuffer; + std::vector<uint32_t> IDs; + uint32_t Signature; + uint32_t HashVersion; + uint32_t NameCount; +}; +} +} + +#endif diff --git a/llvm/include/llvm/DebugInfo/PDB/Raw/StreamReader.h b/llvm/include/llvm/DebugInfo/PDB/Raw/StreamReader.h index 2dd9dca1861..5a524ffc5af 100644 --- a/llvm/include/llvm/DebugInfo/PDB/Raw/StreamReader.h +++ b/llvm/include/llvm/DebugInfo/PDB/Raw/StreamReader.h @@ -34,6 +34,11 @@ public: return readBytes(Buffer); } + template <typename T> std::error_code readArray(MutableArrayRef<T> Array) { + MutableArrayRef<uint8_t> Casted(reinterpret_cast<uint8_t*>(Array.data()), Array.size() * sizeof(T)); + return readBytes(Casted); + } + void setOffset(uint32_t Off) { Offset = Off; } uint32_t getOffset() const { return Offset; } uint32_t getLength() const { return Stream.getLength(); } diff --git a/llvm/lib/DebugInfo/PDB/CMakeLists.txt b/llvm/lib/DebugInfo/PDB/CMakeLists.txt index d6a3d2bf71c..2fa74b96246 100644 --- a/llvm/lib/DebugInfo/PDB/CMakeLists.txt +++ b/llvm/lib/DebugInfo/PDB/CMakeLists.txt @@ -33,6 +33,7 @@ add_pdb_impl_folder(Raw Raw/PDBFile.cpp Raw/DbiStream.cpp Raw/InfoStream.cpp + Raw/NameHashTable.cpp Raw/NameMap.cpp Raw/RawSession.cpp Raw/StreamReader.cpp) diff --git a/llvm/lib/DebugInfo/PDB/Raw/ByteStream.cpp b/llvm/lib/DebugInfo/PDB/Raw/ByteStream.cpp index d8b78ec2248..89477ead223 100644 --- a/llvm/lib/DebugInfo/PDB/Raw/ByteStream.cpp +++ b/llvm/lib/DebugInfo/PDB/Raw/ByteStream.cpp @@ -59,3 +59,8 @@ std::error_code ByteStream::readBytes(uint32_t Offset, } uint32_t ByteStream::getLength() const { return Data.size(); } + +StringRef ByteStream::str() const { + const char *CharData = reinterpret_cast<const char *>(Data.data()); + return StringRef(CharData, Data.size()); +} diff --git a/llvm/lib/DebugInfo/PDB/Raw/DbiStream.cpp b/llvm/lib/DebugInfo/PDB/Raw/DbiStream.cpp index 7762fa34ceb..57f7644d034 100644 --- a/llvm/lib/DebugInfo/PDB/Raw/DbiStream.cpp +++ b/llvm/lib/DebugInfo/PDB/Raw/DbiStream.cpp @@ -10,6 +10,7 @@ #include "llvm/DebugInfo/PDB/Raw/DbiStream.h" #include "llvm/DebugInfo/PDB/Raw/InfoStream.h" #include "llvm/DebugInfo/PDB/Raw/ModInfo.h" +#include "llvm/DebugInfo/PDB/Raw/NameHashTable.h" #include "llvm/DebugInfo/PDB/Raw/PDBFile.h" #include "llvm/DebugInfo/PDB/Raw/RawConstants.h" #include "llvm/DebugInfo/PDB/Raw/StreamReader.h" @@ -148,6 +149,9 @@ std::error_code DbiStream::reload() { if (Reader.bytesRemaining() > 0) return std::make_error_code(std::errc::illegal_byte_sequence); + StreamReader ECReader(ECSubstream); + ECNames.load(ECReader); + return std::error_code(); } diff --git a/llvm/lib/DebugInfo/PDB/Raw/NameHashTable.cpp b/llvm/lib/DebugInfo/PDB/Raw/NameHashTable.cpp new file mode 100644 index 00000000000..3e8de73609f --- /dev/null +++ b/llvm/lib/DebugInfo/PDB/Raw/NameHashTable.cpp @@ -0,0 +1,141 @@ +//===- NameHashTable.cpp - PDB Name Hash Table ------------------*- C++ -*-===// +// +// The LLVM Compiler Infrastructure +// +// This file is distributed under the University of Illinois Open Source +// License. See LICENSE.TXT for details. +// +//===----------------------------------------------------------------------===// + +#include "llvm/DebugInfo/PDB/Raw/NameHashTable.h" + +#include "llvm/ADT/ArrayRef.h" +#include "llvm/DebugInfo/PDB/Raw/ByteStream.h" +#include "llvm/DebugInfo/PDB/Raw/StreamReader.h" +#include "llvm/Support/Endian.h" + +using namespace llvm; +using namespace llvm::support; +using namespace llvm::pdb; + +typedef uint32_t *PUL; +typedef uint16_t *PUS; + +static inline uint32_t HashStringV1(StringRef Str) { + uint32_t Result = 0; + uint32_t Size = Str.size(); + + ArrayRef<ulittle32_t> Longs(reinterpret_cast<const ulittle32_t *>(Str.data()), + Size / 4); + + for (auto Value : Longs) + Result ^= Value; + + const uint8_t *Remainder = reinterpret_cast<const uint8_t *>(Longs.end()); + uint32_t RemainderSize = Size - Longs.size() * 4; + + // Maximum of 3 bytes left. Hash a 2 byte word if possible, then hash the + // possibly remaining 1 byte. + if (RemainderSize >= 2) { + Result ^= *reinterpret_cast<const ulittle16_t *>(Remainder); + Remainder += 2; + RemainderSize -= 2; + } + + // hash possible odd byte + if (RemainderSize == 1) { + Result ^= *(Remainder++); + } + + const uint32_t toLowerMask = 0x20202020; + Result |= toLowerMask; + Result ^= (Result >> 11); + + return Result ^ (Result >> 16); +} + +static inline uint32_t HashStringV2(StringRef Str) { + uint32_t Hash = 0xb170a1bf; + + ArrayRef<char> Buffer(Str.begin(), Str.end()); + + ArrayRef<ulittle32_t> Items( + reinterpret_cast<const ulittle32_t *>(Buffer.data()), + Buffer.size() / sizeof(ulittle32_t)); + for (ulittle32_t Item : Items) { + Hash += Item; + Hash += (Hash << 10); + Hash ^= (Hash >> 6); + } + Buffer = Buffer.slice(Items.size() * sizeof(ulittle32_t)); + for (uint8_t Item : Buffer) { + Hash += Item; + Hash += (Hash << 10); + Hash ^= (Hash >> 6); + } + + return Hash * 1664525L + 1013904223L; +} + +NameHashTable::NameHashTable() : Signature(0), HashVersion(0), NameCount(0) {} + +std::error_code NameHashTable::load(StreamReader &Stream) { + struct Header { + support::ulittle32_t Signature; + support::ulittle32_t HashVersion; + support::ulittle32_t ByteSize; + }; + + Header H; + Stream.readObject(&H); + if (H.Signature != 0xEFFEEFFE) + return std::make_error_code(std::errc::illegal_byte_sequence); + if (H.HashVersion != 1 && H.HashVersion != 2) + return std::make_error_code(std::errc::not_supported); + + Signature = H.Signature; + HashVersion = H.HashVersion; + NamesBuffer.initialize(Stream, H.ByteSize); + + support::ulittle32_t HashCount; + Stream.readObject(&HashCount); + std::vector<support::ulittle32_t> BucketArray(HashCount); + Stream.readArray<support::ulittle32_t>(BucketArray); + IDs.assign(BucketArray.begin(), BucketArray.end()); + + if (Stream.bytesRemaining() < sizeof(support::ulittle32_t)) + return std::make_error_code(std::errc::illegal_byte_sequence); + + Stream.readInteger(NameCount); + return std::error_code(); +} + +StringRef NameHashTable::getStringForID(uint32_t ID) const { + if (ID == IDs[0]) + return StringRef(); + + return StringRef(NamesBuffer.str().begin() + ID); +} + +uint32_t NameHashTable::getIDForString(StringRef Str) const { + uint32_t Hash = (HashVersion == 1) ? HashStringV1(Str) : HashStringV2(Str); + size_t Count = IDs.size(); + uint32_t Start = Hash % Count; + for (size_t I = 0; I < Count; ++I) { + // The hash is just a starting point for the search, but if it + // doesn't work we should find the string no matter what, because + // we iterate the entire array. + uint32_t Index = (Start + I) % Count; + + uint32_t ID = IDs[Index]; + StringRef S = getStringForID(ID); + if (S == Str) + return ID; + } + // IDs[0] contains the ID of the "invalid" entry. + return IDs[0]; +} + +ArrayRef<uint32_t> NameHashTable::name_ids() const { + return ArrayRef<uint32_t>(IDs).slice(1, NameCount); +} diff --git a/llvm/test/DebugInfo/PDB/pdbdump-headers.test b/llvm/test/DebugInfo/PDB/pdbdump-headers.test index 92999827e45..6b4c61cf8b6 100644 --- a/llvm/test/DebugInfo/PDB/pdbdump-headers.test +++ b/llvm/test/DebugInfo/PDB/pdbdump-headers.test @@ -20,6 +20,11 @@ ; EMPTY: NameStream: 13 ; EMPTY-NEXT: NameStreamSignature: effeeffe ; EMPTY-NEXT: NameStreamVersion: 1 +; EMPTY-NEXT: Name Count: 4 +; EMPTY-NEXT: Name: d:\src\llvm\test\debuginfo\pdb\inputs\predefined c++ attributes (compiler internal) +; EMPTY-NEXT: Name: +; EMPTY-NEXT: Name: d:\src\llvm\test\debuginfo\pdb\inputs\empty.cpp +; EMPTY-NEXT: Name: ; EMPTY: Dbi Version: 19990903 ; EMPTY-NEXT: Age: 1 @@ -76,6 +81,16 @@ BIG-NEXT: Guid: {880ECC89-DF81-0B4F-839C-58CBD052E937} BIG: NameStream: 13 BIG-NEXT: NameStreamSignature: effeeffe BIG-NEXT: NameStreamVersion: 1 +BIG-NEXT: Name Count: 92 +BIG-NEXT: Name: f:\dd\vctools\crt\vcruntime\inc\vcruntime_startup.h +BIG-NEXT: Name: f:\dd\vctools\crt\vcstartup\src\misc\checkcfg.c +BIG-NEXT: Name: f:\dd\vctools\langapi\include\isa_availability.h +BIG-NEXT: Name: +BIG-NEXT: Name: $T0 $ebp = $T2 $esp = $T1 .raSearchStart = $eip $T1 ^ = $ebp $T0 = $esp $T1 4 + = +BIG-NEXT: Name: +BIG-NEXT: Name: f:\dd\vctools\crt\vcstartup\src\startup\exe_common.inl +BIG-NEXT: Name: $T0 $ebp = $eip $T0 4 + ^ = $ebp $T0 ^ = $esp $T0 8 + = $20 $T0 40 - ^ = $23 $T0 44 - ^ = $24 $T0 48 - ^ = +BIG-NEXT: Name: $T0 $ebp = $eip $T0 4 + ^ = $ebp $T0 ^ = $esp $T0 8 + = $23 $T0 16 - ^ = $24 $T0 20 - ^ = BIG: Dbi Version: 19990903 BIG-NEXT: Age: 1 diff --git a/llvm/tools/llvm-pdbdump/llvm-pdbdump.cpp b/llvm/tools/llvm-pdbdump/llvm-pdbdump.cpp index fec28a9391f..a1fe8d50681 100644 --- a/llvm/tools/llvm-pdbdump/llvm-pdbdump.cpp +++ b/llvm/tools/llvm-pdbdump/llvm-pdbdump.cpp @@ -39,6 +39,7 @@ #include "llvm/DebugInfo/PDB/Raw/InfoStream.h" #include "llvm/DebugInfo/PDB/Raw/MappedBlockStream.h" #include "llvm/DebugInfo/PDB/Raw/ModInfo.h" +#include "llvm/DebugInfo/PDB/Raw/NameHashTable.h" #include "llvm/DebugInfo/PDB/Raw/PDBFile.h" #include "llvm/DebugInfo/PDB/Raw/RawSession.h" #include "llvm/DebugInfo/PDB/Raw/StreamReader.h" @@ -147,19 +148,6 @@ cl::opt<bool> NoEnumDefs("no-enum-definitions", cl::cat(FilterCategory)); } - -static void reportError(StringRef Input, StringRef Message) { - if (Input == "-") - Input = "<stdin>"; - errs() << Input << ": " << Message << "\n"; - errs().flush(); - exit(1); -} - -static void reportError(StringRef Input, std::error_code EC) { - reportError(Input, EC.message()); -} - static void dumpStructure(RawSession &RS) { PDBFile &File = RS.getPDBFile(); @@ -253,19 +241,15 @@ static void dumpStructure(RawSession &RS) { outs() << "NameStream: " << NameStreamIndex << '\n'; - // The name stream appears to start with a signature and version. - uint32_t NameStreamSignature; - Reader.readInteger(NameStreamSignature); + NameHashTable NameTable; + NameTable.load(Reader); outs() << "NameStreamSignature: "; - outs().write_hex(NameStreamSignature) << '\n'; - - uint32_t NameStreamVersion; - Reader.readInteger(NameStreamVersion); - outs() << "NameStreamVersion: " << NameStreamVersion << '\n'; - - // We only support this particular version of the name stream. - if (NameStreamSignature != 0xeffeeffe || NameStreamVersion != 1) - reportError("", std::make_error_code(std::errc::not_supported)); + outs().write_hex(NameTable.getSignature()) << '\n'; + outs() << "NameStreamVersion: " << NameTable.getHashVersion() << '\n'; + outs() << "Name Count: " << NameTable.getNameCount() << '\n'; + for (uint32_t ID : NameTable.name_ids()) { + outs() << "Name: " << NameTable.getStringForID(ID) << '\n'; + } } DbiStream &DS = File.getPDBDbiStream(); |