Convert over to the latest and greatest on disc accelerator

hash tables. Renamed the DWARF sections to ".apple_names" and ".apple_types" until we get more buy in from other vendors. llvm-svn: 140702
author: Greg Clayton <gclayton@apple.com> 2011-09-28 17:06:40 +0000
committer: Greg Clayton <gclayton@apple.com> 2011-09-28 17:06:40 +0000
commit: 1767440a72c9e385f520c279e46d359b4030d54c (patch)
tree: c2af8d9378f2a06729b249710522cc04d538b40a /lldb/source/Plugins/SymbolFile/DWARF/HashedNameToDIE.cpp
parent: ef8e4efff8f247a0dd216e9485d321c612dac760 (diff)
download: bcm5719-llvm-1767440a72c9e385f520c279e46d359b4030d54c.tar.gz
bcm5719-llvm-1767440a72c9e385f520c279e46d359b4030d54c.zip
1 files changed, 242 insertions, 81 deletions
diff --git a/lldb/source/Plugins/SymbolFile/DWARF/HashedNameToDIE.cpp b/lldb/source/Plugins/SymbolFile/DWARF/HashedNameToDIE.cpp
index 3ee478ebc56..1a764913a8e 100644
--- a/lldb/source/Plugins/SymbolFile/DWARF/HashedNameToDIE.cpp
+++ b/lldb/source/Plugins/SymbolFile/DWARF/HashedNameToDIE.cpp
@@ -18,6 +18,7 @@
 #include "DWARFCompileUnit.h"
 #include "DWARFDebugInfo.h"
 #include "DWARFDebugInfoEntry.h"
+#include "DWARFDefines.h"
 #include "SymbolFileDWARF.h"
 using namespace lldb;
 using namespace lldb_private;
@@ -33,115 +34,275 @@ dl_new_hash (const char *s)
     return h;
 }
 
-HashedNameToDIE::HashedNameToDIE (SymbolFileDWARF *dwarf, const DataExtractor &data) :
-    m_dwarf (dwarf),
-    m_data (data),
-    m_header  ()
+
+void
+HashedNameToDIE::Header::Dump (Stream &s)
 {
+    s.Printf ("header.magic              = 0x%8.8x", magic);
+    s.Printf ("header.version            = 0x%4.4x", version);
+    s.Printf ("header.addr_bytesize      = 0x%2.2x", addr_bytesize);
+    s.Printf ("header.hash_function      = 0x%2.2x", hash_function);
+    s.Printf ("header.hash_count_bitsize = 0x%2.2x", hash_count_bitsize);
+    s.Printf ("header.hash_index_bitsize = 0x%2.2x", hash_index_bitsize);
+    s.Printf ("header.hash_bytesize      = 0x%2.2x", hash_bytesize);
+    s.Printf ("header.offset_bytesize    = 0x%2.2x", offset_bytesize);
+    s.Printf ("header.bucket_count       = 0x%8.8x %u", bucket_count, bucket_count);
+    s.Printf ("header.hashes_count       = 0x%8.8x %u", hashes_count, hashes_count);
+    s.Printf ("header.prologue_length    = 0x%8.8x %u", prologue_length, prologue_length);
+}
+
+uint32_t
+HashedNameToDIE::Header::Read (const DataExtractor &data, uint32_t offset)
+{
+    magic = data.GetU32 (&offset);
+    if (magic != HASH_MAGIC)
+    {
+        // Magic bytes didn't match
+        version = 0;
+        return UINT32_MAX;
+    }
+    
+    version = data.GetU16 (&offset);
+    if (version != 1)
+    {
+        // Unsupported version
+        return UINT32_MAX;
+    }
+    addr_bytesize       = data.GetU8  (&offset);
+    hash_function       = data.GetU8  (&offset);
+    hash_count_bitsize  = data.GetU8  (&offset);
+    hash_index_bitsize  = data.GetU8  (&offset);
+    hash_bytesize       = data.GetU8  (&offset);
+    offset_bytesize     = data.GetU8  (&offset);
+    bucket_count        = data.GetU32 (&offset);
+    hashes_count        = data.GetU32 (&offset);
+    prologue_length     = data.GetU32 (&offset);
+    return offset;
 }
 
 void
-HashedNameToDIE::Initialize()
+HashedNameToDIE::DWARF::Header::Dump (Stream &s)
 {
-    uint32_t offset = 0;
-    m_header.version = m_data.GetU16(&offset);
-    if (m_header.version)
+    HashedNameToDIE::Header::Dump (s);
+    dwarf_prologue.Dump (s);
+}
+
+uint32_t
+HashedNameToDIE::DWARF::Header::Read (const DataExtractor &data, uint32_t offset)
+{
+    offset = HashedNameToDIE::Header::Read (data, offset);
+    if (offset != UINT32_MAX)
+        offset = dwarf_prologue.Read (data, offset);
+    else
+        dwarf_prologue.Clear();
+    return offset;
+}
+
+void
+HashedNameToDIE::DWARF::Prologue::Dump (Stream &s)
+{
+    s.Printf ("dwarf_prologue.die_base_offset    = 0x%8.8x\n", die_base_offset);
+    const size_t num_atoms = atoms.size();
+    for (size_t i = 0; i < num_atoms; ++i)
     {
-        m_header.hash_type = m_data.GetU8(&offset);
-        m_header.hash_index_bitsize = m_data.GetU8(&offset);
-        m_header.num_buckets = m_data.GetU32(&offset);
-        m_header.num_hashes = m_data.GetU32(&offset);
-        m_header.die_offset_base = m_data.GetU32(&offset);
+        s.Printf ("dwarf_prologue.atom[%zi] = %17s %s\n", 
+                  i, 
+                  GetAtomTypeName (atoms[i].type), 
+                  DW_FORM_value_to_name(atoms[i].form));
     }
 }
 
-size_t
-HashedNameToDIE::Find (const ConstString &name, DIEArray &die_ofsets) const
+uint32_t
+HashedNameToDIE::DWARF::Prologue::Read (const DataExtractor &data, uint32_t offset)
 {
-    const size_t initial_size = die_ofsets.size();
-    const char *name_cstr = name.GetCString();
-    if (name_cstr && name_cstr[0])
+    Clear();
+    die_base_offset = data.GetU32 (&offset);
+    Atom atom;
+    while (offset != UINT32_MAX)
     {
-        // Hash the C string
-        const uint32_t name_hash = dl_new_hash (name_cstr);
-        
-        // Find the correct bucket for the using the hash value
-        const uint32_t bucket_idx = name_hash % m_header.num_buckets;
-        
-        // Calculate the offset for the bucket entry for the bucket index
-        uint32_t offset = GetOffsetOfBucketEntry (bucket_idx);
+        atom.type = data.GetU16 (&offset);
+        atom.form = data.GetU16 (&offset);
+        if (atom.type == eAtomTypeNULL)
+            break;
+        atoms.push_back(atom);
+    }
+    return offset;
+}
+
+
+HashedNameToDIE::MemoryTable::MemoryTable (SymbolFileDWARF *dwarf, 
+                                           const lldb_private::DataExtractor &data,
+                                           bool is_apple_names) :
+    m_data (data),
+    m_string_table (dwarf->get_debug_str_data ()),
+    m_is_apple_names (is_apple_names),
+    m_header  ()
+{
+}
 
-        // Extract the bucket entry.
-        const uint32_t bucket_entry = m_data.GetU32 (&offset);
-        if (bucket_entry)
+bool
+HashedNameToDIE::MemoryTable::Initialize ()
+{
+    uint32_t offset = 0;
+    offset = m_header.Read (m_data, offset);
+    return m_header.version == 1;
+}
+
+
+size_t
+HashedNameToDIE::MemoryTable::Find (const char *name_cstr, DIEArray &die_ofsets) const
+{
+    if (m_header.version == 1)
+    {
+        const size_t initial_size = die_ofsets.size();
+        if (name_cstr && name_cstr[0])
         {
-            // The bucket entry is non-zero which means it isn't empty.
-            // The bucket entry is made up of a hash index whose bit width
-            // is m_header.hash_index_bitsize, and a hash count whose value
-            // is the remaining bits in the 32 bit value. Below we extract
-            // the hash index and the hash count
-            const uint32_t hash_idx = bucket_entry & GetHashIndexMask();
-            const uint32_t hash_count = bucket_entry >> m_header.hash_index_bitsize;
-            const uint32_t hash_end_idx = hash_idx + hash_count;
-            // Figure out the offset to the hash value by index
-            uint32_t hash_offset = GetOffsetOfHashValue (hash_idx);
-            for (uint32_t idx = hash_idx; idx < hash_end_idx; ++idx)
+            // Hash the C string
+            const uint32_t name_hash = dl_new_hash (name_cstr);
+            
+            // Find the correct bucket for the using the hash value
+            const uint32_t bucket_idx = name_hash % m_header.bucket_count;
+            
+            // Calculate the offset for the bucket entry for the bucket index
+            uint32_t offset = GetOffsetOfBucketEntry (bucket_idx);
+            
+            // Extract the bucket entry.
+            const uint32_t bucket_entry = m_data.GetU32 (&offset);
+            if (bucket_entry)
             {
-                // Extract the hash value and see if it matches our string
-                const uint32_t hash = m_data.GetU32 (&hash_offset);
-                if (hash == name_hash)
+                // The bucket entry is non-zero which means it isn't empty.
+                // The bucket entry is made up of a hash index whose bit width
+                // is m_header.hash_index_bitsize, and a hash count whose value
+                // is the remaining bits in the 32 bit value. Below we extract
+                // the hash index and the hash count
+                const uint32_t hash_idx = bucket_entry & GetHashIndexMask();
+                const uint32_t hash_count = bucket_entry >> m_header.hash_index_bitsize;
+                const uint32_t hash_end_idx = hash_idx + hash_count;
+                // Figure out the offset to the hash value by index
+                uint32_t hash_offset = GetOffsetOfHashValue (hash_idx);
+                for (uint32_t idx = hash_idx; idx < hash_end_idx; ++idx)
                 {
-                    // The hash matches, but we still need to verify that the
-                    // C string matches in case we have a hash collision. Figure
-                    // out the offset for the data associated with this hash entry
-                    offset = GetOffsetOfHashDataOffset (idx);
-                    // Extract the first 32 bit value which is the .debug_str offset
-                    // of the string we need
-                    uint32_t hash_data_offset = m_data.GetU32 (&offset);
-                    const uint32_t str_offset = m_data.GetU32 (&hash_data_offset);
-                    // Extract the C string and comapare it
-                    const char *cstr_name = m_dwarf->get_debug_str_data().PeekCStr(str_offset);
-                    if (cstr_name)
+                    // Extract the hash value and see if it matches our string
+                    const uint32_t hash = m_data.GetU32 (&hash_offset);
+                    if (hash == name_hash)
                     {
-                        if (strcmp(name_cstr, cstr_name) == 0)
+                        // The hash matches, but we still need to verify that the
+                        // C string matches in case we have a hash collision. Figure
+                        // out the offset for the data associated with this hash entry
+                        offset = GetOffsetOfHashDataOffset (idx);
+                        uint32_t hash_data_offset = m_data.GetU32 (&offset);
+                        uint32_t str_offset;
+                        // Now we have the offset to the data for all strings that match
+                        // our 32 bit hash. The format of the hash bucket is:
+                        //
+                        // uint32_t stroff;     // string offset in .debug_str table
+                        // uint32_t num_dies;   // Number of DIEs in debug info that match the string that follow this
+                        // uint32_t die_offsets[num_dies]; // An array of DIE offsets
+                        //
+                        // When a "stroff" is read and it is zero, then the data for this
+                        // hash is terminated.
+                        while ((str_offset = m_data.GetU32 (&hash_data_offset)) != 0)
                         {
-                            // We have a match, now extract the DIE count
-                            const uint32_t die_count = m_data.GetU32 (&hash_data_offset);
-                            // Now extract "die_count" DIE offsets and put them into the
-                            // results
-                            for (uint32_t die_idx = 0; die_idx < die_count; ++die_idx)
-                                die_ofsets.push_back(m_data.GetU32 (&hash_data_offset));
+                            // Extract the C string and comapare it
+                            const char *cstr_name = m_string_table.PeekCStr(str_offset);
+                            if (cstr_name)
+                            {
+                                if (strcmp(name_cstr, cstr_name) == 0)
+                                {
+                                    // We have a match, now extract the DIE count
+                                    const uint32_t die_count = m_data.GetU32 (&hash_data_offset);
+                                    // Now extract "die_count" DIE offsets and put them into the
+                                    // results
+                                    for (uint32_t die_idx = 0; die_idx < die_count; ++die_idx)
+                                        die_ofsets.push_back(m_data.GetU32 (&hash_data_offset));
+                                }
+                            }
                         }
                     }
                 }
             }
         }
+        return die_ofsets.size() - initial_size;
     }
-    return die_ofsets.size() - initial_size;
-}
-
-size_t
-HashedNameToDIE::Find (const RegularExpression& regex, DIEArray &die_ofsets) const
-{
-//    const size_t initial_info_array_size = info_array.size();
-//    collection::const_iterator pos, end = m_collection.end();
-//    for (pos = m_collection.begin(); pos != end; ++pos)
-//    {
-//        if (regex.Execute(pos->first))
-//            info_array.push_back (pos->second);
-//    }
-//    return info_array.size() - initial_info_array_size;
     return 0;
 }
 
 void
-HashedNameToDIE::Dump (Stream *s)
+HashedNameToDIE::MemoryTable::Dump (Stream &s)
 {
-//    collection::const_iterator pos, end = m_collection.end();
-//    for (pos = m_collection.begin(); pos != end; ++pos)
-//    {
-//        s->Printf("%p: 0x%8.8x 0x%8.8x \"%s\"\n", pos->first, pos->second.cu_idx, pos->second.die_idx, pos->first);
-//    }
+    if (m_header.version == 1)
+    {
+
+        bool verbose = s.GetVerbose();
+        
+        if (m_is_apple_names)
+            s.PutCString (".apple_names contents:\n");
+        else
+            s.PutCString (".apple_types contents:\n");
+        
+        m_header.Dump (s);
+        uint32_t i,j,k;
+        uint32_t empty_bucket_count = 0;
+        uint32_t hash_collisions = 0;
+        uint32_t bucket_entry_offset = GetOffsetOfBucketEntry (0);
+        for (i=0; i<m_header.bucket_count; ++i)
+        {
+            const uint32_t bucket_entry = m_data.GetU32 (&bucket_entry_offset);
+            s.Printf("bucket[%u] 0x%8.8x", i, bucket_entry);
+            if (bucket_entry)
+            {
+                const uint32_t hash_idx = bucket_entry & GetHashIndexMask();
+                const uint32_t hash_count = bucket_entry >> m_header.hash_index_bitsize;
+                
+                s.Printf(" (hash_idx = %u, hash_count = %u)\n", hash_idx, hash_count);
+                
+                const uint32_t hash_end_idx = hash_idx + hash_count;
+                uint32_t hash_offset = GetOffsetOfHashValue (hash_idx);
+                uint32_t data_offset = GetOffsetOfHashDataOffset (hash_idx);
+                
+                for (j=hash_idx; j<hash_end_idx; ++j)
+                {
+                    const uint32_t hash = m_data.GetU32 (&hash_offset);
+                    uint32_t hash_data_offset = m_data.GetU32 (&data_offset);
+                    if (verbose)
+                        s.Printf("  hash[%u] = 0x%8.8x, offset[%u] = 0x%8.8x\n", j, hash, j, hash_data_offset);
+                    else
+                        s.Printf("  hash[%u] = 0x%8.8x\n", j, hash);
+
+                    uint32_t string_idx = 0;
+                    uint32_t strp_offset;
+                    while ((strp_offset = m_data.GetU32 (&hash_data_offset)) != 0)
+                    {
+                        const uint32_t num_die_offsets = m_data.GetU32 (&hash_data_offset);
+                        s.Printf("    string[%u] = 0x%8.8x \"%s\", dies[%u] = {", 
+                                 string_idx, 
+                                 strp_offset, 
+                                 m_string_table.PeekCStr(strp_offset),
+                                 num_die_offsets);
+                        ++string_idx;
+                        
+                        for (k=0; k<num_die_offsets; ++k)
+                        {
+                            const uint32_t die_offset = m_data.GetU32 (&hash_data_offset);
+                            s.Printf(" 0x%8.8x", die_offset);
+                        }
+                        s.PutCString (" }\n");
+                    }
+                    if (string_idx > 1)
+                        ++hash_collisions;
+                }
+            }
+            else
+            {
+                s.PutCString(" (empty)\n");
+                ++empty_bucket_count;
+            }
+        }
+        
+        s.Printf ("%u of %u buckets empty (%2.1f%%)\n",  empty_bucket_count, m_header.bucket_count, (((float)empty_bucket_count/(float)m_header.bucket_count)*100.0f));
+        s.Printf ("Average hashes/non-empty bucket = %2.1f%%\n", ((float)m_header.hashes_count/(float)(m_header.bucket_count - empty_bucket_count)));
+        s.Printf ("Hash collisions = %u\n", hash_collisions);
+    }
 }
author	Greg Clayton <gclayton@apple.com>	2011-09-28 17:06:40 +0000
committer	Greg Clayton <gclayton@apple.com>	2011-09-28 17:06:40 +0000
commit	1767440a72c9e385f520c279e46d359b4030d54c (patch)
tree	c2af8d9378f2a06729b249710522cc04d538b40a /lldb/source/Plugins/SymbolFile/DWARF/HashedNameToDIE.cpp
parent	ef8e4efff8f247a0dd216e9485d321c612dac760 (diff)
download	bcm5719-llvm-1767440a72c9e385f520c279e46d359b4030d54c.tar.gz bcm5719-llvm-1767440a72c9e385f520c279e46d359b4030d54c.zip