//=-- InstrProfWriter.cpp - Instrumented profiling writer -------------------=// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file contains support for writing profiling data for clang's // instrumentation based PGO and coverage. // //===----------------------------------------------------------------------===// #include "llvm/ProfileData/InstrProfWriter.h" #include "InstrProfIndexed.h" #include "llvm/ADT/StringExtras.h" #include "llvm/Support/EndianStream.h" #include "llvm/Support/OnDiskHashTable.h" using namespace llvm; namespace { class InstrProfRecordTrait { public: typedef StringRef key_type; typedef StringRef key_type_ref; typedef const InstrProfWriter::ProfilingData *const data_type; typedef const InstrProfWriter::ProfilingData *const data_type_ref; typedef uint64_t hash_value_type; typedef uint64_t offset_type; static hash_value_type ComputeHash(key_type_ref K) { return IndexedInstrProf::ComputeHash(IndexedInstrProf::HashType, K); } static std::pair EmitKeyDataLength(raw_ostream &Out, key_type_ref K, data_type_ref V) { using namespace llvm::support; endian::Writer LE(Out); offset_type N = K.size(); LE.write(N); offset_type M = 0; for (const auto &ProfileData : *V) { M += sizeof(uint64_t); // The function hash M += sizeof(uint64_t); // The size of the Counts vector M += ProfileData.second.Counts.size() * sizeof(uint64_t); // Value data M += sizeof(uint64_t); // Number of value kinds with value sites. for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) { const std::vector &ValueSites = ProfileData.second.getValueSitesForKind(Kind); if (ValueSites.empty()) continue; M += sizeof(uint64_t); // Value kind M += sizeof(uint64_t); // The number of value sites for given value kind for (InstrProfValueSiteRecord I : ValueSites) { M += sizeof(uint64_t); // Number of value data pairs at a value site M += 2 * sizeof(uint64_t) * I.ValueData.size(); // Value data pairs } } } LE.write(M); return std::make_pair(N, M); } static void EmitKey(raw_ostream &Out, key_type_ref K, offset_type N){ Out.write(K.data(), N); } static void EmitData(raw_ostream &Out, key_type_ref, data_type_ref V, offset_type) { using namespace llvm::support; endian::Writer LE(Out); for (const auto &ProfileData : *V) { LE.write(ProfileData.first); // Function hash LE.write(ProfileData.second.Counts.size()); for (uint64_t I : ProfileData.second.Counts) LE.write(I); // Compute the number of value kinds with value sites. uint64_t NumValueKinds = 0; for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) NumValueKinds += !(ProfileData.second.getValueSitesForKind(Kind).empty()); LE.write(NumValueKinds); // Write value data for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) { const std::vector &ValueSites = ProfileData.second.getValueSitesForKind(Kind); if (ValueSites.empty()) continue; LE.write(Kind); // Write value kind // Write number of value sites for current value kind LE.write(ValueSites.size()); for (InstrProfValueSiteRecord I : ValueSites) { // Write number of value data pairs at this value site LE.write(I.ValueData.size()); for (auto V : I.ValueData) { if (Kind == IPVK_IndirectCallTarget) LE.write(ComputeHash((const char *)V.first)); else LE.write(V.first); LE.write(V.second); } } } } } }; } static std::error_code combineInstrProfRecords(InstrProfRecord &Dest, InstrProfRecord &Source, uint64_t &MaxFunctionCount) { // If the number of counters doesn't match we either have bad data // or a hash collision. if (Dest.Counts.size() != Source.Counts.size()) return instrprof_error::count_mismatch; for (size_t I = 0, E = Source.Counts.size(); I < E; ++I) { if (Dest.Counts[I] + Source.Counts[I] < Dest.Counts[I]) return instrprof_error::counter_overflow; Dest.Counts[I] += Source.Counts[I]; } for (uint32_t Kind = IPVK_First; Kind <= IPVK_Last; ++Kind) { std::vector &SourceValueSites = Source.getValueSitesForKind(Kind); if (SourceValueSites.empty()) continue; std::vector &DestValueSites = Dest.getValueSitesForKind(Kind); if (DestValueSites.empty()) { DestValueSites.swap(SourceValueSites); continue; } if (DestValueSites.size() != SourceValueSites.size()) return instrprof_error::value_site_count_mismatch; for (size_t I = 0, E = SourceValueSites.size(); I < E; ++I) DestValueSites[I].mergeValueData(SourceValueSites[I]); } // We keep track of the max function count as we go for simplicity. if (Dest.Counts[0] > MaxFunctionCount) MaxFunctionCount = Dest.Counts[0]; return instrprof_error::success; } void InstrProfWriter::updateStringTableReferences(InstrProfRecord &I) { I.Name = StringTable.insertString(I.Name); for (auto &VSite : I.IndirectCallSites) for (auto &VData : VSite.ValueData) VData.first = (uint64_t)StringTable.insertString((const char *)VData.first); } std::error_code InstrProfWriter::addRecord(InstrProfRecord &&I) { updateStringTableReferences(I); auto &ProfileDataMap = FunctionData[I.Name]; auto Where = ProfileDataMap.find(I.Hash); if (Where == ProfileDataMap.end()) { // We've never seen a function with this name and hash, add it. ProfileDataMap[I.Hash] = I; // We keep track of the max function count as we go for simplicity. if (I.Counts[0] > MaxFunctionCount) MaxFunctionCount = I.Counts[0]; return instrprof_error::success; } // We're updating a function we've seen before. return combineInstrProfRecords(Where->second, I, MaxFunctionCount); } std::pair InstrProfWriter::writeImpl(raw_ostream &OS) { OnDiskChainedHashTableGenerator Generator; // Populate the hash table generator. for (const auto &I : FunctionData) Generator.insert(I.getKey(), &I.getValue()); using namespace llvm::support; endian::Writer LE(OS); // Write the header. LE.write(IndexedInstrProf::Magic); LE.write(IndexedInstrProf::Version); LE.write(MaxFunctionCount); LE.write(static_cast(IndexedInstrProf::HashType)); // Save a space to write the hash table start location. uint64_t HashTableStartLoc = OS.tell(); LE.write(0); // Write the hash table. uint64_t HashTableStart = Generator.Emit(OS); return std::make_pair(HashTableStartLoc, HashTableStart); } void InstrProfWriter::write(raw_fd_ostream &OS) { // Write the hash table. auto TableStart = writeImpl(OS); // Go back and fill in the hash table start. using namespace support; OS.seek(TableStart.first); endian::Writer(OS).write(TableStart.second); } std::unique_ptr InstrProfWriter::writeBuffer() { std::string Data; llvm::raw_string_ostream OS(Data); // Write the hash table. auto TableStart = writeImpl(OS); OS.flush(); // Go back and fill in the hash table start. using namespace support; uint64_t Bytes = endian::byte_swap(TableStart.second); Data.replace(TableStart.first, sizeof(uint64_t), (const char *)&Bytes, sizeof(uint64_t)); // Return this in an aligned memory buffer. return MemoryBuffer::getMemBufferCopy(Data); }