//=-- InstrProfReader.h - Instrumented profiling readers ----------*- C++ -*-=// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file contains support for reading profiling data for instrumentation // based PGO and coverage. // //===----------------------------------------------------------------------===// #ifndef LLVM_PROFILEDATA_INSTRPROFREADER_H #define LLVM_PROFILEDATA_INSTRPROFREADER_H #include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ProfileData/InstrProf.h" #include "llvm/Support/EndianStream.h" #include "llvm/Support/LineIterator.h" #include "llvm/Support/MemoryBuffer.h" #include "llvm/Support/OnDiskHashTable.h" #include "llvm/Support/raw_ostream.h" #include namespace llvm { class InstrProfReader; /// A file format agnostic iterator over profiling data. class InstrProfIterator : public std::iterator { InstrProfReader *Reader; InstrProfRecord Record; void Increment(); public: InstrProfIterator() : Reader(nullptr) {} InstrProfIterator(InstrProfReader *Reader) : Reader(Reader) { Increment(); } InstrProfIterator &operator++() { Increment(); return *this; } bool operator==(const InstrProfIterator &RHS) { return Reader == RHS.Reader; } bool operator!=(const InstrProfIterator &RHS) { return Reader != RHS.Reader; } InstrProfRecord &operator*() { return Record; } InstrProfRecord *operator->() { return &Record; } }; /// Base class and interface for reading profiling data of any known instrprof /// format. Provides an iterator over InstrProfRecords. class InstrProfReader { instrprof_error LastError; public: InstrProfReader() : LastError(instrprof_error::success), Symtab() {} virtual ~InstrProfReader() {} /// Read the header. Required before reading first record. virtual Error readHeader() = 0; /// Read a single record. virtual Error readNextRecord(InstrProfRecord &Record) = 0; /// Iterator over profile data. InstrProfIterator begin() { return InstrProfIterator(this); } InstrProfIterator end() { return InstrProfIterator(); } virtual bool isIRLevelProfile() const = 0; /// Return the PGO symtab. There are three different readers: /// Raw, Text, and Indexed profile readers. The first two types /// of readers are used only by llvm-profdata tool, while the indexed /// profile reader is also used by llvm-cov tool and the compiler ( /// backend or frontend). Since creating PGO symtab can create /// significant runtime and memory overhead (as it touches data /// for the whole program), InstrProfSymtab for the indexed profile /// reader should be created on demand and it is recommended to be /// only used for dumping purpose with llvm-proftool, not with the /// compiler. virtual InstrProfSymtab &getSymtab() = 0; protected: std::unique_ptr Symtab; /// Set the current error and return same. Error error(instrprof_error Err) { LastError = Err; if (Err == instrprof_error::success) return Error::success(); return make_error(Err); } Error error(Error E) { return error(InstrProfError::take(std::move(E))); } /// Clear the current error and return a successful one. Error success() { return error(instrprof_error::success); } public: /// Return true if the reader has finished reading the profile data. bool isEOF() { return LastError == instrprof_error::eof; } /// Return true if the reader encountered an error reading profiling data. bool hasError() { return LastError != instrprof_error::success && !isEOF(); } /// Get the current error. Error getError() { if (hasError()) return make_error(LastError); return Error::success(); } /// Factory method to create an appropriately typed reader for the given /// instrprof file. static Expected> create(const Twine &Path); static Expected> create(std::unique_ptr Buffer); }; /// Reader for the simple text based instrprof format. /// /// This format is a simple text format that's suitable for test data. Records /// are separated by one or more blank lines, and record fields are separated by /// new lines. /// /// Each record consists of a function name, a function hash, a number of /// counters, and then each counter value, in that order. class TextInstrProfReader : public InstrProfReader { private: /// The profile data file contents. std::unique_ptr DataBuffer; /// Iterator over the profile data. line_iterator Line; bool IsIRLevelProfile; TextInstrProfReader(const TextInstrProfReader &) = delete; TextInstrProfReader &operator=(const TextInstrProfReader &) = delete; Error readValueProfileData(InstrProfRecord &Record); public: TextInstrProfReader(std::unique_ptr DataBuffer_) : DataBuffer(std::move(DataBuffer_)), Line(*DataBuffer, true, '#'), IsIRLevelProfile(false) {} /// Return true if the given buffer is in text instrprof format. static bool hasFormat(const MemoryBuffer &Buffer); bool isIRLevelProfile() const override { return IsIRLevelProfile; } /// Read the header. Error readHeader() override; /// Read a single record. Error readNextRecord(InstrProfRecord &Record) override; InstrProfSymtab &getSymtab() override { assert(Symtab.get()); return *Symtab.get(); } }; /// Reader for the raw instrprof binary format from runtime. /// /// This format is a raw memory dump of the instrumentation-baed profiling data /// from the runtime. It has no index. /// /// Templated on the unsigned type whose size matches pointers on the platform /// that wrote the profile. template class RawInstrProfReader : public InstrProfReader { private: /// The profile data file contents. std::unique_ptr DataBuffer; bool ShouldSwapBytes; // The value of the version field of the raw profile data header. The lower 56 // bits specifies the format version and the most significant 8 bits specify // the variant types of the profile. uint64_t Version; uint64_t CountersDelta; uint64_t NamesDelta; const RawInstrProf::ProfileData *Data; const RawInstrProf::ProfileData *DataEnd; const uint64_t *CountersStart; const char *NamesStart; uint64_t NamesSize; // After value profile is all read, this pointer points to // the header of next profile data (if exists) const uint8_t *ValueDataStart; uint32_t ValueKindLast; uint32_t CurValueDataSize; InstrProfRecord::ValueMapType FunctionPtrToNameMap; RawInstrProfReader(const RawInstrProfReader &) = delete; RawInstrProfReader &operator=(const RawInstrProfReader &) = delete; public: RawInstrProfReader(std::unique_ptr DataBuffer) : DataBuffer(std::move(DataBuffer)) { } static bool hasFormat(const MemoryBuffer &DataBuffer); Error readHeader() override; Error readNextRecord(InstrProfRecord &Record) override; bool isIRLevelProfile() const override { return (Version & VARIANT_MASK_IR_PROF) != 0; } InstrProfSymtab &getSymtab() override { assert(Symtab.get()); return *Symtab.get(); } private: Error createSymtab(InstrProfSymtab &Symtab); Error readNextHeader(const char *CurrentPos); Error readHeader(const RawInstrProf::Header &Header); template IntT swap(IntT Int) const { return ShouldSwapBytes ? sys::getSwappedBytes(Int) : Int; } support::endianness getDataEndianness() const { support::endianness HostEndian = getHostEndianness(); if (!ShouldSwapBytes) return HostEndian; if (HostEndian == support::little) return support::big; else return support::little; } inline uint8_t getNumPaddingBytes(uint64_t SizeInBytes) { return 7 & (sizeof(uint64_t) - SizeInBytes % sizeof(uint64_t)); } Error readName(InstrProfRecord &Record); Error readFuncHash(InstrProfRecord &Record); Error readRawCounts(InstrProfRecord &Record); Error readValueProfilingData(InstrProfRecord &Record); bool atEnd() const { return Data == DataEnd; } void advanceData() { Data++; ValueDataStart += CurValueDataSize; } const char *getNextHeaderPos() const { assert(atEnd()); return (const char *)ValueDataStart; } const uint64_t *getCounter(IntPtrT CounterPtr) const { ptrdiff_t Offset = (swap(CounterPtr) - CountersDelta) / sizeof(uint64_t); return CountersStart + Offset; } StringRef getName(uint64_t NameRef) const { return Symtab->getFuncName(swap(NameRef)); } }; typedef RawInstrProfReader RawInstrProfReader32; typedef RawInstrProfReader RawInstrProfReader64; namespace IndexedInstrProf { enum class HashT : uint32_t; } /// Trait for lookups into the on-disk hash table for the binary instrprof /// format. class InstrProfLookupTrait { std::vector DataBuffer; IndexedInstrProf::HashT HashType; unsigned FormatVersion; // Endianness of the input value profile data. // It should be LE by default, but can be changed // for testing purpose. support::endianness ValueProfDataEndianness; public: InstrProfLookupTrait(IndexedInstrProf::HashT HashType, unsigned FormatVersion) : HashType(HashType), FormatVersion(FormatVersion), ValueProfDataEndianness(support::little) {} typedef ArrayRef data_type; typedef StringRef internal_key_type; typedef StringRef external_key_type; typedef uint64_t hash_value_type; typedef uint64_t offset_type; static bool EqualKey(StringRef A, StringRef B) { return A == B; } static StringRef GetInternalKey(StringRef K) { return K; } static StringRef GetExternalKey(StringRef K) { return K; } hash_value_type ComputeHash(StringRef K); static std::pair ReadKeyDataLength(const unsigned char *&D) { using namespace support; offset_type KeyLen = endian::readNext(D); offset_type DataLen = endian::readNext(D); return std::make_pair(KeyLen, DataLen); } StringRef ReadKey(const unsigned char *D, offset_type N) { return StringRef((const char *)D, N); } bool readValueProfilingData(const unsigned char *&D, const unsigned char *const End); data_type ReadData(StringRef K, const unsigned char *D, offset_type N); // Used for testing purpose only. void setValueProfDataEndianness(support::endianness Endianness) { ValueProfDataEndianness = Endianness; } }; struct InstrProfReaderIndexBase { // Read all the profile records with the same key pointed to the current // iterator. virtual Error getRecords(ArrayRef &Data) = 0; // Read all the profile records with the key equal to FuncName virtual Error getRecords(StringRef FuncName, ArrayRef &Data) = 0; virtual void advanceToNextKey() = 0; virtual bool atEnd() const = 0; virtual void setValueProfDataEndianness(support::endianness Endianness) = 0; virtual ~InstrProfReaderIndexBase() {} virtual uint64_t getVersion() const = 0; virtual bool isIRLevelProfile() const = 0; virtual void populateSymtab(InstrProfSymtab &) = 0; }; typedef OnDiskIterableChainedHashTable OnDiskHashTableImplV3; template class InstrProfReaderIndex : public InstrProfReaderIndexBase { private: std::unique_ptr HashTable; typename HashTableImpl::data_iterator RecordIterator; uint64_t FormatVersion; public: InstrProfReaderIndex(const unsigned char *Buckets, const unsigned char *const Payload, const unsigned char *const Base, IndexedInstrProf::HashT HashType, uint64_t Version); Error getRecords(ArrayRef &Data) override; Error getRecords(StringRef FuncName, ArrayRef &Data) override; void advanceToNextKey() override { RecordIterator++; } bool atEnd() const override { return RecordIterator == HashTable->data_end(); } void setValueProfDataEndianness(support::endianness Endianness) override { HashTable->getInfoObj().setValueProfDataEndianness(Endianness); } ~InstrProfReaderIndex() override {} uint64_t getVersion() const override { return GET_VERSION(FormatVersion); } bool isIRLevelProfile() const override { return (FormatVersion & VARIANT_MASK_IR_PROF) != 0; } void populateSymtab(InstrProfSymtab &Symtab) override { Symtab.create(HashTable->keys()); } }; /// Reader for the indexed binary instrprof format. class IndexedInstrProfReader : public InstrProfReader { private: /// The profile data file contents. std::unique_ptr DataBuffer; /// The index into the profile data. std::unique_ptr Index; /// Profile summary data. std::unique_ptr Summary; IndexedInstrProfReader(const IndexedInstrProfReader &) = delete; IndexedInstrProfReader &operator=(const IndexedInstrProfReader &) = delete; // Read the profile summary. Return a pointer pointing to one byte past the // end of the summary data if it exists or the input \c Cur. const unsigned char *readSummary(IndexedInstrProf::ProfVersion Version, const unsigned char *Cur); public: /// Return the profile version. uint64_t getVersion() const { return Index->getVersion(); } bool isIRLevelProfile() const override { return Index->isIRLevelProfile(); } IndexedInstrProfReader(std::unique_ptr DataBuffer) : DataBuffer(std::move(DataBuffer)), Index(nullptr) {} /// Return true if the given buffer is in an indexed instrprof format. static bool hasFormat(const MemoryBuffer &DataBuffer); /// Read the file header. Error readHeader() override; /// Read a single record. Error readNextRecord(InstrProfRecord &Record) override; /// Return the pointer to InstrProfRecord associated with FuncName /// and FuncHash Expected getInstrProfRecord(StringRef FuncName, uint64_t FuncHash); /// Fill Counts with the profile data for the given function name. Error getFunctionCounts(StringRef FuncName, uint64_t FuncHash, std::vector &Counts); /// Return the maximum of all known function counts. uint64_t getMaximumFunctionCount() { return Summary->getMaxFunctionCount(); } /// Factory method to create an indexed reader. static Expected> create(const Twine &Path); static Expected> create(std::unique_ptr Buffer); // Used for testing purpose only. void setValueProfDataEndianness(support::endianness Endianness) { Index->setValueProfDataEndianness(Endianness); } // See description in the base class. This interface is designed // to be used by llvm-profdata (for dumping). Avoid using this when // the client is the compiler. InstrProfSymtab &getSymtab() override; ProfileSummary &getSummary() { return *(Summary.get()); } }; } // end namespace llvm #endif