1 //=-- InstrProfReader.h - Instrumented profiling readers ----------*- C++ -*-=//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file contains support for reading profiling data for instrumentation
11 // based PGO and coverage.
13 //===----------------------------------------------------------------------===//
15 #ifndef LLVM_PROFILEDATA_INSTRPROFREADER_H
16 #define LLVM_PROFILEDATA_INSTRPROFREADER_H
18 #include "llvm/ADT/ArrayRef.h"
19 #include "llvm/ADT/StringExtras.h"
20 #include "llvm/ProfileData/InstrProf.h"
21 #include "llvm/Support/EndianStream.h"
22 #include "llvm/Support/ErrorOr.h"
23 #include "llvm/Support/LineIterator.h"
24 #include "llvm/Support/MemoryBuffer.h"
25 #include "llvm/Support/OnDiskHashTable.h"
26 #include "llvm/Support/raw_ostream.h"
31 class InstrProfReader;
33 /// A file format agnostic iterator over profiling data.
34 class InstrProfIterator : public std::iterator<std::input_iterator_tag,
// NOTE(review): this listing appears to have dropped lines here: the
// std::iterator template argument list opened above is never closed, and
// Increment() is called below without a visible declaration.
// Reader that is stored by the constructors and compared by operator== and
// operator!=.
36 InstrProfReader *Reader;
// Record exposed through operator* and operator->.
37 InstrProfRecord Record;
// A default-constructed iterator holds a null Reader; InstrProfReader::end()
// returns exactly this.
41 InstrProfIterator() : Reader(nullptr) {}
// Stores Reader and immediately calls Increment().
42 InstrProfIterator(InstrProfReader *Reader) : Reader(Reader) { Increment(); }
// Pre-increment: calls Increment() and returns this iterator.
44 InstrProfIterator &operator++() { Increment(); return *this; }
// Two iterators compare equal exactly when they hold the same Reader pointer;
// the contents of Record are not compared.
// NOTE(review): neither comparison operator is const-qualified, so they
// cannot be invoked on a const InstrProfIterator.
45 bool operator==(const InstrProfIterator &RHS) { return Reader == RHS.Reader; }
46 bool operator!=(const InstrProfIterator &RHS) { return Reader != RHS.Reader; }
// Both accessors refer to the iterator's own Record member.
47 InstrProfRecord &operator*() { return Record; }
48 InstrProfRecord *operator->() { return &Record; }
51 /// Base class and interface for reading profiling data of any known instrprof
52 /// format. Provides an iterator over InstrProfRecords.
53 class InstrProfReader {
// Status inspected by isEOF(), hasError() and getError().
54 std::error_code LastError;
// NOTE(review): access specifiers are not visible in this listing, so the
// public/protected split of the members below cannot be determined from here.
// A newly constructed reader starts out with LastError set to success.
57 InstrProfReader() : LastError(instrprof_error::success) {}
// Virtual destructor; the create() factories below hand readers out as
// std::unique_ptr<InstrProfReader>.
58 virtual ~InstrProfReader() {}
60 /// Read the header. Required before reading first record.
61 virtual std::error_code readHeader() = 0;
62 /// Read a single record.
63 virtual std::error_code readNextRecord(InstrProfRecord &Record) = 0;
64 /// Iterator over profile data.
// begin() builds an InstrProfIterator bound to this reader; that constructor
// calls Increment() right away.
65 InstrProfIterator begin() { return InstrProfIterator(this); }
// end() is a default-constructed iterator, i.e. one whose Reader is null.
66 InstrProfIterator end() { return InstrProfIterator(); }
69 /// Set the current std::error_code and return same.
70 std::error_code error(std::error_code EC) {
// NOTE(review): the body of error() is not present in this listing.
75 /// Clear the current error code and return a successful one.
// Implemented by forwarding instrprof_error::success to error().
76 std::error_code success() { return error(instrprof_error::success); }
79 /// Return true if the reader has finished reading the profile data.
80 bool isEOF() { return LastError == instrprof_error::eof; }
81 /// Return true if the reader encountered an error reading profiling data.
// eof is excluded: it is reported through isEOF(), not treated as an error.
82 bool hasError() { return LastError && !isEOF(); }
83 /// Get the current error code.
84 std::error_code getError() { return LastError; }
86 /// Factory method to create an appropriately typed reader for the given
/// Path.
88 static ErrorOr<std::unique_ptr<InstrProfReader>> create(std::string Path);
// Overload of the factory that takes a MemoryBuffer (by unique_ptr) instead
// of a path.
90 static ErrorOr<std::unique_ptr<InstrProfReader>>
91 create(std::unique_ptr<MemoryBuffer> Buffer);
94 /// Reader for the simple text based instrprof format.
96 /// This format is a simple text format that's suitable for test data. Records
97 /// are separated by one or more blank lines, and record fields are separated by
/// new lines.
100 /// Each record consists of a function name, a function hash, a number of
101 /// counters, and then each counter value, in that order.
102 class TextInstrProfReader : public InstrProfReader {
104 /// The profile data file contents.
105 std::unique_ptr<MemoryBuffer> DataBuffer;
106 /// Iterator over the profile data.
// NOTE(review): the member this comment documents is missing from the
// listing; the constructor below initialises a member named Line, which is
// presumably it.
// Copying is disabled.
109 TextInstrProfReader(const TextInstrProfReader &) = delete;
110 TextInstrProfReader &operator=(const TextInstrProfReader &) = delete;
// Moves DataBuffer_ into the DataBuffer member, then constructs Line from the
// stored buffer. The initialiser order matters: Line dereferences DataBuffer,
// so DataBuffer has to be initialised first.
// NOTE(review): the `true` and '#' arguments presumably select blank-line
// skipping and '#' as the comment marker -- confirm against line_iterator.
112 TextInstrProfReader(std::unique_ptr<MemoryBuffer> DataBuffer_)
113 : DataBuffer(std::move(DataBuffer_)), Line(*DataBuffer, true, '#') {}
115 /// Return true if the given buffer is in text instrprof format.
116 static bool hasFormat(const MemoryBuffer &Buffer);
// Performs no parsing; simply reports success().
119 std::error_code readHeader() override { return success(); }
120 /// Read a single record.
121 std::error_code readNextRecord(InstrProfRecord &Record) override;
124 /// Reader for the raw instrprof binary format from runtime.
126 /// This format is a raw memory dump of the instrumentation-based profiling data
127 /// from the runtime. It has no index.
129 /// Templated on the unsigned type whose size matches pointers on the platform
130 /// that wrote the profile.
131 template <class IntPtrT>
132 class RawInstrProfReader : public InstrProfReader {
134 /// The profile data file contents.
135 std::unique_ptr<MemoryBuffer> DataBuffer;
// When true, swap() byte-swaps every value passed through it.
136 bool ShouldSwapBytes;
// Base values subtracted from the (swapped) pointer fields to turn them into
// offsets relative to CountersStart / ValueDataStart (see getCounter() and
// getValueDataCounts()).
137 uint64_t CountersDelta;
// NOTE(review): getName() uses a NamesDelta member whose declaration is not
// present in this listing.
139 uint64_t ValueDataDelta;
// Current record and one-past-the-last record; atEnd() compares the two and
// advanceData() steps Data forward.
140 const RawInstrProf::ProfileData<IntPtrT> *Data;
141 const RawInstrProf::ProfileData<IntPtrT> *DataEnd;
// Base addresses that the get*() helpers below add their computed offsets to.
142 const uint64_t *CountersStart;
143 const char *NamesStart;
144 const uint8_t *ValueDataStart;
145 const char *ProfileEnd;
146 uint32_t ValueKindLast;
148 // String table for holding a unique copy of all the strings in the profile.
149 InstrProfStringTable StringTable;
150 InstrProfRecord::ValueMapType FunctionPtrToNameMap;
// Copying is disabled.
152 RawInstrProfReader(const RawInstrProfReader &) = delete;
153 RawInstrProfReader &operator=(const RawInstrProfReader &) = delete;
// Takes ownership of the buffer. Only DataBuffer appears in the initialiser
// list and the body is empty.
// NOTE(review): presumably the remaining members are filled in by
// readHeader() -- confirm in the implementation file.
155 RawInstrProfReader(std::unique_ptr<MemoryBuffer> DataBuffer)
156 : DataBuffer(std::move(DataBuffer)) { }
158 static bool hasFormat(const MemoryBuffer &DataBuffer);
159 std::error_code readHeader() override;
160 std::error_code readNextRecord(InstrProfRecord &Record) override;
163 std::error_code readNextHeader(const char *CurrentPos);
164 std::error_code readHeader(const RawInstrProf::Header &Header);
// Returns Int byte-swapped when ShouldSwapBytes is set, otherwise unchanged.
165 template <class IntT> IntT swap(IntT Int) const {
166 return ShouldSwapBytes ? sys::getSwappedBytes(Int) : Int;
// Derives the endianness of the profile data from the host endianness and
// ShouldSwapBytes.
// NOTE(review): several lines of this body are missing from the listing;
// presumably the result is the host endianness when no swapping is needed and
// the opposite one otherwise -- confirm against the complete file.
168 support::endianness getDataEndianness() const {
169 support::endianness HostEndian = getHostEndianness();
170 if (!ShouldSwapBytes)
172 if (HostEndian == support::little)
175 return support::little;
// Number of bytes needed to round SizeInBytes up to a multiple of
// sizeof(uint64_t). The `7 &` mask turns the already-aligned case
// (8 - 0 == 8) into 0; it relies on sizeof(uint64_t) being 8.
178 inline uint8_t getNumPaddingBytes(uint64_t SizeInBytes) {
179 return 7 & (sizeof(uint64_t) - SizeInBytes % sizeof(uint64_t));
181 std::error_code readName(InstrProfRecord &Record);
182 std::error_code readFuncHash(InstrProfRecord &Record);
183 std::error_code readRawCounts(InstrProfRecord &Record);
184 std::error_code readValueProfilingData(InstrProfRecord &Record);
// True once Data has reached DataEnd.
185 bool atEnd() const { return Data == DataEnd; }
// Steps Data to the next ProfileData entry.
186 void advanceData() { Data++; }
// Translates a counter pointer field into an address relative to
// CountersStart: the value is byte-swapped if needed, rebased by
// CountersDelta and scaled from bytes to uint64_t elements.
188 const uint64_t *getCounter(IntPtrT CounterPtr) const {
189 ptrdiff_t Offset = (swap(CounterPtr) - CountersDelta) / sizeof(uint64_t);
190 return CountersStart + Offset;
// Same translation for a name pointer, relative to NamesStart.
192 const char *getName(IntPtrT NamePtr) const {
193 ptrdiff_t Offset = (swap(NamePtr) - NamesDelta) / sizeof(char);
194 return NamesStart + Offset;
// Same translation for a value-counts pointer, relative to ValueDataStart.
// NOTE(review): the line that begins the Offset statement is missing from
// this listing.
196 const uint8_t *getValueDataCounts(IntPtrT ValueCountsPtr) const {
198 (swap(ValueCountsPtr) - ValueDataDelta) / sizeof(uint8_t);
199 return ValueDataStart + Offset;
201 // This accepts an already byte-swapped ValueDataPtr argument.
// Unlike the helpers above, swap() is therefore not applied here.
202 const InstrProfValueData *getValueData(IntPtrT ValueDataPtr) const {
203 ptrdiff_t Offset = (ValueDataPtr - ValueDataDelta) / sizeof(uint8_t);
// NOTE(review): the remainder of this return statement is not present in the
// listing.
204 return reinterpret_cast<const InstrProfValueData *>(ValueDataStart +
// Instantiations of the raw reader with 32-bit and 64-bit unsigned integers as
// the IntPtrT template argument.
209 typedef RawInstrProfReader<uint32_t> RawInstrProfReader32;
210 typedef RawInstrProfReader<uint64_t> RawInstrProfReader64;
212 namespace IndexedInstrProf {
// Opaque declaration of the hash-type enum (underlying type uint32_t); the
// enumerators are not listed here.
// NOTE(review): the closing brace of this namespace is not visible in this
// listing.
213 enum class HashT : uint32_t;
216 /// Trait for lookups into the on-disk hash table for the binary instrprof
/// format.
218 class InstrProfLookupTrait {
// NOTE(review): presumably the storage that the ArrayRef returned by
// ReadData() refers to -- confirm in the implementation file.
219 std::vector<InstrProfRecord> DataBuffer;
// Hash type and format version supplied to the constructor.
220 IndexedInstrProf::HashT HashType;
221 unsigned FormatVersion;
222 // Endianness of the input value profile data.
223 // It should be LE by default, but can be changed
224 // for testing purpose.
225 support::endianness ValueProfDataEndianness;
// Pairs of (uint64_t, const char *) installed through setHashKeys().
226 std::vector<std::pair<uint64_t, const char *>> HashKeys;
// Stores the hash type and format version; the value-profile endianness
// defaults to little-endian.
229 InstrProfLookupTrait(IndexedInstrProf::HashT HashType, unsigned FormatVersion)
230 : HashType(HashType), FormatVersion(FormatVersion),
231 ValueProfDataEndianness(support::little) {}
// Type names exposed by the trait: looked-up data, key types (internal and
// external keys are both StringRef), hash value and offset/length types.
233 typedef ArrayRef<InstrProfRecord> data_type;
235 typedef StringRef internal_key_type;
236 typedef StringRef external_key_type;
237 typedef uint64_t hash_value_type;
238 typedef uint64_t offset_type;
// Keys are compared directly and need no conversion between their internal
// and external forms.
240 static bool EqualKey(StringRef A, StringRef B) { return A == B; }
241 static StringRef GetInternalKey(StringRef K) { return K; }
242 static StringRef GetExternalKey(StringRef K) { return K; }
244 hash_value_type ComputeHash(StringRef K);
// Replaces the stored HashKeys; the by-value argument is moved into place.
246 void setHashKeys(std::vector<std::pair<uint64_t, const char *>> HashKeys) {
247 this->HashKeys = std::move(HashKeys);
// Reads two little-endian, unaligned offset_type values from D -- the key
// length first, then the data length -- and returns them as a pair.
// NOTE(review): D is taken by reference; readNext presumably advances it past
// each value read -- confirm against llvm/Support/Endian.h.
249 static std::pair<offset_type, offset_type>
250 ReadKeyDataLength(const unsigned char *&D) {
251 using namespace support;
252 offset_type KeyLen = endian::readNext<offset_type, little, unaligned>(D);
253 offset_type DataLen = endian::readNext<offset_type, little, unaligned>(D);
254 return std::make_pair(KeyLen, DataLen);
// Wraps the N bytes starting at D in a StringRef.
257 StringRef ReadKey(const unsigned char *D, offset_type N) {
258 return StringRef((const char *)D, N);
261 bool readValueProfilingData(const unsigned char *&D,
262 const unsigned char *const End);
263 data_type ReadData(StringRef K, const unsigned char *D, offset_type N);
265 // Used for testing purpose only.
266 void setValueProfDataEndianness(support::endianness Endianness) {
267 ValueProfDataEndianness = Endianness;
// Abstract interface to the index of an indexed profile; every operation is
// pure virtual.
271 struct InstrProfReaderIndexBase {
272 // Read all the profile records with the same key pointed to by the current
// iterator.
274 virtual std::error_code getRecords(ArrayRef<InstrProfRecord> &Data) = 0;
275 // Read all the profile records with the key equal to FuncName
276 virtual std::error_code getRecords(StringRef FuncName,
277 ArrayRef<InstrProfRecord> &Data) = 0;
// Iteration control used together with the single-argument getRecords().
278 virtual void advanceToNextKey() = 0;
279 virtual bool atEnd() const = 0;
280 virtual void setValueProfDataEndianness(support::endianness Endianness) = 0;
281 virtual ~InstrProfReaderIndexBase() {}
// Iterable on-disk chained hash table instantiated with InstrProfLookupTrait
// as its trait type.
284 typedef OnDiskIterableChainedHashTable<InstrProfLookupTrait>
285 OnDiskHashTableImplV3;
// Implementation of InstrProfReaderIndexBase on top of a hash table type
// supplied as the HashTableImpl template parameter.
287 template <typename HashTableImpl>
288 class InstrProfReaderIndex : public InstrProfReaderIndexBase {
// The owned hash table and the iterator that walks its data entries.
291 std::unique_ptr<HashTableImpl> HashTable;
292 typename HashTableImpl::data_iterator RecordIterator;
293 uint64_t FormatVersion;
295 // String table for holding a unique copy of all the strings in the profile.
296 InstrProfStringTable StringTable;
// Defined out of line.
// NOTE(review): the parameter names suggest pointers into the on-disk table
// (buckets, payload, base) -- confirm their exact meaning in the
// implementation file.
299 InstrProfReaderIndex(const unsigned char *Buckets,
300 const unsigned char *const Payload,
301 const unsigned char *const Base,
302 IndexedInstrProf::HashT HashType, uint64_t Version);
304 std::error_code getRecords(ArrayRef<InstrProfRecord> &Data) override;
305 std::error_code getRecords(StringRef FuncName,
306 ArrayRef<InstrProfRecord> &Data) override;
// Steps RecordIterator forward by one entry.
307 void advanceToNextKey() override { RecordIterator++; }
// True once RecordIterator equals the table's data_end().
308 bool atEnd() const override {
309 return RecordIterator == HashTable->data_end();
// Forwards the setting to the hash table's info (trait) object.
311 void setValueProfDataEndianness(support::endianness Endianness) override {
312 HashTable->getInfoObj().setValueProfDataEndianness(Endianness);
314 ~InstrProfReaderIndex() override {}
317 /// Reader for the indexed binary instrprof format.
318 class IndexedInstrProfReader : public InstrProfReader {
320 /// The profile data file contents.
321 std::unique_ptr<MemoryBuffer> DataBuffer;
322 /// The index into the profile data.
323 std::unique_ptr<InstrProfReaderIndexBase> Index;
324 /// The maximal execution count among all functions.
325 uint64_t MaxFunctionCount;
// Copying is disabled.
327 IndexedInstrProfReader(const IndexedInstrProfReader &) = delete;
328 IndexedInstrProfReader &operator=(const IndexedInstrProfReader &) = delete;
// Takes ownership of the buffer and leaves Index null; MaxFunctionCount is
// not set in the initialiser list.
// NOTE(review): presumably readHeader() creates the index and sets
// MaxFunctionCount -- confirm in the implementation file.
331 IndexedInstrProfReader(std::unique_ptr<MemoryBuffer> DataBuffer)
332 : DataBuffer(std::move(DataBuffer)), Index(nullptr) {}
334 /// Return true if the given buffer is in an indexed instrprof format.
335 static bool hasFormat(const MemoryBuffer &DataBuffer);
337 /// Read the file header.
338 std::error_code readHeader() override;
339 /// Read a single record.
340 std::error_code readNextRecord(InstrProfRecord &Record) override;
342 /// Return the InstrProfRecord associated with FuncName, wrapped in ErrorOr.
344 ErrorOr<InstrProfRecord> getInstrProfRecord(StringRef FuncName,
// NOTE(review): the rest of the parameter list above is not present in this
// listing.
347 /// Fill Counts with the profile data for the given function name.
348 std::error_code getFunctionCounts(StringRef FuncName, uint64_t FuncHash,
349 std::vector<uint64_t> &Counts);
351 /// Return the maximum of all known function counts.
352 uint64_t getMaximumFunctionCount() { return MaxFunctionCount; }
354 /// Factory method to create an indexed reader.
355 static ErrorOr<std::unique_ptr<IndexedInstrProfReader>>
356 create(std::string Path);
// Overload of the factory that takes a MemoryBuffer (by unique_ptr) instead
// of a path.
358 static ErrorOr<std::unique_ptr<IndexedInstrProfReader>>
359 create(std::unique_ptr<MemoryBuffer> Buffer);
361 // Used for testing purpose only.
// Dereferences Index without a null check, while the constructor leaves Index
// null, so Index must have been populated before this is called.
362 void setValueProfDataEndianness(support::endianness Endianness) {
363 Index->setValueProfDataEndianness(Endianness);
367 } // end namespace llvm