1 //=-- InstrProfReader.h - Instrumented profiling readers ----------*- C++ -*-=//
3 // The LLVM Compiler Infrastructure
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
8 //===----------------------------------------------------------------------===//
10 // This file contains support for reading profiling data for instrumentation
11 // based PGO and coverage.
13 //===----------------------------------------------------------------------===//
15 #ifndef LLVM_PROFILEDATA_INSTRPROFREADER_H
16 #define LLVM_PROFILEDATA_INSTRPROFREADER_H
18 #include "llvm/ADT/ArrayRef.h"
19 #include "llvm/ADT/StringExtras.h"
20 #include "llvm/ProfileData/InstrProf.h"
21 #include "llvm/Support/LineIterator.h"
22 #include "llvm/Support/MemoryBuffer.h"
23 #include "llvm/Support/EndianStream.h"
24 #include "llvm/Support/OnDiskHashTable.h"
// Forward declaration: InstrProfIterator keeps an InstrProfReader pointer and
// is declared before the reader class itself is defined later in this header.
30 class InstrProfReader;
32 /// Profiling information for a single function.
33 struct InstrProfRecord {
/// Build a record from a function name, its hash and its counter values.
/// Each argument is stored directly in the member of the same name.
35 InstrProfRecord(StringRef Name, uint64_t Hash, ArrayRef<uint64_t> Counts)
36 : Name(Name), Hash(Hash), Counts(Counts) {}
/// Counter values for the function.
/// NOTE(review): ArrayRef presumably does not own its elements, so the
/// storage behind it has to outlive the record — confirm against the readers.
39 ArrayRef<uint64_t> Counts;
42 /// A file format agnostic iterator over profiling data.
///
/// The iterator keeps a pointer to the reader it pulls from together with the
/// record that operator* and operator-> expose. A default-constructed iterator
/// has a null reader.
43 class InstrProfIterator : public std::iterator<std::input_iterator_tag,
// Reader that supplies the records; null for a default-constructed iterator.
45 InstrProfReader *Reader;
// Record handed out by operator* and operator->.
46 InstrProfRecord Record;
/// Construct an iterator with no reader attached. InstrProfReader::end()
/// returns an iterator built this way.
50 InstrProfIterator() : Reader(nullptr) {}
/// Construct an iterator over \p Reader and immediately call Increment().
51 InstrProfIterator(InstrProfReader *Reader) : Reader(Reader) { Increment(); }
/// Pre-increment: call Increment() and return this iterator.
53 InstrProfIterator &operator++() { Increment(); return *this; }
54 bool operator==(const InstrProfIterator &RHS) { return Reader == RHS.Reader; }
55 bool operator!=(const InstrProfIterator &RHS) { return Reader != RHS.Reader; }
/// Access the iterator's stored record by reference.
56 InstrProfRecord &operator*() { return Record; }
/// Access the iterator's stored record by pointer.
57 InstrProfRecord *operator->() { return &Record; }
60 /// Base class and interface for reading profiling data of any known instrprof
61 /// format. Provides an iterator over InstrProfRecords.
62 class InstrProfReader {
// Status most recently recorded by the reader; the constructor sets it to
// instrprof_error::success.
63 std::error_code LastError;
/// Start out with no error recorded.
66 InstrProfReader() : LastError(instrprof_error::success) {}
/// Virtual so that concrete readers can be destroyed through this interface.
67 virtual ~InstrProfReader() {}
69 /// Read the header. Required before reading first record.
70 virtual std::error_code readHeader() = 0;
71 /// Read a single record.
72 virtual std::error_code readNextRecord(InstrProfRecord &Record) = 0;
73 /// Iterator over profile data.
/// begin() builds an iterator bound to this reader; end() builds one with no
/// reader attached.
74 InstrProfIterator begin() { return InstrProfIterator(this); }
75 InstrProfIterator end() { return InstrProfIterator(); }
78 /// Set the current std::error_code and return same.
79 std::error_code error(std::error_code EC) {
84 /// Clear the current error code and return a successful one.
/// Implemented by passing instrprof_error::success to error().
85 std::error_code success() { return error(instrprof_error::success); }
88 /// Return true if the reader has finished reading the profile data.
89 bool isEOF() { return LastError == instrprof_error::eof; }
90 /// Return true if the reader encountered an error reading profiling data.
91 bool hasError() { return LastError && !isEOF(); }
92 /// Get the current error code.
93 std::error_code getError() { return LastError; }
95 /// Factory method to create an appropriately typed reader for the given
///
/// \param Path   Identifies the profile to open (presumably a file system
///               path — confirm in the implementation).
/// \param Result Out-parameter for the reader; presumably assigned only when
///               creation succeeds — confirm in the implementation.
/// \returns A std::error_code describing the outcome.
97 static std::error_code create(std::string Path,
98 std::unique_ptr<InstrProfReader> &Result);
101 /// Reader for the simple text based instrprof format.
103 /// This format is a simple text format that's suitable for test data. Records
104 /// are separated by one or more blank lines, and record fields are separated by
107 /// Each record consists of a function name, a function hash, a number of
108 /// counters, and then each counter value, in that order.
109 class TextInstrProfReader : public InstrProfReader {
111 /// The profile data file contents.
112 std::unique_ptr<MemoryBuffer> DataBuffer;
113 /// Iterator over the profile data.
115 /// The current set of counter values.
116 std::vector<uint64_t> Counts;
// Copy construction and copy assignment are declared with
// LLVM_DELETED_FUNCTION: the reader is not meant to be copied.
118 TextInstrProfReader(const TextInstrProfReader &) LLVM_DELETED_FUNCTION;
119 TextInstrProfReader &operator=(const TextInstrProfReader &)
120 LLVM_DELETED_FUNCTION;
/// Take ownership of \p DataBuffer_ and set up Line over the owned buffer.
/// NOTE(review): the `true` and '#' arguments are presumably the
/// skip-blank-lines flag and the comment marker of the line iterator —
/// confirm against llvm/Support/LineIterator.h.
122 TextInstrProfReader(std::unique_ptr<MemoryBuffer> DataBuffer_)
123 : DataBuffer(std::move(DataBuffer_)), Line(*DataBuffer, true, '#') {}
/// Read the header. Nothing is parsed here; the call just records and
/// returns success.
126 std::error_code readHeader() override { return success(); }
127 /// Read a single record.
128 std::error_code readNextRecord(InstrProfRecord &Record) override;
131 /// Reader for the raw instrprof binary format from runtime.
133 /// This format is a raw memory dump of the instrumentation-based profiling data
134 /// from the runtime. It has no index.
136 /// Templated on the unsigned type whose size matches pointers on the platform
137 /// that wrote the profile.
138 template <class IntPtrT>
139 class RawInstrProfReader : public InstrProfReader {
141 /// The profile data file contents.
142 std::unique_ptr<MemoryBuffer> DataBuffer;
143 /// The current set of counter values.
144 std::vector<uint64_t> Counts;
// Per-function fields. NamePtr and CounterPtr have the pointer-sized type
// IntPtrT and are the kind of value getName() and getCounter() translate.
// NOTE(review): presumably these mirror the layout written by the runtime —
// confirm against the profile writer.
146 const uint32_t NameSize;
147 const uint32_t NumCounters;
148 const uint64_t FuncHash;
149 const IntPtrT NamePtr;
150 const IntPtrT CounterPtr;
// Header-level fields.
// NOTE(review): presumably a magic number, a format version, the sizes of the
// data/counters/names sections and the two address deltas — confirm against
// the profile writer.
153 const uint64_t Magic;
154 const uint64_t Version;
155 const uint64_t DataSize;
156 const uint64_t CountersSize;
157 const uint64_t NamesSize;
158 const uint64_t CountersDelta;
159 const uint64_t NamesDelta;
// Whether integers taken from the profile must be byte-swapped; consulted by
// swap().
162 bool ShouldSwapBytes;
// Value subtracted from a stored counter address in getCounter().
163 uint64_t CountersDelta;
// Positions inside the profile data. CountersStart and NamesStart are the
// bases that getCounter() and getName() add their offsets to.
// NOTE(review): Data/DataEnd presumably bound the per-function records and
// ProfileEnd presumably marks the end of the current profile — confirm in the
// implementation.
165 const ProfileData *Data;
166 const ProfileData *DataEnd;
167 const uint64_t *CountersStart;
168 const char *NamesStart;
169 const char *ProfileEnd;
// Copy construction and copy assignment are declared with
// LLVM_DELETED_FUNCTION: the reader is not meant to be copied.
171 RawInstrProfReader(const RawInstrProfReader &) LLVM_DELETED_FUNCTION;
172 RawInstrProfReader &operator=(const RawInstrProfReader &)
173 LLVM_DELETED_FUNCTION;
/// Take ownership of \p DataBuffer. No other member is set by this
/// constructor's initializer list.
175 RawInstrProfReader(std::unique_ptr<MemoryBuffer> DataBuffer)
176 : DataBuffer(std::move(DataBuffer)) { }
/// Format probe on \p DataBuffer; defined out of line.
178 static bool hasFormat(const MemoryBuffer &DataBuffer);
/// InstrProfReader interface; both are defined out of line.
179 std::error_code readHeader() override;
180 std::error_code readNextRecord(InstrProfRecord &Record) override;
// Helpers defined out of line: one takes a position in the buffer, the other
// an already located RawHeader.
183 std::error_code readNextHeader(const char *CurrentPos);
184 std::error_code readHeader(const RawHeader &Header);
/// Return \p Int byte-swapped when ShouldSwapBytes is set, unchanged
/// otherwise.
185 template <class IntT>
186 IntT swap(IntT Int) const {
187 return ShouldSwapBytes ? sys::getSwappedBytes(Int) : Int;
/// Translate a counter address as stored in the profile into a pointer into
/// the counters held by this reader: un-swap it, subtract CountersDelta, and
/// convert the byte distance into a uint64_t element index from CountersStart.
189 const uint64_t *getCounter(IntPtrT CounterPtr) const {
190 ptrdiff_t Offset = (swap(CounterPtr) - CountersDelta) / sizeof(uint64_t);
191 return CountersStart + Offset;
/// Translate a name address as stored in the profile into a pointer into the
/// names held by this reader: un-swap it, subtract NamesDelta, and use the
/// result as a char offset from NamesStart.
193 const char *getName(IntPtrT NamePtr) const {
194 ptrdiff_t Offset = (swap(NamePtr) - NamesDelta) / sizeof(char);
195 return NamesStart + Offset;
// Concrete raw readers, instantiated with a 32-bit and a 64-bit unsigned
// integer as the pointer-sized type.
199 typedef RawInstrProfReader<uint32_t> RawInstrProfReader32;
200 typedef RawInstrProfReader<uint64_t> RawInstrProfReader64;
202 namespace IndexedInstrProf {
// Opaque declaration of the hash kind enumeration (underlying type uint32_t);
// the enumerators are not declared in this header section.
203 enum class HashT : uint32_t;
206 /// Trait for lookups into the on-disk hash table for the binary instrprof
208 class InstrProfLookupTrait {
// Storage that ReadData() appends decoded values to; the data_type it returns
// refers to this buffer.
209 std::vector<uint64_t> DataBuffer;
// Hash kind supplied at construction.
// NOTE(review): presumably selects the function used by ComputeHash() —
// confirm in the implementation.
210 IndexedInstrProf::HashT HashType;
/// Remember which hash kind this trait was created for.
212 InstrProfLookupTrait(IndexedInstrProf::HashT HashType) : HashType(HashType) {}
/// Pair a name with the values stored for it.
215 data_type(StringRef Name, ArrayRef<uint64_t> Data)
216 : Name(Name), Data(Data) {}
218 ArrayRef<uint64_t> Data;
// Key, hash and offset types used by this trait. Internal and external keys
// are both StringRef.
220 typedef StringRef internal_key_type;
221 typedef StringRef external_key_type;
222 typedef uint64_t hash_value_type;
223 typedef uint64_t offset_type;
/// Keys match when the two strings compare equal.
225 static bool EqualKey(StringRef A, StringRef B) { return A == B; }
/// The internal key is the external key, returned unchanged.
226 static StringRef GetInternalKey(StringRef K) { return K; }
/// Hash \p K; defined out of line.
228 hash_value_type ComputeHash(StringRef K);
/// Read the key length followed by the data length, each as a little-endian,
/// unaligned offset_type. \p D is taken by reference so the read position can
/// move past both fields.
230 static std::pair<offset_type, offset_type>
231 ReadKeyDataLength(const unsigned char *&D) {
232 using namespace support;
233 offset_type KeyLen = endian::readNext<offset_type, little, unaligned>(D);
234 offset_type DataLen = endian::readNext<offset_type, little, unaligned>(D);
235 return std::make_pair(KeyLen, DataLen);
/// View the \p N bytes starting at \p D as a StringRef key.
238 StringRef ReadKey(const unsigned char *D, offset_type N) {
239 return StringRef((const char *)D, N);
/// Decode the \p N bytes at \p D as little-endian 64-bit values, append them
/// to DataBuffer and return them paired with key \p K. If \p N is not a
/// multiple of sizeof(uint64_t), nothing is read and the result carries an
/// empty name.
/// NOTE(review): values are appended with push_back and no reset of
/// DataBuffer is visible in this block, so this relies on the buffer being
/// empty on entry — confirm. The returned data refers to the member buffer,
/// so it is presumably only valid until the next call.
242 data_type ReadData(StringRef K, const unsigned char *D, offset_type N) {
244 if (N % sizeof(uint64_t))
245 // The data is corrupt, don't try to read it.
246 return data_type("", DataBuffer);
248 using namespace support;
249 // We just treat the data as opaque here. It's simpler to handle in
250 // IndexedInstrProfReader.
251 unsigned NumEntries = N / sizeof(uint64_t);
252 DataBuffer.reserve(NumEntries);
253 for (unsigned I = 0; I < NumEntries; ++I)
254 DataBuffer.push_back(endian::readNext<uint64_t, little, unaligned>(D));
255 return data_type(K, DataBuffer);
// The on-disk hash table type used as the profile index, parameterized with
// InstrProfLookupTrait.
258 typedef OnDiskIterableChainedHashTable<InstrProfLookupTrait>
259 InstrProfReaderIndex;
261 /// Reader for the indexed binary instrprof format.
262 class IndexedInstrProfReader : public InstrProfReader {
264 /// The profile data file contents.
265 std::unique_ptr<MemoryBuffer> DataBuffer;
266 /// The index into the profile data.
// The constructor leaves this null.
267 std::unique_ptr<InstrProfReaderIndex> Index;
268 /// Iterator over the profile data.
269 InstrProfReaderIndex::data_iterator RecordIterator;
270 /// Offset into our current data set.
// The constructor sets this to 0.
271 size_t CurrentOffset;
272 /// The file format version of the profile data.
273 uint64_t FormatVersion;
274 /// The maximal execution count among all functions.
// Returned by getMaximumFunctionCount().
275 uint64_t MaxFunctionCount;
// Copy construction and copy assignment are declared with
// LLVM_DELETED_FUNCTION: the reader is not meant to be copied.
277 IndexedInstrProfReader(const IndexedInstrProfReader &) LLVM_DELETED_FUNCTION;
278 IndexedInstrProfReader &operator=(const IndexedInstrProfReader &)
279 LLVM_DELETED_FUNCTION;
281 IndexedInstrProfReader(std::unique_ptr<MemoryBuffer> DataBuffer)
282 : DataBuffer(std::move(DataBuffer)), Index(nullptr), CurrentOffset(0) {}
284 /// Return true if the given buffer is in an indexed instrprof format.
285 static bool hasFormat(const MemoryBuffer &DataBuffer);
287 /// Read the file header.
288 std::error_code readHeader() override;
289 /// Read a single record.
290 std::error_code readNextRecord(InstrProfRecord &Record) override;
292 /// Fill Counts with the profile data for the given function name.
///
/// \param FuncName Name of the function to look up.
/// \param FuncHash Hash accompanying the name (presumably used to check that
///                 the stored record matches — confirm in the implementation).
/// \param Counts   Output vector for the counter values.
/// \returns A std::error_code describing the outcome.
293 std::error_code getFunctionCounts(StringRef FuncName, uint64_t FuncHash,
294 std::vector<uint64_t> &Counts);
295 /// Return the maximum of all known function counts.
296 uint64_t getMaximumFunctionCount() { return MaxFunctionCount; }
298 /// Factory method to create an indexed reader.
///
/// \param Path   Identifies the profile to open (presumably a file system
///               path — confirm in the implementation).
/// \param Result Out-parameter for the reader; presumably assigned only when
///               creation succeeds — confirm in the implementation.
/// \returns A std::error_code describing the outcome.
299 static std::error_code
300 create(std::string Path, std::unique_ptr<IndexedInstrProfReader> &Result);
303 } // end namespace llvm