1 //=-- SampleProf.h - Sampling profiling format support --------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file contains common definitions used in the reading and writing of
11 // sample profile data.
12 //
13 //===----------------------------------------------------------------------===//
14
15 #ifndef LLVM_PROFILEDATA_SAMPLEPROF_H_
16 #define LLVM_PROFILEDATA_SAMPLEPROF_H_
17
18 #include "llvm/ADT/SmallVector.h"
19 #include "llvm/ADT/StringMap.h"
20 #include "llvm/Support/Debug.h"
21 #include "llvm/Support/ErrorOr.h"
22 #include "llvm/Support/raw_ostream.h"
23
24 #include <map>
25 #include <system_error>
26
27 namespace llvm {
28
29 const std::error_category &sampleprof_category();
30
/// Error codes reported by the sample profile support code.
///
/// Values are turned into std::error_code objects by make_error_code(); the
/// integer carried by the resulting error_code is the enumerator's position
/// in this list, starting at 0 for `success`.
//
// NOTE(review): the per-enumerator remarks are inferred from the enumerator
// names; the authoritative messages live in the error category
// implementation, which is not visible from this header.
enum class sampleprof_error {
  success = 0,                // No error; neutral value for MergeResult().
  bad_magic,                  // Presumably: magic number mismatch.
  unsupported_version,        // Presumably: format version not handled.
  too_large,                  // Presumably: input exceeds a size limit.
  truncated,                  // Presumably: input ended prematurely.
  malformed,                  // Presumably: input could not be parsed.
  unrecognized_format,        // Presumably: unknown profile format.
  unsupported_writing_format, // Presumably: cannot emit requested format.
  truncated_name_table,       // Presumably: name table ended prematurely.
  not_implemented,            // Presumably: feature not available.
  counter_overflow            // A sample counter overflowed while accumulating.
};
44
make_error_code(sampleprof_error E)45 inline std::error_code make_error_code(sampleprof_error E) {
46 return std::error_code(static_cast<int>(E), sampleprof_category());
47 }
48
MergeResult(sampleprof_error & Accumulator,sampleprof_error Result)49 inline sampleprof_error MergeResult(sampleprof_error &Accumulator,
50 sampleprof_error Result) {
51 // Prefer first error encountered as later errors may be secondary effects of
52 // the initial problem.
53 if (Accumulator == sampleprof_error::success &&
54 Result != sampleprof_error::success)
55 Accumulator = Result;
56 return Accumulator;
57 }
58
59 } // end namespace llvm
60
61 namespace std {
62 template <>
63 struct is_error_code_enum<llvm::sampleprof_error> : std::true_type {};
64 }
65
66 namespace llvm {
67
68 namespace sampleprof {
69
/// Return the 64-bit magic number: the bytes 'S' 'P' 'R' 'O' 'F' '4' '2' 0xff
/// packed from the most significant byte down to the least significant one
/// (0x5350524F463432FF).
static inline uint64_t SPMagic() {
  const unsigned char Tag[] = {'S', 'P', 'R', 'O', 'F', '4', '2', 0xff};
  uint64_t Magic = 0;
  // Shift the previously packed bytes up and append the next one at the
  // bottom, so the first byte of Tag ends up in the top 8 bits.
  for (unsigned char Byte : Tag)
    Magic = (Magic << 8) | Byte;
  return Magic;
}
76
/// Return the version number, currently 102.
// NOTE(review): presumably the profile format version that accompanies
// SPMagic() — confirm against the reader/writer.
static inline uint64_t SPVersion() {
  const uint64_t Version = 102;
  return Version;
}
78
79 /// Represents the relative location of an instruction.
80 ///
81 /// Instruction locations are specified by the line offset from the
82 /// beginning of the function (marked by the line where the function
83 /// header is) and the discriminator value within that line.
84 ///
85 /// The discriminator value is useful to distinguish instructions
86 /// that are on the same line but belong to different basic blocks
87 /// (e.g., the two post-increment instructions in "if (p) x++; else y++;").
88 struct LineLocation {
89 LineLocation(uint32_t L, uint32_t D) : LineOffset(L), Discriminator(D) {}
90 void print(raw_ostream &OS) const;
91 void dump() const;
92 bool operator<(const LineLocation &O) const {
93 return LineOffset < O.LineOffset ||
94 (LineOffset == O.LineOffset && Discriminator < O.Discriminator);
95 }
96
97 uint32_t LineOffset;
98 uint32_t Discriminator;
99 };
100
101 raw_ostream &operator<<(raw_ostream &OS, const LineLocation &Loc);
102
103 /// Represents the relative location of a callsite.
104 ///
105 /// Callsite locations are specified by the line offset from the
106 /// beginning of the function (marked by the line where the function
/// header is), the discriminator value within that line, and the callee
108 /// function name.
109 struct CallsiteLocation : public LineLocation {
110 CallsiteLocation(uint32_t L, uint32_t D, StringRef N)
111 : LineLocation(L, D), CalleeName(N) {}
112 void print(raw_ostream &OS) const;
113 void dump() const;
114
115 StringRef CalleeName;
116 };
117
118 raw_ostream &operator<<(raw_ostream &OS, const CallsiteLocation &Loc);
119
120 /// Representation of a single sample record.
121 ///
/// A sample record is represented by a positive integer value, which
/// indicates how frequently the associated line location was executed.
124 ///
125 /// Additionally, if the associated location contains a function call,
126 /// the record will hold a list of all the possible called targets. For
127 /// direct calls, this will be the exact function being invoked. For
128 /// indirect calls (function pointers, virtual table dispatch), this
129 /// will be a list of one or more functions.
130 class SampleRecord {
131 public:
132 typedef StringMap<uint64_t> CallTargetMap;
133
134 SampleRecord() : NumSamples(0), CallTargets() {}
135
136 /// Increment the number of samples for this record by \p S.
137 /// Optionally scale sample count \p S by \p Weight.
138 ///
139 /// Sample counts accumulate using saturating arithmetic, to avoid wrapping
140 /// around unsigned integers.
141 sampleprof_error addSamples(uint64_t S, uint64_t Weight = 1) {
142 bool Overflowed;
143 if (Weight > 1) {
144 S = SaturatingMultiply(S, Weight, &Overflowed);
145 if (Overflowed)
146 return sampleprof_error::counter_overflow;
147 }
148 NumSamples = SaturatingAdd(NumSamples, S, &Overflowed);
149 if (Overflowed)
150 return sampleprof_error::counter_overflow;
151
152 return sampleprof_error::success;
153 }
154
155 /// Add called function \p F with samples \p S.
156 /// Optionally scale sample count \p S by \p Weight.
157 ///
158 /// Sample counts accumulate using saturating arithmetic, to avoid wrapping
159 /// around unsigned integers.
160 sampleprof_error addCalledTarget(StringRef F, uint64_t S,
161 uint64_t Weight = 1) {
162 uint64_t &TargetSamples = CallTargets[F];
163 bool Overflowed;
164 if (Weight > 1) {
165 S = SaturatingMultiply(S, Weight, &Overflowed);
166 if (Overflowed)
167 return sampleprof_error::counter_overflow;
168 }
169 TargetSamples = SaturatingAdd(TargetSamples, S, &Overflowed);
170 if (Overflowed)
171 return sampleprof_error::counter_overflow;
172
173 return sampleprof_error::success;
174 }
175
176 /// Return true if this sample record contains function calls.
177 bool hasCalls() const { return CallTargets.size() > 0; }
178
179 uint64_t getSamples() const { return NumSamples; }
180 const CallTargetMap &getCallTargets() const { return CallTargets; }
181
182 /// Merge the samples in \p Other into this record.
183 /// Optionally scale sample counts by \p Weight.
184 sampleprof_error merge(const SampleRecord &Other, uint64_t Weight = 1) {
185 sampleprof_error Result = addSamples(Other.getSamples(), Weight);
186 for (const auto &I : Other.getCallTargets()) {
187 MergeResult(Result, addCalledTarget(I.first(), I.second, Weight));
188 }
189 return Result;
190 }
191
192 void print(raw_ostream &OS, unsigned Indent) const;
193 void dump() const;
194
195 private:
196 uint64_t NumSamples;
197 CallTargetMap CallTargets;
198 };
199
200 raw_ostream &operator<<(raw_ostream &OS, const SampleRecord &Sample);
201
202 typedef std::map<LineLocation, SampleRecord> BodySampleMap;
203 class FunctionSamples;
204 typedef std::map<CallsiteLocation, FunctionSamples> CallsiteSampleMap;
205
206 /// Representation of the samples collected for a function.
207 ///
208 /// This data structure contains all the collected samples for the body
209 /// of a function. Each sample corresponds to a LineLocation instance
210 /// within the body of the function.
211 class FunctionSamples {
212 public:
213 FunctionSamples() : TotalSamples(0), TotalHeadSamples(0) {}
214 void print(raw_ostream &OS = dbgs(), unsigned Indent = 0) const;
215 void dump() const;
216 sampleprof_error addTotalSamples(uint64_t Num, uint64_t Weight = 1) {
217 bool Overflowed;
218 if (Weight > 1) {
219 Num = SaturatingMultiply(Num, Weight, &Overflowed);
220 if (Overflowed)
221 return sampleprof_error::counter_overflow;
222 }
223 TotalSamples = SaturatingAdd(TotalSamples, Num, &Overflowed);
224 if (Overflowed)
225 return sampleprof_error::counter_overflow;
226
227 return sampleprof_error::success;
228 }
229 sampleprof_error addHeadSamples(uint64_t Num, uint64_t Weight = 1) {
230 bool Overflowed;
231 if (Weight > 1) {
232 Num = SaturatingMultiply(Num, Weight, &Overflowed);
233 if (Overflowed)
234 return sampleprof_error::counter_overflow;
235 }
236 TotalHeadSamples = SaturatingAdd(TotalHeadSamples, Num, &Overflowed);
237 if (Overflowed)
238 return sampleprof_error::counter_overflow;
239
240 return sampleprof_error::success;
241 }
242 sampleprof_error addBodySamples(uint32_t LineOffset, uint32_t Discriminator,
243 uint64_t Num, uint64_t Weight = 1) {
244 return BodySamples[LineLocation(LineOffset, Discriminator)].addSamples(
245 Num, Weight);
246 }
247 sampleprof_error addCalledTargetSamples(uint32_t LineOffset,
248 uint32_t Discriminator,
249 std::string FName, uint64_t Num,
250 uint64_t Weight = 1) {
251 return BodySamples[LineLocation(LineOffset, Discriminator)].addCalledTarget(
252 FName, Num, Weight);
253 }
254
255 /// Return the number of samples collected at the given location.
256 /// Each location is specified by \p LineOffset and \p Discriminator.
257 /// If the location is not found in profile, return error.
258 ErrorOr<uint64_t> findSamplesAt(uint32_t LineOffset,
259 uint32_t Discriminator) const {
260 const auto &ret = BodySamples.find(LineLocation(LineOffset, Discriminator));
261 if (ret == BodySamples.end())
262 return std::error_code();
263 else
264 return ret->second.getSamples();
265 }
266
267 /// Return the function samples at the given callsite location.
268 FunctionSamples &functionSamplesAt(const CallsiteLocation &Loc) {
269 return CallsiteSamples[Loc];
270 }
271
272 /// Return a pointer to function samples at the given callsite location.
273 const FunctionSamples *
274 findFunctionSamplesAt(const CallsiteLocation &Loc) const {
275 auto iter = CallsiteSamples.find(Loc);
276 if (iter == CallsiteSamples.end()) {
277 return nullptr;
278 } else {
279 return &iter->second;
280 }
281 }
282
283 bool empty() const { return TotalSamples == 0; }
284
285 /// Return the total number of samples collected inside the function.
286 uint64_t getTotalSamples() const { return TotalSamples; }
287
288 /// Return the total number of samples collected at the head of the
289 /// function.
290 uint64_t getHeadSamples() const { return TotalHeadSamples; }
291
292 /// Return all the samples collected in the body of the function.
293 const BodySampleMap &getBodySamples() const { return BodySamples; }
294
295 /// Return all the callsite samples collected in the body of the function.
296 const CallsiteSampleMap &getCallsiteSamples() const {
297 return CallsiteSamples;
298 }
299
300 /// Merge the samples in \p Other into this one.
301 /// Optionally scale samples by \p Weight.
302 sampleprof_error merge(const FunctionSamples &Other, uint64_t Weight = 1) {
303 sampleprof_error Result = sampleprof_error::success;
304 MergeResult(Result, addTotalSamples(Other.getTotalSamples(), Weight));
305 MergeResult(Result, addHeadSamples(Other.getHeadSamples(), Weight));
306 for (const auto &I : Other.getBodySamples()) {
307 const LineLocation &Loc = I.first;
308 const SampleRecord &Rec = I.second;
309 MergeResult(Result, BodySamples[Loc].merge(Rec, Weight));
310 }
311 for (const auto &I : Other.getCallsiteSamples()) {
312 const CallsiteLocation &Loc = I.first;
313 const FunctionSamples &Rec = I.second;
314 MergeResult(Result, functionSamplesAt(Loc).merge(Rec, Weight));
315 }
316 return Result;
317 }
318
319 private:
320 /// Total number of samples collected inside this function.
321 ///
322 /// Samples are cumulative, they include all the samples collected
323 /// inside this function and all its inlined callees.
324 uint64_t TotalSamples;
325
326 /// Total number of samples collected at the head of the function.
327 /// This is an approximation of the number of calls made to this function
328 /// at runtime.
329 uint64_t TotalHeadSamples;
330
331 /// Map instruction locations to collected samples.
332 ///
333 /// Each entry in this map contains the number of samples
334 /// collected at the corresponding line offset. All line locations
335 /// are an offset from the start of the function.
336 BodySampleMap BodySamples;
337
338 /// Map call sites to collected samples for the called function.
339 ///
340 /// Each entry in this map corresponds to all the samples
341 /// collected for the inlined function call at the given
342 /// location. For example, given:
343 ///
344 /// void foo() {
345 /// 1 bar();
346 /// ...
347 /// 8 baz();
348 /// }
349 ///
350 /// If the bar() and baz() calls were inlined inside foo(), this
351 /// map will contain two entries. One for all the samples collected
352 /// in the call to bar() at line offset 1, the other for all the samples
353 /// collected in the call to baz() at line offset 8.
354 CallsiteSampleMap CallsiteSamples;
355 };
356
357 raw_ostream &operator<<(raw_ostream &OS, const FunctionSamples &FS);
358
359 /// Sort a LocationT->SampleT map by LocationT.
360 ///
361 /// It produces a sorted list of <LocationT, SampleT> records by ascending
362 /// order of LocationT.
363 template <class LocationT, class SampleT> class SampleSorter {
364 public:
365 typedef std::pair<const LocationT, SampleT> SamplesWithLoc;
366 typedef SmallVector<const SamplesWithLoc *, 20> SamplesWithLocList;
367
368 SampleSorter(const std::map<LocationT, SampleT> &Samples) {
369 for (const auto &I : Samples)
370 V.push_back(&I);
371 std::stable_sort(V.begin(), V.end(),
372 [](const SamplesWithLoc *A, const SamplesWithLoc *B) {
373 return A->first < B->first;
374 });
375 }
376 const SamplesWithLocList &get() const { return V; }
377
378 private:
379 SamplesWithLocList V;
380 };
381
382 } // end namespace sampleprof
383
384 } // end namespace llvm
385
386 #endif // LLVM_PROFILEDATA_SAMPLEPROF_H_
387