1 //===- ProfileEstimatorPass.cpp - LLVM Pass to estimate profile info ------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements a concrete implementation of profiling information that
11 // estimates the profiling information in a very crude and unimaginative way.
12 //
13 //===----------------------------------------------------------------------===//
14 #define DEBUG_TYPE "profile-estimator"
15 #include "llvm/Pass.h"
16 #include "llvm/Analysis/Passes.h"
17 #include "llvm/Analysis/ProfileInfo.h"
18 #include "llvm/Analysis/LoopInfo.h"
19 #include "llvm/Support/CommandLine.h"
20 #include "llvm/Support/Debug.h"
21 #include "llvm/Support/raw_ostream.h"
22 #include "llvm/Support/Format.h"
23 using namespace llvm;
24
25 static cl::opt<double>
26 LoopWeight(
27 "profile-estimator-loop-weight", cl::init(10),
28 cl::value_desc("loop-weight"),
29 cl::desc("Number of loop executions used for profile-estimator")
30 );
31
32 namespace {
33 class ProfileEstimatorPass : public FunctionPass, public ProfileInfo {
34 double ExecCount;
35 LoopInfo *LI;
36 std::set<BasicBlock*> BBToVisit;
37 std::map<Loop*,double> LoopExitWeights;
38 std::map<Edge,double> MinimalWeight;
39 public:
40 static char ID; // Class identification, replacement for typeinfo
ProfileEstimatorPass(const double execcount=0)41 explicit ProfileEstimatorPass(const double execcount = 0)
42 : FunctionPass(ID), ExecCount(execcount) {
43 initializeProfileEstimatorPassPass(*PassRegistry::getPassRegistry());
44 if (execcount == 0) ExecCount = LoopWeight;
45 }
46
getAnalysisUsage(AnalysisUsage & AU) const47 virtual void getAnalysisUsage(AnalysisUsage &AU) const {
48 AU.setPreservesAll();
49 AU.addRequired<LoopInfo>();
50 }
51
getPassName() const52 virtual const char *getPassName() const {
53 return "Profiling information estimator";
54 }
55
56 /// run - Estimate the profile information from the specified file.
57 virtual bool runOnFunction(Function &F);
58
59 /// getAdjustedAnalysisPointer - This method is used when a pass implements
60 /// an analysis interface through multiple inheritance. If needed, it
61 /// should override this to adjust the this pointer as needed for the
62 /// specified pass info.
getAdjustedAnalysisPointer(AnalysisID PI)63 virtual void *getAdjustedAnalysisPointer(AnalysisID PI) {
64 if (PI == &ProfileInfo::ID)
65 return (ProfileInfo*)this;
66 return this;
67 }
68
69 virtual void recurseBasicBlock(BasicBlock *BB);
70
71 void inline printEdgeWeight(Edge);
72 };
73 } // End of anonymous namespace
74
75 char ProfileEstimatorPass::ID = 0;
76 INITIALIZE_AG_PASS_BEGIN(ProfileEstimatorPass, ProfileInfo, "profile-estimator",
77 "Estimate profiling information", false, true, false)
78 INITIALIZE_PASS_DEPENDENCY(LoopInfo)
79 INITIALIZE_AG_PASS_END(ProfileEstimatorPass, ProfileInfo, "profile-estimator",
80 "Estimate profiling information", false, true, false)
81
82 namespace llvm {
83 char &ProfileEstimatorPassID = ProfileEstimatorPass::ID;
84
createProfileEstimatorPass()85 FunctionPass *createProfileEstimatorPass() {
86 return new ProfileEstimatorPass();
87 }
88
89 /// createProfileEstimatorPass - This function returns a Pass that estimates
90 /// profiling information using the given loop execution count.
createProfileEstimatorPass(const unsigned execcount)91 Pass *createProfileEstimatorPass(const unsigned execcount) {
92 return new ProfileEstimatorPass(execcount);
93 }
94 }
95
ignoreMissing(double w)96 static double ignoreMissing(double w) {
97 if (w == ProfileInfo::MissingValue) return 0;
98 return w;
99 }
100
printEdgeError(ProfileInfo::Edge e,const char * M)101 static void inline printEdgeError(ProfileInfo::Edge e, const char *M) {
102 DEBUG(dbgs() << "-- Edge " << e << " is not calculated, " << M << "\n");
103 }
104
printEdgeWeight(Edge E)105 void inline ProfileEstimatorPass::printEdgeWeight(Edge E) {
106 DEBUG(dbgs() << "-- Weight of Edge " << E << ":"
107 << format("%20.20g", getEdgeWeight(E)) << "\n");
108 }
109
110 // recurseBasicBlock() - This calculates the ProfileInfo estimation for a
111 // single block and then recurses into the successors.
112 // The algorithm preserves the flow condition, meaning that the sum of the
113 // weight of the incoming edges must be equal the block weight which must in
114 // turn be equal to the sume of the weights of the outgoing edges.
115 // Since the flow of an block is deterimined from the current state of the
116 // flow, once an edge has a flow assigned this flow is never changed again,
117 // otherwise it would be possible to violate the flow condition in another
118 // block.
recurseBasicBlock(BasicBlock * BB)119 void ProfileEstimatorPass::recurseBasicBlock(BasicBlock *BB) {
120
121 // Break the recursion if this BasicBlock was already visited.
122 if (BBToVisit.find(BB) == BBToVisit.end()) return;
123
124 // Read the LoopInfo for this block.
125 bool BBisHeader = LI->isLoopHeader(BB);
126 Loop* BBLoop = LI->getLoopFor(BB);
127
128 // To get the block weight, read all incoming edges.
129 double BBWeight = 0;
130 std::set<BasicBlock*> ProcessedPreds;
131 for ( pred_iterator bbi = pred_begin(BB), bbe = pred_end(BB);
132 bbi != bbe; ++bbi ) {
133 // If this block was not considered already, add weight.
134 Edge edge = getEdge(*bbi,BB);
135 double w = getEdgeWeight(edge);
136 if (ProcessedPreds.insert(*bbi).second) {
137 BBWeight += ignoreMissing(w);
138 }
139 // If this block is a loop header and the predecessor is contained in this
140 // loop, thus the edge is a backedge, continue and do not check if the
141 // value is valid.
142 if (BBisHeader && BBLoop->contains(*bbi)) {
143 printEdgeError(edge, "but is backedge, continuing");
144 continue;
145 }
146 // If the edges value is missing (and this is no loop header, and this is
147 // no backedge) return, this block is currently non estimatable.
148 if (w == MissingValue) {
149 printEdgeError(edge, "returning");
150 return;
151 }
152 }
153 if (getExecutionCount(BB) != MissingValue) {
154 BBWeight = getExecutionCount(BB);
155 }
156
157 // Fetch all necessary information for current block.
158 SmallVector<Edge, 8> ExitEdges;
159 SmallVector<Edge, 8> Edges;
160 if (BBLoop) {
161 BBLoop->getExitEdges(ExitEdges);
162 }
163
164 // If this is a loop header, consider the following:
165 // Exactly the flow that is entering this block, must exit this block too. So
166 // do the following:
167 // *) get all the exit edges, read the flow that is already leaving this
168 // loop, remember the edges that do not have any flow on them right now.
169 // (The edges that have already flow on them are most likely exiting edges of
170 // other loops, do not touch those flows because the previously caclulated
171 // loopheaders would not be exact anymore.)
172 // *) In case there is not a single exiting edge left, create one at the loop
173 // latch to prevent the flow from building up in the loop.
174 // *) Take the flow that is not leaving the loop already and distribute it on
175 // the remaining exiting edges.
176 // (This ensures that all flow that enters the loop also leaves it.)
177 // *) Increase the flow into the loop by increasing the weight of this block.
178 // There is at least one incoming backedge that will bring us this flow later
179 // on. (So that the flow condition in this node is valid again.)
180 if (BBisHeader) {
181 double incoming = BBWeight;
182 // Subtract the flow leaving the loop.
183 std::set<Edge> ProcessedExits;
184 for (SmallVector<Edge, 8>::iterator ei = ExitEdges.begin(),
185 ee = ExitEdges.end(); ei != ee; ++ei) {
186 if (ProcessedExits.insert(*ei).second) {
187 double w = getEdgeWeight(*ei);
188 if (w == MissingValue) {
189 Edges.push_back(*ei);
190 // Check if there is a necessary minimal weight, if yes, subtract it
191 // from weight.
192 if (MinimalWeight.find(*ei) != MinimalWeight.end()) {
193 incoming -= MinimalWeight[*ei];
194 DEBUG(dbgs() << "Reserving " << format("%.20g",MinimalWeight[*ei]) << " at " << (*ei) << "\n");
195 }
196 } else {
197 incoming -= w;
198 }
199 }
200 }
201 // If no exit edges, create one:
202 if (Edges.size() == 0) {
203 BasicBlock *Latch = BBLoop->getLoopLatch();
204 if (Latch) {
205 Edge edge = getEdge(Latch,0);
206 EdgeInformation[BB->getParent()][edge] = BBWeight;
207 printEdgeWeight(edge);
208 edge = getEdge(Latch, BB);
209 EdgeInformation[BB->getParent()][edge] = BBWeight * ExecCount;
210 printEdgeWeight(edge);
211 }
212 }
213
214 // Distribute remaining weight to the exting edges. To prevent fractions
215 // from building up and provoking precision problems the weight which is to
216 // be distributed is split and the rounded, the last edge gets a somewhat
217 // bigger value, but we are close enough for an estimation.
218 double fraction = floor(incoming/Edges.size());
219 for (SmallVector<Edge, 8>::iterator ei = Edges.begin(), ee = Edges.end();
220 ei != ee; ++ei) {
221 double w = 0;
222 if (ei != (ee-1)) {
223 w = fraction;
224 incoming -= fraction;
225 } else {
226 w = incoming;
227 }
228 EdgeInformation[BB->getParent()][*ei] += w;
229 // Read necessary minimal weight.
230 if (MinimalWeight.find(*ei) != MinimalWeight.end()) {
231 EdgeInformation[BB->getParent()][*ei] += MinimalWeight[*ei];
232 DEBUG(dbgs() << "Additionally " << format("%.20g",MinimalWeight[*ei]) << " at " << (*ei) << "\n");
233 }
234 printEdgeWeight(*ei);
235
236 // Add minimal weight to paths to all exit edges, this is used to ensure
237 // that enough flow is reaching this edges.
238 Path p;
239 const BasicBlock *Dest = GetPath(BB, (*ei).first, p, GetPathToDest);
240 while (Dest != BB) {
241 const BasicBlock *Parent = p.find(Dest)->second;
242 Edge e = getEdge(Parent, Dest);
243 if (MinimalWeight.find(e) == MinimalWeight.end()) {
244 MinimalWeight[e] = 0;
245 }
246 MinimalWeight[e] += w;
247 DEBUG(dbgs() << "Minimal Weight for " << e << ": " << format("%.20g",MinimalWeight[e]) << "\n");
248 Dest = Parent;
249 }
250 }
251 // Increase flow into the loop.
252 BBWeight *= (ExecCount+1);
253 }
254
255 BlockInformation[BB->getParent()][BB] = BBWeight;
256 // Up until now we considered only the loop exiting edges, now we have a
257 // definite block weight and must distribute this onto the outgoing edges.
258 // Since there may be already flow attached to some of the edges, read this
259 // flow first and remember the edges that have still now flow attached.
260 Edges.clear();
261 std::set<BasicBlock*> ProcessedSuccs;
262
263 succ_iterator bbi = succ_begin(BB), bbe = succ_end(BB);
264 // Also check for (BB,0) edges that may already contain some flow. (But only
265 // in case there are no successors.)
266 if (bbi == bbe) {
267 Edge edge = getEdge(BB,0);
268 EdgeInformation[BB->getParent()][edge] = BBWeight;
269 printEdgeWeight(edge);
270 }
271 for ( ; bbi != bbe; ++bbi ) {
272 if (ProcessedSuccs.insert(*bbi).second) {
273 Edge edge = getEdge(BB,*bbi);
274 double w = getEdgeWeight(edge);
275 if (w != MissingValue) {
276 BBWeight -= getEdgeWeight(edge);
277 } else {
278 Edges.push_back(edge);
279 // If minimal weight is necessary, reserve weight by subtracting weight
280 // from block weight, this is readded later on.
281 if (MinimalWeight.find(edge) != MinimalWeight.end()) {
282 BBWeight -= MinimalWeight[edge];
283 DEBUG(dbgs() << "Reserving " << format("%.20g",MinimalWeight[edge]) << " at " << edge << "\n");
284 }
285 }
286 }
287 }
288
289 double fraction = floor(BBWeight/Edges.size());
290 // Finally we know what flow is still not leaving the block, distribute this
291 // flow onto the empty edges.
292 for (SmallVector<Edge, 8>::iterator ei = Edges.begin(), ee = Edges.end();
293 ei != ee; ++ei) {
294 if (ei != (ee-1)) {
295 EdgeInformation[BB->getParent()][*ei] += fraction;
296 BBWeight -= fraction;
297 } else {
298 EdgeInformation[BB->getParent()][*ei] += BBWeight;
299 }
300 // Readd minial necessary weight.
301 if (MinimalWeight.find(*ei) != MinimalWeight.end()) {
302 EdgeInformation[BB->getParent()][*ei] += MinimalWeight[*ei];
303 DEBUG(dbgs() << "Additionally " << format("%.20g",MinimalWeight[*ei]) << " at " << (*ei) << "\n");
304 }
305 printEdgeWeight(*ei);
306 }
307
308 // This block is visited, mark this before the recursion.
309 BBToVisit.erase(BB);
310
311 // Recurse into successors.
312 for (succ_iterator bbi = succ_begin(BB), bbe = succ_end(BB);
313 bbi != bbe; ++bbi) {
314 recurseBasicBlock(*bbi);
315 }
316 }
317
runOnFunction(Function & F)318 bool ProfileEstimatorPass::runOnFunction(Function &F) {
319 if (F.isDeclaration()) return false;
320
321 // Fetch LoopInfo and clear ProfileInfo for this function.
322 LI = &getAnalysis<LoopInfo>();
323 FunctionInformation.erase(&F);
324 BlockInformation[&F].clear();
325 EdgeInformation[&F].clear();
326 BBToVisit.clear();
327
328 // Mark all blocks as to visit.
329 for (Function::iterator bi = F.begin(), be = F.end(); bi != be; ++bi)
330 BBToVisit.insert(bi);
331
332 // Clear Minimal Edges.
333 MinimalWeight.clear();
334
335 DEBUG(dbgs() << "Working on function " << F.getNameStr() << "\n");
336
337 // Since the entry block is the first one and has no predecessors, the edge
338 // (0,entry) is inserted with the starting weight of 1.
339 BasicBlock *entry = &F.getEntryBlock();
340 BlockInformation[&F][entry] = pow(2.0, 32.0);
341 Edge edge = getEdge(0,entry);
342 EdgeInformation[&F][edge] = BlockInformation[&F][entry];
343 printEdgeWeight(edge);
344
345 // Since recurseBasicBlock() maybe returns with a block which was not fully
346 // estimated, use recurseBasicBlock() until everything is calculated.
347 bool cleanup = false;
348 recurseBasicBlock(entry);
349 while (BBToVisit.size() > 0 && !cleanup) {
350 // Remember number of open blocks, this is later used to check if progress
351 // was made.
352 unsigned size = BBToVisit.size();
353
354 // Try to calculate all blocks in turn.
355 for (std::set<BasicBlock*>::iterator bi = BBToVisit.begin(),
356 be = BBToVisit.end(); bi != be; ++bi) {
357 recurseBasicBlock(*bi);
358 // If at least one block was finished, break because iterator may be
359 // invalid.
360 if (BBToVisit.size() < size) break;
361 }
362
363 // If there was not a single block resolved, make some assumptions.
364 if (BBToVisit.size() == size) {
365 bool found = false;
366 for (std::set<BasicBlock*>::iterator BBI = BBToVisit.begin(), BBE = BBToVisit.end();
367 (BBI != BBE) && (!found); ++BBI) {
368 BasicBlock *BB = *BBI;
369 // Try each predecessor if it can be assumend.
370 for (pred_iterator bbi = pred_begin(BB), bbe = pred_end(BB);
371 (bbi != bbe) && (!found); ++bbi) {
372 Edge e = getEdge(*bbi,BB);
373 double w = getEdgeWeight(e);
374 // Check that edge from predecessor is still free.
375 if (w == MissingValue) {
376 // Check if there is a circle from this block to predecessor.
377 Path P;
378 const BasicBlock *Dest = GetPath(BB, *bbi, P, GetPathToDest);
379 if (Dest != *bbi) {
380 // If there is no circle, just set edge weight to 0
381 EdgeInformation[&F][e] = 0;
382 DEBUG(dbgs() << "Assuming edge weight: ");
383 printEdgeWeight(e);
384 found = true;
385 }
386 }
387 }
388 }
389 if (!found) {
390 cleanup = true;
391 DEBUG(dbgs() << "No assumption possible in Fuction "<<F.getName()<<", setting all to zero\n");
392 }
393 }
394 }
395 // In case there was no safe way to assume edges, set as a last measure,
396 // set _everything_ to zero.
397 if (cleanup) {
398 FunctionInformation[&F] = 0;
399 BlockInformation[&F].clear();
400 EdgeInformation[&F].clear();
401 for (Function::const_iterator FI = F.begin(), FE = F.end(); FI != FE; ++FI) {
402 const BasicBlock *BB = &(*FI);
403 BlockInformation[&F][BB] = 0;
404 const_pred_iterator predi = pred_begin(BB), prede = pred_end(BB);
405 if (predi == prede) {
406 Edge e = getEdge(0,BB);
407 setEdgeWeight(e,0);
408 }
409 for (;predi != prede; ++predi) {
410 Edge e = getEdge(*predi,BB);
411 setEdgeWeight(e,0);
412 }
413 succ_const_iterator succi = succ_begin(BB), succe = succ_end(BB);
414 if (succi == succe) {
415 Edge e = getEdge(BB,0);
416 setEdgeWeight(e,0);
417 }
418 for (;succi != succe; ++succi) {
419 Edge e = getEdge(*succi,BB);
420 setEdgeWeight(e,0);
421 }
422 }
423 }
424
425 return false;
426 }
427