• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===--- MisExpect.cpp - Check the use of llvm.expect with PGO data -------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This contains code to emit warnings for potentially incorrect usage of the
10 // llvm.expect intrinsic. This utility extracts the threshold values from
11 // metadata associated with the instrumented Branch or Switch instruction. The
12 // threshold values are then used to determine if a warning should be emitted.
13 //
14 // MisExpect metadata is generated when llvm.expect intrinsics are lowered; see
15 // LowerExpectIntrinsic.cpp
16 //
17 //===----------------------------------------------------------------------===//
18 
19 #include "llvm/Transforms/Utils/MisExpect.h"
20 #include "llvm/ADT/Twine.h"
21 #include "llvm/Analysis/OptimizationRemarkEmitter.h"
22 #include "llvm/IR/Constants.h"
23 #include "llvm/IR/DiagnosticInfo.h"
24 #include "llvm/IR/Instruction.h"
25 #include "llvm/IR/Instructions.h"
26 #include "llvm/IR/LLVMContext.h"
27 #include "llvm/Support/BranchProbability.h"
28 #include "llvm/Support/CommandLine.h"
29 #include "llvm/Support/Debug.h"
30 #include "llvm/Support/FormatVariadic.h"
31 #include <cstdint>
32 #include <functional>
33 #include <numeric>
34 
35 #define DEBUG_TYPE "misexpect"
36 
37 using namespace llvm;
38 using namespace misexpect;
39 
40 namespace llvm {
41 
42 // Command line option to enable/disable the warning when profile data suggests
43 // a mismatch with the use of the llvm.expect intrinsic
44 static cl::opt<bool> PGOWarnMisExpect(
45     "pgo-warn-misexpect", cl::init(false), cl::Hidden,
46     cl::desc("Use this option to turn on/off "
47              "warnings about incorrect usage of llvm.expect intrinsics."));
48 
49 } // namespace llvm
50 
51 namespace {
52 
getOprndOrInst(Instruction * I)53 Instruction *getOprndOrInst(Instruction *I) {
54   assert(I != nullptr && "MisExpect target Instruction cannot be nullptr");
55   Instruction *Ret = nullptr;
56   if (auto *B = dyn_cast<BranchInst>(I)) {
57     Ret = dyn_cast<Instruction>(B->getCondition());
58   }
59   // TODO: Find a way to resolve condition location for switches
60   // Using the condition of the switch seems to often resolve to an earlier
61   // point in the program, i.e. the calculation of the switch condition, rather
62   // than the switches location in the source code. Thus, we should use the
63   // instruction to get source code locations rather than the condition to
64   // improve diagnostic output, such as the caret. If the same problem exists
65   // for branch instructions, then we should remove this function and directly
66   // use the instruction
67   //
68   // else if (auto S = dyn_cast<SwitchInst>(I)) {
69   // Ret = I;
70   //}
71   return Ret ? Ret : I;
72 }
73 
emitMisexpectDiagnostic(Instruction * I,LLVMContext & Ctx,uint64_t ProfCount,uint64_t TotalCount)74 void emitMisexpectDiagnostic(Instruction *I, LLVMContext &Ctx,
75                              uint64_t ProfCount, uint64_t TotalCount) {
76   double PercentageCorrect = (double)ProfCount / TotalCount;
77   auto PerString =
78       formatv("{0:P} ({1} / {2})", PercentageCorrect, ProfCount, TotalCount);
79   auto RemStr = formatv(
80       "Potential performance regression from use of the llvm.expect intrinsic: "
81       "Annotation was correct on {0} of profiled executions.",
82       PerString);
83   Twine Msg(PerString);
84   Instruction *Cond = getOprndOrInst(I);
85   if (PGOWarnMisExpect)
86     Ctx.diagnose(DiagnosticInfoMisExpect(Cond, Msg));
87   OptimizationRemarkEmitter ORE(I->getParent()->getParent());
88   ORE.emit(OptimizationRemark(DEBUG_TYPE, "misexpect", Cond) << RemStr.str());
89 }
90 
91 } // namespace
92 
93 namespace llvm {
94 namespace misexpect {
95 
verifyMisExpect(Instruction * I,const SmallVector<uint32_t,4> & Weights,LLVMContext & Ctx)96 void verifyMisExpect(Instruction *I, const SmallVector<uint32_t, 4> &Weights,
97                      LLVMContext &Ctx) {
98   if (auto *MisExpectData = I->getMetadata(LLVMContext::MD_misexpect)) {
99     auto *MisExpectDataName = dyn_cast<MDString>(MisExpectData->getOperand(0));
100     if (MisExpectDataName &&
101         MisExpectDataName->getString().equals("misexpect")) {
102       LLVM_DEBUG(llvm::dbgs() << "------------------\n");
103       LLVM_DEBUG(llvm::dbgs()
104                  << "Function: " << I->getFunction()->getName() << "\n");
105       LLVM_DEBUG(llvm::dbgs() << "Instruction: " << *I << ":\n");
106       LLVM_DEBUG(for (int Idx = 0, Size = Weights.size(); Idx < Size; ++Idx) {
107         llvm::dbgs() << "Weights[" << Idx << "] = " << Weights[Idx] << "\n";
108       });
109 
110       // extract values from misexpect metadata
111       const auto *IndexCint =
112           mdconst::dyn_extract<ConstantInt>(MisExpectData->getOperand(1));
113       const auto *LikelyCInt =
114           mdconst::dyn_extract<ConstantInt>(MisExpectData->getOperand(2));
115       const auto *UnlikelyCInt =
116           mdconst::dyn_extract<ConstantInt>(MisExpectData->getOperand(3));
117 
118       if (!IndexCint || !LikelyCInt || !UnlikelyCInt)
119         return;
120 
121       const uint64_t Index = IndexCint->getZExtValue();
122       const uint64_t LikelyBranchWeight = LikelyCInt->getZExtValue();
123       const uint64_t UnlikelyBranchWeight = UnlikelyCInt->getZExtValue();
124       const uint64_t ProfileCount = Weights[Index];
125       const uint64_t CaseTotal = std::accumulate(
126           Weights.begin(), Weights.end(), (uint64_t)0, std::plus<uint64_t>());
127       const uint64_t NumUnlikelyTargets = Weights.size() - 1;
128 
129       const uint64_t TotalBranchWeight =
130           LikelyBranchWeight + (UnlikelyBranchWeight * NumUnlikelyTargets);
131 
132       const llvm::BranchProbability LikelyThreshold(LikelyBranchWeight,
133                                                     TotalBranchWeight);
134       uint64_t ScaledThreshold = LikelyThreshold.scale(CaseTotal);
135 
136       LLVM_DEBUG(llvm::dbgs()
137                  << "Unlikely Targets: " << NumUnlikelyTargets << ":\n");
138       LLVM_DEBUG(llvm::dbgs() << "Profile Count: " << ProfileCount << ":\n");
139       LLVM_DEBUG(llvm::dbgs()
140                  << "Scaled Threshold: " << ScaledThreshold << ":\n");
141       LLVM_DEBUG(llvm::dbgs() << "------------------\n");
142       if (ProfileCount < ScaledThreshold)
143         emitMisexpectDiagnostic(I, Ctx, ProfileCount, CaseTotal);
144     }
145   }
146 }
147 
checkFrontendInstrumentation(Instruction & I)148 void checkFrontendInstrumentation(Instruction &I) {
149   if (auto *MD = I.getMetadata(LLVMContext::MD_prof)) {
150     unsigned NOps = MD->getNumOperands();
151 
152     // Only emit misexpect diagnostics if at least 2 branch weights are present.
153     // Less than 2 branch weights means that the profiling metadata is:
154     //    1) incorrect/corrupted
155     //    2) not branch weight metadata
156     //    3) completely deterministic
157     // In these cases we should not emit any diagnostic related to misexpect.
158     if (NOps < 3)
159       return;
160 
161     // Operand 0 is a string tag "branch_weights"
162     if (MDString *Tag = cast<MDString>(MD->getOperand(0))) {
163       if (Tag->getString().equals("branch_weights")) {
164         SmallVector<uint32_t, 4> RealWeights(NOps - 1);
165         for (unsigned i = 1; i < NOps; i++) {
166           ConstantInt *Value =
167               mdconst::dyn_extract<ConstantInt>(MD->getOperand(i));
168           RealWeights[i - 1] = Value->getZExtValue();
169         }
170         verifyMisExpect(&I, RealWeights, I.getContext());
171       }
172     }
173   }
174 }
175 
176 } // namespace misexpect
177 } // namespace llvm
178 #undef DEBUG_TYPE
179