1 //===- LowerExpectIntrinsic.cpp - Lower expect intrinsic ------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This pass lowers the 'expect' intrinsic to LLVM metadata.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "llvm/Transforms/Scalar/LowerExpectIntrinsic.h"
14 #include "llvm/ADT/SmallVector.h"
15 #include "llvm/ADT/Statistic.h"
16 #include "llvm/ADT/iterator_range.h"
17 #include "llvm/IR/BasicBlock.h"
18 #include "llvm/IR/Constants.h"
19 #include "llvm/IR/Function.h"
20 #include "llvm/IR/Instructions.h"
21 #include "llvm/IR/Intrinsics.h"
22 #include "llvm/IR/LLVMContext.h"
23 #include "llvm/IR/MDBuilder.h"
24 #include "llvm/IR/Metadata.h"
25 #include "llvm/InitializePasses.h"
26 #include "llvm/Pass.h"
27 #include "llvm/Support/CommandLine.h"
28 #include "llvm/Support/Debug.h"
29 #include "llvm/Transforms/Scalar.h"
30 #include "llvm/Transforms/Utils/MisExpect.h"
31 
32 using namespace llvm;
33 
34 #define DEBUG_TYPE "lower-expect-intrinsic"
35 
// Incremented once for every branch, switch or select instruction that one of
// the handlers in this file successfully annotated from an expect intrinsic.
STATISTIC(ExpectIntrinsicsHandled,
          "Number of 'expect' intrinsic instructions handled");
38 
39 // These default values are chosen to represent an extremely skewed outcome for
40 // a condition, but they leave some room for interpretation by later passes.
41 //
42 // If the documentation for __builtin_expect() was made explicit that it should
43 // only be used in extreme cases, we could make this ratio higher. As it stands,
44 // programmers may be using __builtin_expect() / llvm.expect to annotate that a
45 // branch is likely or unlikely to be taken.
46 //
47 // There is a known dependency on this ratio in CodeGenPrepare when transforming
48 // 'select' instructions. It may be worthwhile to hoist these values to some
49 // shared space, so they can be used directly by other passes.
50 
// Weight given to the expected successor when lowering a plain llvm.expect
// (read by getBranchWeight()).
static cl::opt<uint32_t> LikelyBranchWeight(
    "likely-branch-weight", cl::Hidden, cl::init(2000),
    cl::desc("Weight of the branch likely to be taken (default = 2000)"));
// Weight given to every other successor when lowering a plain llvm.expect
// (read by getBranchWeight()).
static cl::opt<uint32_t> UnlikelyBranchWeight(
    "unlikely-branch-weight", cl::Hidden, cl::init(1),
    cl::desc("Weight of the branch unlikely to be taken (default = 1)"));
57 
58 static std::tuple<uint32_t, uint32_t>
getBranchWeight(Intrinsic::ID IntrinsicID,CallInst * CI,int BranchCount)59 getBranchWeight(Intrinsic::ID IntrinsicID, CallInst *CI, int BranchCount) {
60   if (IntrinsicID == Intrinsic::expect) {
61     // __builtin_expect
62     return std::make_tuple(LikelyBranchWeight.getValue(),
63                            UnlikelyBranchWeight.getValue());
64   } else {
65     // __builtin_expect_with_probability
66     assert(CI->getNumOperands() >= 3 &&
67            "expect with probability must have 3 arguments");
68     ConstantFP *Confidence = dyn_cast<ConstantFP>(CI->getArgOperand(2));
69     double TrueProb = Confidence->getValueAPF().convertToDouble();
70     assert((TrueProb >= 0.0 && TrueProb <= 1.0) &&
71            "probability value must be in the range [0.0, 1.0]");
72     double FalseProb = (1.0 - TrueProb) / (BranchCount - 1);
73     uint32_t LikelyBW = ceil((TrueProb * (double)(INT32_MAX - 1)) + 1.0);
74     uint32_t UnlikelyBW = ceil((FalseProb * (double)(INT32_MAX - 1)) + 1.0);
75     return std::make_tuple(LikelyBW, UnlikelyBW);
76   }
77 }
78 
handleSwitchExpect(SwitchInst & SI)79 static bool handleSwitchExpect(SwitchInst &SI) {
80   CallInst *CI = dyn_cast<CallInst>(SI.getCondition());
81   if (!CI)
82     return false;
83 
84   Function *Fn = CI->getCalledFunction();
85   if (!Fn || (Fn->getIntrinsicID() != Intrinsic::expect &&
86               Fn->getIntrinsicID() != Intrinsic::expect_with_probability))
87     return false;
88 
89   Value *ArgValue = CI->getArgOperand(0);
90   ConstantInt *ExpectedValue = dyn_cast<ConstantInt>(CI->getArgOperand(1));
91   if (!ExpectedValue)
92     return false;
93 
94   SwitchInst::CaseHandle Case = *SI.findCaseValue(ExpectedValue);
95   unsigned n = SI.getNumCases(); // +1 for default case.
96   uint32_t LikelyBranchWeightVal, UnlikelyBranchWeightVal;
97   std::tie(LikelyBranchWeightVal, UnlikelyBranchWeightVal) =
98       getBranchWeight(Fn->getIntrinsicID(), CI, n + 1);
99 
100   SmallVector<uint32_t, 16> Weights(n + 1, UnlikelyBranchWeightVal);
101 
102   uint64_t Index = (Case == *SI.case_default()) ? 0 : Case.getCaseIndex() + 1;
103   Weights[Index] = LikelyBranchWeightVal;
104 
105   SI.setMetadata(LLVMContext::MD_misexpect,
106                  MDBuilder(CI->getContext())
107                      .createMisExpect(Index, LikelyBranchWeightVal,
108                                       UnlikelyBranchWeightVal));
109 
110   SI.setCondition(ArgValue);
111   misexpect::checkFrontendInstrumentation(SI);
112 
113   SI.setMetadata(LLVMContext::MD_prof,
114                  MDBuilder(CI->getContext()).createBranchWeights(Weights));
115 
116   return true;
117 }
118 
119 /// Handler for PHINodes that define the value argument to an
120 /// @llvm.expect call.
121 ///
122 /// If the operand of the phi has a constant value and it 'contradicts'
123 /// with the expected value of phi def, then the corresponding incoming
124 /// edge of the phi is unlikely to be taken. Using that information,
125 /// the branch probability info for the originating branch can be inferred.
handlePhiDef(CallInst * Expect)126 static void handlePhiDef(CallInst *Expect) {
127   Value &Arg = *Expect->getArgOperand(0);
128   ConstantInt *ExpectedValue = dyn_cast<ConstantInt>(Expect->getArgOperand(1));
129   if (!ExpectedValue)
130     return;
131   const APInt &ExpectedPhiValue = ExpectedValue->getValue();
132 
133   // Walk up in backward a list of instructions that
134   // have 'copy' semantics by 'stripping' the copies
135   // until a PHI node or an instruction of unknown kind
136   // is reached. Negation via xor is also handled.
137   //
138   //       C = PHI(...);
139   //       B = C;
140   //       A = B;
141   //       D = __builtin_expect(A, 0);
142   //
143   Value *V = &Arg;
144   SmallVector<Instruction *, 4> Operations;
145   while (!isa<PHINode>(V)) {
146     if (ZExtInst *ZExt = dyn_cast<ZExtInst>(V)) {
147       V = ZExt->getOperand(0);
148       Operations.push_back(ZExt);
149       continue;
150     }
151 
152     if (SExtInst *SExt = dyn_cast<SExtInst>(V)) {
153       V = SExt->getOperand(0);
154       Operations.push_back(SExt);
155       continue;
156     }
157 
158     BinaryOperator *BinOp = dyn_cast<BinaryOperator>(V);
159     if (!BinOp || BinOp->getOpcode() != Instruction::Xor)
160       return;
161 
162     ConstantInt *CInt = dyn_cast<ConstantInt>(BinOp->getOperand(1));
163     if (!CInt)
164       return;
165 
166     V = BinOp->getOperand(0);
167     Operations.push_back(BinOp);
168   }
169 
170   // Executes the recorded operations on input 'Value'.
171   auto ApplyOperations = [&](const APInt &Value) {
172     APInt Result = Value;
173     for (auto Op : llvm::reverse(Operations)) {
174       switch (Op->getOpcode()) {
175       case Instruction::Xor:
176         Result ^= cast<ConstantInt>(Op->getOperand(1))->getValue();
177         break;
178       case Instruction::ZExt:
179         Result = Result.zext(Op->getType()->getIntegerBitWidth());
180         break;
181       case Instruction::SExt:
182         Result = Result.sext(Op->getType()->getIntegerBitWidth());
183         break;
184       default:
185         llvm_unreachable("Unexpected operation");
186       }
187     }
188     return Result;
189   };
190 
191   auto *PhiDef = cast<PHINode>(V);
192 
193   // Get the first dominating conditional branch of the operand
194   // i's incoming block.
195   auto GetDomConditional = [&](unsigned i) -> BranchInst * {
196     BasicBlock *BB = PhiDef->getIncomingBlock(i);
197     BranchInst *BI = dyn_cast<BranchInst>(BB->getTerminator());
198     if (BI && BI->isConditional())
199       return BI;
200     BB = BB->getSinglePredecessor();
201     if (!BB)
202       return nullptr;
203     BI = dyn_cast<BranchInst>(BB->getTerminator());
204     if (!BI || BI->isUnconditional())
205       return nullptr;
206     return BI;
207   };
208 
209   // Now walk through all Phi operands to find phi oprerands with values
210   // conflicting with the expected phi output value. Any such operand
211   // indicates the incoming edge to that operand is unlikely.
212   for (unsigned i = 0, e = PhiDef->getNumIncomingValues(); i != e; ++i) {
213 
214     Value *PhiOpnd = PhiDef->getIncomingValue(i);
215     ConstantInt *CI = dyn_cast<ConstantInt>(PhiOpnd);
216     if (!CI)
217       continue;
218 
219     // Not an interesting case when IsUnlikely is false -- we can not infer
220     // anything useful when the operand value matches the expected phi
221     // output.
222     if (ExpectedPhiValue == ApplyOperations(CI->getValue()))
223       continue;
224 
225     BranchInst *BI = GetDomConditional(i);
226     if (!BI)
227       continue;
228 
229     MDBuilder MDB(PhiDef->getContext());
230 
231     // There are two situations in which an operand of the PhiDef comes
232     // from a given successor of a branch instruction BI.
233     // 1) When the incoming block of the operand is the successor block;
234     // 2) When the incoming block is BI's enclosing block and the
235     // successor is the PhiDef's enclosing block.
236     //
237     // Returns true if the operand which comes from OpndIncomingBB
238     // comes from outgoing edge of BI that leads to Succ block.
239     auto *OpndIncomingBB = PhiDef->getIncomingBlock(i);
240     auto IsOpndComingFromSuccessor = [&](BasicBlock *Succ) {
241       if (OpndIncomingBB == Succ)
242         // If this successor is the incoming block for this
243         // Phi operand, then this successor does lead to the Phi.
244         return true;
245       if (OpndIncomingBB == BI->getParent() && Succ == PhiDef->getParent())
246         // Otherwise, if the edge is directly from the branch
247         // to the Phi, this successor is the one feeding this
248         // Phi operand.
249         return true;
250       return false;
251     };
252     uint32_t LikelyBranchWeightVal, UnlikelyBranchWeightVal;
253     std::tie(LikelyBranchWeightVal, UnlikelyBranchWeightVal) = getBranchWeight(
254         Expect->getCalledFunction()->getIntrinsicID(), Expect, 2);
255 
256     if (IsOpndComingFromSuccessor(BI->getSuccessor(1)))
257       BI->setMetadata(LLVMContext::MD_prof,
258                       MDB.createBranchWeights(LikelyBranchWeightVal,
259                                               UnlikelyBranchWeightVal));
260     else if (IsOpndComingFromSuccessor(BI->getSuccessor(0)))
261       BI->setMetadata(LLVMContext::MD_prof,
262                       MDB.createBranchWeights(UnlikelyBranchWeightVal,
263                                               LikelyBranchWeightVal));
264   }
265 }
266 
267 // Handle both BranchInst and SelectInst.
handleBrSelExpect(BrSelInst & BSI)268 template <class BrSelInst> static bool handleBrSelExpect(BrSelInst &BSI) {
269 
270   // Handle non-optimized IR code like:
271   //   %expval = call i64 @llvm.expect.i64(i64 %conv1, i64 1)
272   //   %tobool = icmp ne i64 %expval, 0
273   //   br i1 %tobool, label %if.then, label %if.end
274   //
275   // Or the following simpler case:
276   //   %expval = call i1 @llvm.expect.i1(i1 %cmp, i1 1)
277   //   br i1 %expval, label %if.then, label %if.end
278 
279   CallInst *CI;
280 
281   ICmpInst *CmpI = dyn_cast<ICmpInst>(BSI.getCondition());
282   CmpInst::Predicate Predicate;
283   ConstantInt *CmpConstOperand = nullptr;
284   if (!CmpI) {
285     CI = dyn_cast<CallInst>(BSI.getCondition());
286     Predicate = CmpInst::ICMP_NE;
287   } else {
288     Predicate = CmpI->getPredicate();
289     if (Predicate != CmpInst::ICMP_NE && Predicate != CmpInst::ICMP_EQ)
290       return false;
291 
292     CmpConstOperand = dyn_cast<ConstantInt>(CmpI->getOperand(1));
293     if (!CmpConstOperand)
294       return false;
295     CI = dyn_cast<CallInst>(CmpI->getOperand(0));
296   }
297 
298   if (!CI)
299     return false;
300 
301   uint64_t ValueComparedTo = 0;
302   if (CmpConstOperand) {
303     if (CmpConstOperand->getBitWidth() > 64)
304       return false;
305     ValueComparedTo = CmpConstOperand->getZExtValue();
306   }
307 
308   Function *Fn = CI->getCalledFunction();
309   if (!Fn || (Fn->getIntrinsicID() != Intrinsic::expect &&
310               Fn->getIntrinsicID() != Intrinsic::expect_with_probability))
311     return false;
312 
313   Value *ArgValue = CI->getArgOperand(0);
314   ConstantInt *ExpectedValue = dyn_cast<ConstantInt>(CI->getArgOperand(1));
315   if (!ExpectedValue)
316     return false;
317 
318   MDBuilder MDB(CI->getContext());
319   MDNode *Node;
320   MDNode *ExpNode;
321 
322   uint32_t LikelyBranchWeightVal, UnlikelyBranchWeightVal;
323   std::tie(LikelyBranchWeightVal, UnlikelyBranchWeightVal) =
324       getBranchWeight(Fn->getIntrinsicID(), CI, 2);
325 
326   if ((ExpectedValue->getZExtValue() == ValueComparedTo) ==
327       (Predicate == CmpInst::ICMP_EQ)) {
328     Node =
329         MDB.createBranchWeights(LikelyBranchWeightVal, UnlikelyBranchWeightVal);
330     ExpNode =
331         MDB.createMisExpect(0, LikelyBranchWeightVal, UnlikelyBranchWeightVal);
332   } else {
333     Node =
334         MDB.createBranchWeights(UnlikelyBranchWeightVal, LikelyBranchWeightVal);
335     ExpNode =
336         MDB.createMisExpect(1, LikelyBranchWeightVal, UnlikelyBranchWeightVal);
337   }
338 
339   BSI.setMetadata(LLVMContext::MD_misexpect, ExpNode);
340 
341   if (CmpI)
342     CmpI->setOperand(0, ArgValue);
343   else
344     BSI.setCondition(ArgValue);
345 
346   misexpect::checkFrontendInstrumentation(BSI);
347 
348   BSI.setMetadata(LLVMContext::MD_prof, Node);
349 
350   return true;
351 }
352 
handleBranchExpect(BranchInst & BI)353 static bool handleBranchExpect(BranchInst &BI) {
354   if (BI.isUnconditional())
355     return false;
356 
357   return handleBrSelExpect<BranchInst>(BI);
358 }
359 
lowerExpectIntrinsic(Function & F)360 static bool lowerExpectIntrinsic(Function &F) {
361   bool Changed = false;
362 
363   for (BasicBlock &BB : F) {
364     // Create "block_weights" metadata.
365     if (BranchInst *BI = dyn_cast<BranchInst>(BB.getTerminator())) {
366       if (handleBranchExpect(*BI))
367         ExpectIntrinsicsHandled++;
368     } else if (SwitchInst *SI = dyn_cast<SwitchInst>(BB.getTerminator())) {
369       if (handleSwitchExpect(*SI))
370         ExpectIntrinsicsHandled++;
371     }
372 
373     // Remove llvm.expect intrinsics. Iterate backwards in order
374     // to process select instructions before the intrinsic gets
375     // removed.
376     for (auto BI = BB.rbegin(), BE = BB.rend(); BI != BE;) {
377       Instruction *Inst = &*BI++;
378       CallInst *CI = dyn_cast<CallInst>(Inst);
379       if (!CI) {
380         if (SelectInst *SI = dyn_cast<SelectInst>(Inst)) {
381           if (handleBrSelExpect(*SI))
382             ExpectIntrinsicsHandled++;
383         }
384         continue;
385       }
386 
387       Function *Fn = CI->getCalledFunction();
388       if (Fn && (Fn->getIntrinsicID() == Intrinsic::expect ||
389                  Fn->getIntrinsicID() == Intrinsic::expect_with_probability)) {
390         // Before erasing the llvm.expect, walk backward to find
391         // phi that define llvm.expect's first arg, and
392         // infer branch probability:
393         handlePhiDef(CI);
394         Value *Exp = CI->getArgOperand(0);
395         CI->replaceAllUsesWith(Exp);
396         CI->eraseFromParent();
397         Changed = true;
398       }
399     }
400   }
401 
402   return Changed;
403 }
404 
run(Function & F,FunctionAnalysisManager &)405 PreservedAnalyses LowerExpectIntrinsicPass::run(Function &F,
406                                                 FunctionAnalysisManager &) {
407   if (lowerExpectIntrinsic(F))
408     return PreservedAnalyses::none();
409 
410   return PreservedAnalyses::all();
411 }
412 
413 namespace {
414 /// Legacy pass for lowering expect intrinsics out of the IR.
415 ///
416 /// When this pass is run over a function it uses expect intrinsics which feed
417 /// branches and switches to provide branch weight metadata for those
418 /// terminators. It then removes the expect intrinsics from the IR so the rest
419 /// of the optimizer can ignore them.
420 class LowerExpectIntrinsic : public FunctionPass {
421 public:
422   static char ID;
LowerExpectIntrinsic()423   LowerExpectIntrinsic() : FunctionPass(ID) {
424     initializeLowerExpectIntrinsicPass(*PassRegistry::getPassRegistry());
425   }
426 
runOnFunction(Function & F)427   bool runOnFunction(Function &F) override { return lowerExpectIntrinsic(F); }
428 };
429 }
430 
// Definition of the legacy pass's static ID member (the one handed to the
// FunctionPass constructor), followed by registration of the pass under the
// command-line name "lower-expect".
// NOTE(review): the two trailing `false` arguments are presumably the
// CFG-only and is-analysis flags -- confirm against INITIALIZE_PASS.
char LowerExpectIntrinsic::ID = 0;
INITIALIZE_PASS(LowerExpectIntrinsic, "lower-expect",
                "Lower 'expect' Intrinsics", false, false)
434 
createLowerExpectIntrinsicPass()435 FunctionPass *llvm::createLowerExpectIntrinsicPass() {
436   return new LowerExpectIntrinsic();
437 }
438