blob: 2f33ee81ce17cd495c59888a6708963c7793be70 [file] [log] [blame]
//===-- SanitizerCoverage.cpp - coverage instrumentation for sanitizers ---===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// Coverage instrumentation that works with AddressSanitizer
11// and potentially with other Sanitizers.
12//
// We create a private one-byte Guard variable for every instrumented block
// and inject this code into the entry block (CoverageLevel=1)
// or all blocks (CoverageLevel>=2):
// if (!*Guard) {
//   __sanitizer_cov();
//   *Guard = 1;
// }
// The accesses to Guard are atomic. The rest of the logic is
// in __sanitizer_cov (it's fine to call it more than once).
22//
// With CoverageLevel>=3 we also split critical edges, which effectively
// instruments all edges.
25//
// CoverageLevel>=4 adds indirect call profiling implemented as a function call.
27//
// This coverage implementation provides very limited data:
// it only tells if a given function (block) was ever executed. No counters.
// But for many use cases this is what we need and the added slowdown is small.
31//
32//===----------------------------------------------------------------------===//
33
34#include "llvm/Transforms/Instrumentation.h"
35#include "llvm/ADT/ArrayRef.h"
36#include "llvm/ADT/SmallVector.h"
37#include "llvm/IR/CallSite.h"
38#include "llvm/IR/DataLayout.h"
39#include "llvm/IR/Function.h"
40#include "llvm/IR/IRBuilder.h"
41#include "llvm/IR/LLVMContext.h"
42#include "llvm/IR/MDBuilder.h"
43#include "llvm/IR/Module.h"
44#include "llvm/IR/Type.h"
45#include "llvm/Support/CommandLine.h"
46#include "llvm/Support/Debug.h"
47#include "llvm/Support/raw_ostream.h"
48#include "llvm/Transforms/Scalar.h"
49#include "llvm/Transforms/Utils/BasicBlockUtils.h"
50#include "llvm/Transforms/Utils/ModuleUtils.h"
51
52using namespace llvm;
53
54#define DEBUG_TYPE "sancov"
55
// Names of the run-time interface functions this pass emits calls to.
static const char kSanCovModuleInitName[] = "__sanitizer_cov_module_init";
static const char kSanCovName[] = "__sanitizer_cov";
static const char kSanCovIndirCallName[] = "__sanitizer_cov_indir_call16";

// Name of the internal constructor function created in every instrumented
// module, and the priority it is registered with in the global ctor list.
static const char kSanCovModuleCtorName[] = "sancov.module_ctor";
static const uint64_t kSanCtorAndDtorPriority = 1;
61
62static cl::opt<int> ClCoverageLevel("sanitizer-coverage-level",
63 cl::desc("Sanitizer Coverage. 0: none, 1: entry block, 2: all blocks, "
64 "3: all blocks and critical edges, "
65 "4: above plus indirect calls"),
66 cl::Hidden, cl::init(0));
67
68static cl::opt<int> ClCoverageBlockThreshold(
69 "sanitizer-coverage-block-threshold",
70 cl::desc("Add coverage instrumentation only to the entry block if there "
71 "are more than this number of blocks."),
72 cl::Hidden, cl::init(1500));
73
74namespace {
75
76class SanitizerCoverageModule : public ModulePass {
77 public:
78 SanitizerCoverageModule(int CoverageLevel = 0)
79 : ModulePass(ID),
80 CoverageLevel(std::max(CoverageLevel, (int)ClCoverageLevel)) {
81 initializeBreakCriticalEdgesPass(*PassRegistry::getPassRegistry());
82 }
83 bool runOnModule(Module &M) override;
84 bool runOnFunction(Function &F);
85 static char ID; // Pass identification, replacement for typeid
86 const char *getPassName() const override {
87 return "SanitizerCoverageModule";
88 }
89
90 void getAnalysisUsage(AnalysisUsage &AU) const override {
91 if (CoverageLevel >= 3)
92 AU.addRequiredID(BreakCriticalEdgesID);
93 AU.addRequired<DataLayoutPass>();
94 }
95
96 private:
97 void InjectCoverageForIndirectCalls(Function &F,
98 ArrayRef<Instruction *> IndirCalls);
99 bool InjectCoverage(Function &F, ArrayRef<BasicBlock *> AllBlocks,
100 ArrayRef<Instruction *> IndirCalls);
101 void InjectCoverageAtBlock(Function &F, BasicBlock &BB);
102 Function *SanCovFunction;
103 Function *SanCovIndirCallFunction;
104 Function *SanCovModuleInit;
105 Type *IntptrTy;
106 LLVMContext *C;
107
108 int CoverageLevel;
109};
110
111} // namespace
112
113static Function *checkInterfaceFunction(Constant *FuncOrBitcast) {
114 if (Function *F = dyn_cast<Function>(FuncOrBitcast))
115 return F;
116 std::string Err;
117 raw_string_ostream Stream(Err);
118 Stream << "SanitizerCoverage interface function redefined: "
119 << *FuncOrBitcast;
120 report_fatal_error(Err);
121}
122
123bool SanitizerCoverageModule::runOnModule(Module &M) {
124 if (!CoverageLevel) return false;
125 C = &(M.getContext());
126 DataLayoutPass *DLP = &getAnalysis<DataLayoutPass>();
127 IntptrTy = Type::getIntNTy(*C, DLP->getDataLayout().getPointerSizeInBits());
128 Type *VoidTy = Type::getVoidTy(*C);
129
130 Function *CtorFunc =
131 Function::Create(FunctionType::get(VoidTy, false),
132 GlobalValue::InternalLinkage, kSanCovModuleCtorName, &M);
133 ReturnInst::Create(*C, BasicBlock::Create(*C, "", CtorFunc));
134 appendToGlobalCtors(M, CtorFunc, kSanCtorAndDtorPriority);
135
136 SanCovFunction =
137 checkInterfaceFunction(M.getOrInsertFunction(kSanCovName, VoidTy, NULL));
138 SanCovIndirCallFunction = checkInterfaceFunction(M.getOrInsertFunction(
139 kSanCovIndirCallName, VoidTy, IntptrTy, IntptrTy, NULL));
140 SanCovModuleInit = checkInterfaceFunction(M.getOrInsertFunction(
141 kSanCovModuleInitName, Type::getVoidTy(*C), IntptrTy, NULL));
142 SanCovModuleInit->setLinkage(Function::ExternalLinkage);
143
144 for (auto &F : M)
145 runOnFunction(F);
146
147 IRBuilder<> IRB(CtorFunc->getEntryBlock().getTerminator());
148 IRB.CreateCall(SanCovModuleInit,
149 ConstantInt::get(IntptrTy, SanCovFunction->getNumUses()));
150 return true;
151}
152
153bool SanitizerCoverageModule::runOnFunction(Function &F) {
154 if (F.empty()) return false;
155 // For now instrument only functions that will also be asan-instrumented.
156 if (!F.hasFnAttribute(Attribute::SanitizeAddress))
157 return false;
158 SmallVector<Instruction*, 8> IndirCalls;
159 SmallVector<BasicBlock*, 16> AllBlocks;
160 for (auto &BB : F) {
161 AllBlocks.push_back(&BB);
162 if (CoverageLevel >= 4)
163 for (auto &Inst : BB) {
164 CallSite CS(&Inst);
165 if (CS && !CS.getCalledFunction())
166 IndirCalls.push_back(&Inst);
167 }
168 }
169 InjectCoverage(F, AllBlocks, IndirCalls);
170 return true;
171}
172
173bool
174SanitizerCoverageModule::InjectCoverage(Function &F,
175 ArrayRef<BasicBlock *> AllBlocks,
176 ArrayRef<Instruction *> IndirCalls) {
177 if (!CoverageLevel) return false;
178
179 if (CoverageLevel == 1 ||
180 (unsigned)ClCoverageBlockThreshold < AllBlocks.size()) {
181 InjectCoverageAtBlock(F, F.getEntryBlock());
182 } else {
183 for (auto BB : AllBlocks)
184 InjectCoverageAtBlock(F, *BB);
185 }
186 InjectCoverageForIndirectCalls(F, IndirCalls);
187 return true;
188}
189
190// On every indirect call we call a run-time function
191// __sanitizer_cov_indir_call* with two parameters:
192// - callee address,
193// - global cache array that contains kCacheSize pointers (zero-initialized).
194// The cache is used to speed up recording the caller-callee pairs.
195// The address of the caller is passed implicitly via caller PC.
196// kCacheSize is encoded in the name of the run-time function.
197void SanitizerCoverageModule::InjectCoverageForIndirectCalls(
198 Function &F, ArrayRef<Instruction *> IndirCalls) {
199 if (IndirCalls.empty()) return;
200 const int kCacheSize = 16;
201 const int kCacheAlignment = 64; // Align for better performance.
202 Type *Ty = ArrayType::get(IntptrTy, kCacheSize);
203 for (auto I : IndirCalls) {
204 IRBuilder<> IRB(I);
205 CallSite CS(I);
206 Value *Callee = CS.getCalledValue();
207 if (dyn_cast<InlineAsm>(Callee)) continue;
208 GlobalVariable *CalleeCache = new GlobalVariable(
209 *F.getParent(), Ty, false, GlobalValue::PrivateLinkage,
210 Constant::getNullValue(Ty), "__sancov_gen_callee_cache");
211 CalleeCache->setAlignment(kCacheAlignment);
212 IRB.CreateCall2(SanCovIndirCallFunction,
213 IRB.CreatePointerCast(Callee, IntptrTy),
214 IRB.CreatePointerCast(CalleeCache, IntptrTy));
215 }
216}
217
218void SanitizerCoverageModule::InjectCoverageAtBlock(Function &F,
219 BasicBlock &BB) {
220 BasicBlock::iterator IP = BB.getFirstInsertionPt(), BE = BB.end();
221 // Skip static allocas at the top of the entry block so they don't become
222 // dynamic when we split the block. If we used our optimized stack layout,
223 // then there will only be one alloca and it will come first.
224 for (; IP != BE; ++IP) {
225 AllocaInst *AI = dyn_cast<AllocaInst>(IP);
226 if (!AI || !AI->isStaticAlloca())
227 break;
228 }
229
230 DebugLoc EntryLoc = &BB == &F.getEntryBlock()
231 ? IP->getDebugLoc().getFnDebugLoc(*C)
232 : IP->getDebugLoc();
233 IRBuilder<> IRB(IP);
234 IRB.SetCurrentDebugLocation(EntryLoc);
235 Type *Int8Ty = IRB.getInt8Ty();
236 GlobalVariable *Guard = new GlobalVariable(
237 *F.getParent(), Int8Ty, false, GlobalValue::PrivateLinkage,
238 Constant::getNullValue(Int8Ty), "__sancov_gen_cov_" + F.getName());
239 LoadInst *Load = IRB.CreateLoad(Guard);
240 Load->setAtomic(Monotonic);
241 Load->setAlignment(1);
242 Value *Cmp = IRB.CreateICmpEQ(Constant::getNullValue(Int8Ty), Load);
243 Instruction *Ins = SplitBlockAndInsertIfThen(
244 Cmp, IP, false, MDBuilder(*C).createBranchWeights(1, 100000));
245 IRB.SetInsertPoint(Ins);
246 IRB.SetCurrentDebugLocation(EntryLoc);
247 // __sanitizer_cov gets the PC of the instruction using GET_CALLER_PC.
248 IRB.CreateCall(SanCovFunction);
249 StoreInst *Store = IRB.CreateStore(ConstantInt::get(Int8Ty, 1), Guard);
250 Store->setAtomic(Monotonic);
251 Store->setAlignment(1);
252}
253
254char SanitizerCoverageModule::ID = 0;
255INITIALIZE_PASS(SanitizerCoverageModule, "sancov",
256 "SanitizerCoverage: TODO."
257 "ModulePass", false, false)
258ModulePass *llvm::createSanitizerCoverageModulePass(int CoverageLevel) {
259 return new SanitizerCoverageModule(CoverageLevel);
260}