blob: 8eb9ad409b8861594b3220df9338eff0d9a85d44 [file] [log] [blame]
//===- BoundsChecking.cpp - Instrumentation for run-time bounds checking --===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file implements a pass that instruments the code to perform run-time
// bounds checking on loads, stores, and other memory intrinsics.
//
//===----------------------------------------------------------------------===//
14
Chandler Carruthed0881b2012-12-03 16:50:05 +000015#include "llvm/ADT/Statistic.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000016#include "llvm/ADT/Twine.h"
Chandler Carruthed0881b2012-12-03 16:50:05 +000017#include "llvm/Analysis/MemoryBuiltins.h"
Chandler Carruth452a0072014-03-04 11:59:06 +000018#include "llvm/Analysis/TargetFolder.h"
Benjamin Kramer799003b2015-03-23 19:32:43 +000019#include "llvm/Analysis/TargetLibraryInfo.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000020#include "llvm/IR/BasicBlock.h"
21#include "llvm/IR/Constants.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000022#include "llvm/IR/DataLayout.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000023#include "llvm/IR/Function.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000024#include "llvm/IR/IRBuilder.h"
Chandler Carruth83948572014-03-04 10:30:26 +000025#include "llvm/IR/InstIterator.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000026#include "llvm/IR/InstrTypes.h"
27#include "llvm/IR/Instruction.h"
28#include "llvm/IR/Instructions.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000029#include "llvm/IR/Intrinsics.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000030#include "llvm/IR/Value.h"
Chandler Carruthaafe0912012-06-29 12:38:19 +000031#include "llvm/Pass.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000032#include "llvm/Support/Casting.h"
Nuno Lopes288e86ff62012-05-31 22:58:48 +000033#include "llvm/Support/CommandLine.h"
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000034#include "llvm/Support/Debug.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000035#include "llvm/Support/ErrorHandling.h"
Chandler Carruthaafe0912012-06-29 12:38:19 +000036#include "llvm/Support/raw_ostream.h"
Chandler Carruth6bda14b2017-06-06 11:49:48 +000037#include "llvm/Transforms/Instrumentation.h"
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000038#include <cstdint>
39#include <vector>
40
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000041using namespace llvm;
42
Chandler Carruth964daaa2014-04-22 02:55:47 +000043#define DEBUG_TYPE "bounds-checking"
44
Nuno Lopes0e967e02012-06-21 15:59:53 +000045static cl::opt<bool> SingleTrapBB("bounds-checking-single-trap",
46 cl::desc("Use one trap block per function"));
Nuno Lopes288e86ff62012-05-31 22:58:48 +000047
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000048STATISTIC(ChecksAdded, "Bounds checks added");
49STATISTIC(ChecksSkipped, "Bounds checks skipped");
50STATISTIC(ChecksUnable, "Bounds checks unable to add");
51
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000052using BuilderTy = IRBuilder<TargetFolder>;
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000053
54namespace {
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000055
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000056 struct BoundsChecking : public FunctionPass {
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000057 static char ID;
58
Joey Gouly95198232012-11-23 10:47:35 +000059 BoundsChecking() : FunctionPass(ID) {
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000060 initializeBoundsCheckingPass(*PassRegistry::getPassRegistry());
61 }
62
Craig Topper3e4c6972014-03-05 09:10:37 +000063 bool runOnFunction(Function &F) override;
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000064
Craig Topper3e4c6972014-03-05 09:10:37 +000065 void getAnalysisUsage(AnalysisUsage &AU) const override {
Chandler Carruthb98f63d2015-01-15 10:41:28 +000066 AU.addRequired<TargetLibraryInfoWrapperPass>();
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000067 }
Nuno Lopes59e9df72012-05-22 22:02:19 +000068
69 private:
Benjamin Kramer8bcc9712012-08-29 15:32:21 +000070 const TargetLibraryInfo *TLI;
Nuno Lopes0e967e02012-06-21 15:59:53 +000071 ObjectSizeOffsetEvaluator *ObjSizeEval;
Nuno Lopes59e9df72012-05-22 22:02:19 +000072 BuilderTy *Builder;
Nuno Lopesde8c6fb2012-06-23 00:12:34 +000073 Instruction *Inst;
Nuno Lopes59e9df72012-05-22 22:02:19 +000074 BasicBlock *TrapBB;
Nuno Lopes59e9df72012-05-22 22:02:19 +000075
76 BasicBlock *getTrapBB();
Mehdi Aminia28d91d2015-03-10 02:37:25 +000077 bool instrument(Value *Ptr, Value *Val, const DataLayout &DL);
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000078 };
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000079
80} // end anonymous namespace
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000081
82char BoundsChecking::ID = 0;
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000083
Nuno Lopes1e8dffd2012-07-03 17:30:18 +000084INITIALIZE_PASS(BoundsChecking, "bounds-checking", "Run-time bounds checking",
85 false, false)
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000086
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000087/// getTrapBB - create a basic block that traps. All overflowing conditions
88/// branch to this block. There's only one trap block per function.
89BasicBlock *BoundsChecking::getTrapBB() {
Nuno Lopes0e967e02012-06-21 15:59:53 +000090 if (TrapBB && SingleTrapBB)
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000091 return TrapBB;
92
Nuno Lopesde8c6fb2012-06-23 00:12:34 +000093 Function *Fn = Inst->getParent()->getParent();
Benjamin Kramer6e931522013-09-30 15:40:17 +000094 IRBuilder<>::InsertPointGuard Guard(*Builder);
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000095 TrapBB = BasicBlock::Create(Fn->getContext(), "trap", Fn);
Benjamin Kramerf0047292013-09-30 15:52:50 +000096 Builder->SetInsertPoint(TrapBB);
Nuno Lopesa2f6cec2012-05-22 17:19:09 +000097
Eugene Zelenkobff0ef02017-10-19 22:07:16 +000098 Value *F = Intrinsic::getDeclaration(Fn->getParent(), Intrinsic::trap);
David Blaikieff6409d2015-05-18 22:13:54 +000099 CallInst *TrapCall = Builder->CreateCall(F, {});
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000100 TrapCall->setDoesNotReturn();
101 TrapCall->setDoesNotThrow();
Nuno Lopesde8c6fb2012-06-23 00:12:34 +0000102 TrapCall->setDebugLoc(Inst->getDebugLoc());
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000103 Builder->CreateUnreachable();
104
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000105 return TrapBB;
106}
107
Nuno Lopes59e9df72012-05-22 22:02:19 +0000108/// instrument - adds run-time bounds checks to memory accessing instructions.
109/// Ptr is the pointer that will be read/written, and InstVal is either the
110/// result from the load or the value being stored. It is used to determine the
111/// size of memory block that is touched.
112/// Returns true if any change was made to the IR, false otherwise.
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000113bool BoundsChecking::instrument(Value *Ptr, Value *InstVal,
114 const DataLayout &DL) {
115 uint64_t NeededSize = DL.getTypeStoreSize(InstVal->getType());
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000116 DEBUG(dbgs() << "Instrument " << *Ptr << " for " << Twine(NeededSize)
117 << " bytes\n");
118
Nuno Lopes0e967e02012-06-21 15:59:53 +0000119 SizeOffsetEvalType SizeOffset = ObjSizeEval->compute(Ptr);
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000120
Nuno Lopes0e967e02012-06-21 15:59:53 +0000121 if (!ObjSizeEval->bothKnown(SizeOffset)) {
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000122 ++ChecksUnable;
123 return false;
124 }
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000125
Nuno Lopes0e967e02012-06-21 15:59:53 +0000126 Value *Size = SizeOffset.first;
127 Value *Offset = SizeOffset.second;
Nuno Lopes1e8dffd2012-07-03 17:30:18 +0000128 ConstantInt *SizeCI = dyn_cast<ConstantInt>(Size);
Nuno Lopes0e967e02012-06-21 15:59:53 +0000129
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000130 Type *IntTy = DL.getIntPtrType(Ptr->getType());
Nuno Lopes0e967e02012-06-21 15:59:53 +0000131 Value *NeededSizeVal = ConstantInt::get(IntTy, NeededSize);
132
Nuno Lopes7d000612012-05-31 22:45:40 +0000133 // three checks are required to ensure safety:
134 // . Offset >= 0 (since the offset is given from the base ptr)
135 // . Size >= Offset (unsigned)
136 // . Size - Offset >= NeededSize (unsigned)
Nuno Lopes1e8dffd2012-07-03 17:30:18 +0000137 //
138 // optimization: if Size >= 0 (signed), skip 1st check
Nuno Lopes7d000612012-05-31 22:45:40 +0000139 // FIXME: add NSW/NUW here? -- we dont care if the subtraction overflows
Nuno Lopes0e967e02012-06-21 15:59:53 +0000140 Value *ObjSize = Builder->CreateSub(Size, Offset);
Nuno Lopes0e967e02012-06-21 15:59:53 +0000141 Value *Cmp2 = Builder->CreateICmpULT(Size, Offset);
142 Value *Cmp3 = Builder->CreateICmpULT(ObjSize, NeededSizeVal);
Nuno Lopes1e8dffd2012-07-03 17:30:18 +0000143 Value *Or = Builder->CreateOr(Cmp2, Cmp3);
144 if (!SizeCI || SizeCI->getValue().slt(0)) {
145 Value *Cmp1 = Builder->CreateICmpSLT(Offset, ConstantInt::get(IntTy, 0));
146 Or = Builder->CreateOr(Cmp1, Or);
147 }
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000148
Chandler Carruth3f0e0562017-10-18 22:42:36 +0000149 // check if the comparison is always false
150 ConstantInt *C = dyn_cast_or_null<ConstantInt>(Or);
151 if (C) {
152 ++ChecksSkipped;
153 // If non-zero, nothing to do.
154 if (!C->getZExtValue())
155 return true;
156 }
157 ++ChecksAdded;
158
159 BasicBlock::iterator SplitI = Builder->GetInsertPoint();
160 BasicBlock *OldBB = SplitI->getParent();
161 BasicBlock *Cont = OldBB->splitBasicBlock(SplitI);
162 OldBB->getTerminator()->eraseFromParent();
163
164 if (C) {
165 // If we have a constant zero, unconditionally branch.
166 // FIXME: We should really handle this differently to bypass the splitting
167 // the block.
168 BranchInst::Create(getTrapBB(), OldBB);
169 return true;
170 }
171
172 // Create the conditional branch.
173 BranchInst::Create(getTrapBB(), Cont, Or, OldBB);
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000174 return true;
175}
176
177bool BoundsChecking::runOnFunction(Function &F) {
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000178 const DataLayout &DL = F.getParent()->getDataLayout();
Chandler Carruthb98f63d2015-01-15 10:41:28 +0000179 TLI = &getAnalysis<TargetLibraryInfoWrapperPass>().getTLI();
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000180
Craig Topperf40110f2014-04-25 05:29:35 +0000181 TrapBB = nullptr;
Rafael Espindola37dc9e12014-02-21 00:06:31 +0000182 BuilderTy TheBuilder(F.getContext(), TargetFolder(DL));
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000183 Builder = &TheBuilder;
Rafael Espindola37dc9e12014-02-21 00:06:31 +0000184 ObjectSizeOffsetEvaluator TheObjSizeEval(DL, TLI, F.getContext(),
Nuno Lopes340b0462013-10-24 09:17:24 +0000185 /*RoundToAlign=*/true);
Nuno Lopes0e967e02012-06-21 15:59:53 +0000186 ObjSizeEval = &TheObjSizeEval;
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000187
188 // check HANDLE_MEMORY_INST in include/llvm/Instruction.def for memory
189 // touching instructions
Eugene Zelenkobff0ef02017-10-19 22:07:16 +0000190 std::vector<Instruction *> WorkList;
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000191 for (inst_iterator i = inst_begin(F), e = inst_end(F); i != e; ++i) {
192 Instruction *I = &*i;
193 if (isa<LoadInst>(I) || isa<StoreInst>(I) || isa<AtomicCmpXchgInst>(I) ||
194 isa<AtomicRMWInst>(I))
195 WorkList.push_back(I);
196 }
197
198 bool MadeChange = false;
Benjamin Kramer135f7352016-06-26 12:28:59 +0000199 for (Instruction *i : WorkList) {
200 Inst = i;
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000201
Nuno Lopesde8c6fb2012-06-23 00:12:34 +0000202 Builder->SetInsertPoint(Inst);
203 if (LoadInst *LI = dyn_cast<LoadInst>(Inst)) {
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000204 MadeChange |= instrument(LI->getPointerOperand(), LI, DL);
Nuno Lopesde8c6fb2012-06-23 00:12:34 +0000205 } else if (StoreInst *SI = dyn_cast<StoreInst>(Inst)) {
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000206 MadeChange |=
207 instrument(SI->getPointerOperand(), SI->getValueOperand(), DL);
Nuno Lopesde8c6fb2012-06-23 00:12:34 +0000208 } else if (AtomicCmpXchgInst *AI = dyn_cast<AtomicCmpXchgInst>(Inst)) {
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000209 MadeChange |=
210 instrument(AI->getPointerOperand(), AI->getCompareOperand(), DL);
Nuno Lopesde8c6fb2012-06-23 00:12:34 +0000211 } else if (AtomicRMWInst *AI = dyn_cast<AtomicRMWInst>(Inst)) {
Mehdi Aminia28d91d2015-03-10 02:37:25 +0000212 MadeChange |=
213 instrument(AI->getPointerOperand(), AI->getValOperand(), DL);
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000214 } else {
215 llvm_unreachable("unknown Instruction type");
216 }
217 }
218 return MadeChange;
219}
220
Joey Gouly95198232012-11-23 10:47:35 +0000221FunctionPass *llvm::createBoundsCheckingPass() {
222 return new BoundsChecking();
Nuno Lopesa2f6cec2012-05-22 17:19:09 +0000223}