blob: 72825f5f6f4260a31d8fde018e3d095cf9552e80 [file] [log] [blame]
//===-- AddressSanitizer.cpp - memory error detector ------------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
//
// This file is a part of AddressSanitizer, an address sanity checker.
// Details of the algorithm:
//  http://code.google.com/p/address-sanitizer/wiki/AddressSanitizerAlgorithm
//
//===----------------------------------------------------------------------===//
15
16#define DEBUG_TYPE "asan"
17
Chandler Carruthed0881b2012-12-03 16:50:05 +000018#include "llvm/Transforms/Instrumentation.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000019#include "llvm/ADT/ArrayRef.h"
Alexey Samsonov29dd7f22012-12-27 08:50:58 +000020#include "llvm/ADT/DenseMap.h"
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +000021#include "llvm/ADT/DepthFirstIterator.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000022#include "llvm/ADT/OwningPtr.h"
23#include "llvm/ADT/SmallSet.h"
24#include "llvm/ADT/SmallString.h"
25#include "llvm/ADT/SmallVector.h"
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +000026#include "llvm/ADT/Statistic.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000027#include "llvm/ADT/StringExtras.h"
Evgeniy Stepanov617232f2012-05-23 11:52:12 +000028#include "llvm/ADT/Triple.h"
Alexey Samsonov3d43b632012-12-12 14:31:53 +000029#include "llvm/DIBuilder.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000030#include "llvm/IR/DataLayout.h"
31#include "llvm/IR/Function.h"
32#include "llvm/IR/IRBuilder.h"
33#include "llvm/IR/InlineAsm.h"
34#include "llvm/IR/IntrinsicInst.h"
35#include "llvm/IR/LLVMContext.h"
36#include "llvm/IR/Module.h"
37#include "llvm/IR/Type.h"
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +000038#include "llvm/InstVisitor.h"
Kostya Serebryany699ac282013-02-20 12:35:15 +000039#include "llvm/Support/CallSite.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000040#include "llvm/Support/CommandLine.h"
41#include "llvm/Support/DataTypes.h"
42#include "llvm/Support/Debug.h"
Kostya Serebryany9e62b302013-06-03 14:46:56 +000043#include "llvm/Support/Endian.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000044#include "llvm/Support/system_error.h"
Kostya Serebryany4fb78012013-12-06 09:00:17 +000045#include "llvm/Transforms/Utils/ASanStackFrameLayout.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000046#include "llvm/Transforms/Utils/BasicBlockUtils.h"
Kostya Serebryany9f5213f2013-06-26 09:18:17 +000047#include "llvm/Transforms/Utils/Cloning.h"
Alexey Samsonov3d43b632012-12-12 14:31:53 +000048#include "llvm/Transforms/Utils/Local.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000049#include "llvm/Transforms/Utils/ModuleUtils.h"
Peter Collingbourne015370e2013-07-09 22:02:49 +000050#include "llvm/Transforms/Utils/SpecialCaseList.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000051#include <algorithm>
Chandler Carruthed0881b2012-12-03 16:50:05 +000052#include <string>
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000053
54using namespace llvm;
55
// Default shadow mapping parameters; getShadowMapping() picks among them
// based on the target triple and the pointer size.
static const uint64_t kDefaultShadowScale = 3;
static const uint64_t kDefaultShadowOffset32 = 1ULL << 29;
static const uint64_t kDefaultShadowOffset64 = 1ULL << 44;
static const uint64_t kDefaultShort64bitShadowOffset = 0x7FFF8000;  // < 2G.
// Target-specific shadow offsets (PowerPC64 and 32-bit MIPS).
static const uint64_t kPPC64_ShadowOffset64 = 1ULL << 41;
static const uint64_t kMIPS32_ShadowOffset32 = 0x0aaa8000;

// Size bounds related to the "stack malloc" run-time callbacks.
static const size_t kMinStackMallocSize = 1 << 6;   // 64B
static const size_t kMaxStackMallocSize = 1 << 16;  // 64K
// Magic values identifying a current and a retired stack frame.
static const uintptr_t kCurrentStackFrameMagic = 0x41B58AB3;
static const uintptr_t kRetiredStackFrameMagic = 0x45E0360E;
67
// Names of the module constructor/destructor created by the instrumentation.
static const char *const kAsanModuleCtorName = "asan.module_ctor";
static const char *const kAsanModuleDtorName = "asan.module_dtor";
// NOTE(review): the identifier presumably means "CtorAndDtor"; it is kept
// as is because it may be referenced elsewhere in the file.
static const int kAsanCtorAndCtorPriority = 1;

// Error reporting callbacks. The template is a name prefix; the *N variants
// are complete names.
static const char *const kAsanReportErrorTemplate = "__asan_report_";
static const char *const kAsanReportLoadN = "__asan_report_load_n";
static const char *const kAsanReportStoreN = "__asan_report_store_n";

// Globals registration and dynamic-initialization callbacks.
static const char *const kAsanRegisterGlobalsName = "__asan_register_globals";
static const char *const kAsanUnregisterGlobalsName =
    "__asan_unregister_globals";
static const char *const kAsanPoisonGlobalsName = "__asan_before_dynamic_init";
static const char *const kAsanUnpoisonGlobalsName = "__asan_after_dynamic_init";

// Miscellaneous run-time entry points and symbols.
static const char *const kAsanInitName = "__asan_init_v3";
static const char *const kAsanCovName = "__sanitizer_cov";
static const char *const kAsanHandleNoReturnName = "__asan_handle_no_return";
static const char *const kAsanMappingOffsetName = "__asan_mapping_offset";
static const char *const kAsanMappingScaleName = "__asan_mapping_scale";

// Stack allocation callbacks; the templates are name prefixes and
// kMaxAsanStackMallocSizeClass is the largest size class index.
static const int kMaxAsanStackMallocSizeClass = 10;
static const char *const kAsanStackMallocNameTemplate = "__asan_stack_malloc_";
static const char *const kAsanStackFreeNameTemplate = "__asan_stack_free_";
static const char *const kAsanGenPrefix = "__asan_gen_";
static const char *const kAsanPoisonStackMemoryName =
    "__asan_poison_stack_memory";
static const char *const kAsanUnpoisonStackMemoryName =
    "__asan_unpoison_stack_memory";

// Name of the run-time option symbol for stack-use-after-return detection.
static const char *const kAsanOptionDetectUAR =
    "__asan_option_detect_stack_use_after_return";
95
// Only defined when assertions are enabled (NDEBUG is not set).
#ifndef NDEBUG
static const int kAsanStackAfterReturnMagic = 0xf5;
#endif

// Access sizes are powers of two: 1, 2, 4, 8, 16 -- five sizes in total.
static const size_t kNumberOfAccessSizes = 5;
102
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000103// Command-line flags.
104
105// This flag may need to be replaced with -f[no-]asan-reads.
106static cl::opt<bool> ClInstrumentReads("asan-instrument-reads",
107 cl::desc("instrument read instructions"), cl::Hidden, cl::init(true));
108static cl::opt<bool> ClInstrumentWrites("asan-instrument-writes",
109 cl::desc("instrument write instructions"), cl::Hidden, cl::init(true));
Kostya Serebryany90241602012-05-30 09:04:06 +0000110static cl::opt<bool> ClInstrumentAtomics("asan-instrument-atomics",
111 cl::desc("instrument atomic instructions (rmw, cmpxchg)"),
112 cl::Hidden, cl::init(true));
Kostya Serebryany1e575ab2012-08-15 08:58:58 +0000113static cl::opt<bool> ClAlwaysSlowPath("asan-always-slow-path",
114 cl::desc("use instrumentation with slow path for all accesses"),
115 cl::Hidden, cl::init(false));
Kostya Serebryany874dae62012-07-16 16:15:40 +0000116// This flag limits the number of instructions to be instrumented
Kostya Serebryanyc387ca72012-06-28 09:34:41 +0000117// in any given BB. Normally, this should be set to unlimited (INT_MAX),
118// but due to http://llvm.org/bugs/show_bug.cgi?id=12652 we temporary
119// set it to 10000.
120static cl::opt<int> ClMaxInsnsToInstrumentPerBB("asan-max-ins-per-bb",
121 cl::init(10000),
122 cl::desc("maximal number of instructions to instrument in any given BB"),
123 cl::Hidden);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000124// This flag may need to be replaced with -f[no]asan-stack.
125static cl::opt<bool> ClStack("asan-stack",
126 cl::desc("Handle stack memory"), cl::Hidden, cl::init(true));
127// This flag may need to be replaced with -f[no]asan-use-after-return.
128static cl::opt<bool> ClUseAfterReturn("asan-use-after-return",
129 cl::desc("Check return-after-free"), cl::Hidden, cl::init(false));
130// This flag may need to be replaced with -f[no]asan-globals.
131static cl::opt<bool> ClGlobals("asan-globals",
132 cl::desc("Handle global objects"), cl::Hidden, cl::init(true));
Bob Wilsonda4147c2013-11-15 07:16:09 +0000133static cl::opt<bool> ClCoverage("asan-coverage",
134 cl::desc("ASan coverage"), cl::Hidden, cl::init(false));
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000135static cl::opt<bool> ClInitializers("asan-initialization-order",
136 cl::desc("Handle C++ initializer order"), cl::Hidden, cl::init(false));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000137static cl::opt<bool> ClMemIntrin("asan-memintrin",
138 cl::desc("Handle memset/memcpy/memmove"), cl::Hidden, cl::init(true));
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000139static cl::opt<unsigned> ClRealignStack("asan-realign-stack",
140 cl::desc("Realign stack to the value of this flag (power of two)"),
141 cl::Hidden, cl::init(32));
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000142static cl::opt<std::string> ClBlacklistFile("asan-blacklist",
143 cl::desc("File containing the list of objects to ignore "
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000144 "during instrumentation"), cl::Hidden);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000145
Kostya Serebryany9f5213f2013-06-26 09:18:17 +0000146// This is an experimental feature that will allow to choose between
147// instrumented and non-instrumented code at link-time.
148// If this option is on, just before instrumenting a function we create its
149// clone; if the function is not changed by asan the clone is deleted.
150// If we end up with a clone, we put the instrumented function into a section
151// called "ASAN" and the uninstrumented function into a section called "NOASAN".
152//
153// This is still a prototype, we need to figure out a way to keep two copies of
154// a function so that the linker can easily choose one of them.
155static cl::opt<bool> ClKeepUninstrumented("asan-keep-uninstrumented-functions",
156 cl::desc("Keep uninstrumented copies of functions"),
157 cl::Hidden, cl::init(false));
158
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000159// These flags allow to change the shadow mapping.
160// The shadow mapping looks like
161// Shadow = (Mem >> scale) + (1 << offset_log)
162static cl::opt<int> ClMappingScale("asan-mapping-scale",
163 cl::desc("scale of asan shadow mapping"), cl::Hidden, cl::init(0));
164static cl::opt<int> ClMappingOffsetLog("asan-mapping-offset-log",
165 cl::desc("offset of asan shadow mapping"), cl::Hidden, cl::init(-1));
Kostya Serebryanyc5f44bc2013-02-11 14:36:01 +0000166static cl::opt<bool> ClShort64BitOffset("asan-short-64bit-mapping-offset",
167 cl::desc("Use short immediate constant as the mapping offset for 64bit"),
Kostya Serebryanybe733372013-02-12 11:11:02 +0000168 cl::Hidden, cl::init(true));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000169
170// Optimization flags. Not user visible, used mostly for testing
171// and benchmarking the tool.
172static cl::opt<bool> ClOpt("asan-opt",
173 cl::desc("Optimize instrumentation"), cl::Hidden, cl::init(true));
174static cl::opt<bool> ClOptSameTemp("asan-opt-same-temp",
175 cl::desc("Instrument the same temp just once"), cl::Hidden,
176 cl::init(true));
177static cl::opt<bool> ClOptGlobals("asan-opt-globals",
178 cl::desc("Don't instrument scalar globals"), cl::Hidden, cl::init(true));
179
Alexey Samsonovdf624522012-11-29 18:14:24 +0000180static cl::opt<bool> ClCheckLifetime("asan-check-lifetime",
181 cl::desc("Use llvm.lifetime intrinsics to insert extra checks"),
182 cl::Hidden, cl::init(false));
183
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000184// Debug flags.
185static cl::opt<int> ClDebug("asan-debug", cl::desc("debug"), cl::Hidden,
186 cl::init(0));
187static cl::opt<int> ClDebugStack("asan-debug-stack", cl::desc("debug stack"),
188 cl::Hidden, cl::init(0));
189static cl::opt<std::string> ClDebugFunc("asan-debug-func",
190 cl::Hidden, cl::desc("Debug func"));
191static cl::opt<int> ClDebugMin("asan-debug-min", cl::desc("Debug min inst"),
192 cl::Hidden, cl::init(-1));
193static cl::opt<int> ClDebugMax("asan-debug-max", cl::desc("Debug man inst"),
194 cl::Hidden, cl::init(-1));
195
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000196STATISTIC(NumInstrumentedReads, "Number of instrumented reads");
197STATISTIC(NumInstrumentedWrites, "Number of instrumented writes");
198STATISTIC(NumOptimizedAccessesToGlobalArray,
199 "Number of optimized accesses to global arrays");
200STATISTIC(NumOptimizedAccessesToGlobalVar,
201 "Number of optimized accesses to global vars");
202
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000203namespace {
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000204/// A set of dynamically initialized globals extracted from metadata.
205class SetOfDynamicallyInitializedGlobals {
206 public:
207 void Init(Module& M) {
208 // Clang generates metadata identifying all dynamically initialized globals.
209 NamedMDNode *DynamicGlobals =
210 M.getNamedMetadata("llvm.asan.dynamically_initialized_globals");
211 if (!DynamicGlobals)
212 return;
213 for (int i = 0, n = DynamicGlobals->getNumOperands(); i < n; ++i) {
214 MDNode *MDN = DynamicGlobals->getOperand(i);
215 assert(MDN->getNumOperands() == 1);
216 Value *VG = MDN->getOperand(0);
217 // The optimizer may optimize away a global entirely, in which case we
218 // cannot instrument access to it.
219 if (!VG)
220 continue;
221 DynInitGlobals.insert(cast<GlobalVariable>(VG));
222 }
223 }
224 bool Contains(GlobalVariable *G) { return DynInitGlobals.count(G) != 0; }
225 private:
226 SmallSet<GlobalValue*, 32> DynInitGlobals;
227};
228
/// Parameters of the shadow mapping, which follows the rule:
///   shadow = (mem >> Scale) ADD-or-OR Offset.
struct ShadowMapping {
  /// Right shift applied to the application address.
  int Scale;
  /// Constant combined with the shifted address.
  uint64_t Offset;
  /// If true, Offset is OR-ed into the shifted address; otherwise it is added.
  bool OrShadowOffset;
};
236
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000237static ShadowMapping getShadowMapping(const Module &M, int LongSize,
238 bool ZeroBaseShadow) {
239 llvm::Triple TargetTriple(M.getTargetTriple());
240 bool IsAndroid = TargetTriple.getEnvironment() == llvm::Triple::Android;
Alexander Potapenko259e8122013-02-12 12:41:12 +0000241 bool IsMacOSX = TargetTriple.getOS() == llvm::Triple::MacOSX;
Bill Schmidt0a9170d2013-07-26 01:35:43 +0000242 bool IsPPC64 = TargetTriple.getArch() == llvm::Triple::ppc64 ||
243 TargetTriple.getArch() == llvm::Triple::ppc64le;
Kostya Serebryanybe733372013-02-12 11:11:02 +0000244 bool IsX86_64 = TargetTriple.getArch() == llvm::Triple::x86_64;
Kostya Serebryany9e62b302013-06-03 14:46:56 +0000245 bool IsMIPS32 = TargetTriple.getArch() == llvm::Triple::mips ||
246 TargetTriple.getArch() == llvm::Triple::mipsel;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000247
248 ShadowMapping Mapping;
249
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000250 // OR-ing shadow offset if more efficient (at least on x86),
251 // but on ppc64 we have to use add since the shadow offset is not neccesary
252 // 1/8-th of the address space.
Kostya Serebryanyc5f44bc2013-02-11 14:36:01 +0000253 Mapping.OrShadowOffset = !IsPPC64 && !ClShort64BitOffset;
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000254
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000255 Mapping.Offset = (IsAndroid || ZeroBaseShadow) ? 0 :
Kostya Serebryany9e62b302013-06-03 14:46:56 +0000256 (LongSize == 32 ?
257 (IsMIPS32 ? kMIPS32_ShadowOffset32 : kDefaultShadowOffset32) :
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000258 IsPPC64 ? kPPC64_ShadowOffset64 : kDefaultShadowOffset64);
Alexander Potapenko259e8122013-02-12 12:41:12 +0000259 if (!ZeroBaseShadow && ClShort64BitOffset && IsX86_64 && !IsMacOSX) {
Kostya Serebryanybe733372013-02-12 11:11:02 +0000260 assert(LongSize == 64);
Kostya Serebryanyc5f44bc2013-02-11 14:36:01 +0000261 Mapping.Offset = kDefaultShort64bitShadowOffset;
Kostya Serebryanycaf11af2013-02-13 05:14:12 +0000262 }
263 if (!ZeroBaseShadow && ClMappingOffsetLog >= 0) {
Alexey Samsonov1345d352013-01-16 13:23:28 +0000264 // Zero offset log is the special case.
265 Mapping.Offset = (ClMappingOffsetLog == 0) ? 0 : 1ULL << ClMappingOffsetLog;
266 }
267
268 Mapping.Scale = kDefaultShadowScale;
269 if (ClMappingScale) {
270 Mapping.Scale = ClMappingScale;
271 }
272
273 return Mapping;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000274}
275
/// Returns the redzone size in bytes for the given shadow scale:
/// the larger of 32 and (1 << MappingScale).
static size_t RedzoneSizeForScale(int MappingScale) {
  // The redzone used for stack and globals is never smaller than 32 bytes.
  const unsigned MinRedzone = 32U;
  // Scales 6 and 7 need 64 and 128 bytes respectively.
  const unsigned Granularity = 1U << MappingScale;
  return Granularity > MinRedzone ? Granularity : MinRedzone;
}
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000281
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000282/// AddressSanitizer: instrument the code in module to find memory bugs.
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000283struct AddressSanitizer : public FunctionPass {
Alexey Samsonov819eddc2013-03-14 12:38:58 +0000284 AddressSanitizer(bool CheckInitOrder = true,
Alexey Samsonovdf624522012-11-29 18:14:24 +0000285 bool CheckUseAfterReturn = false,
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000286 bool CheckLifetime = false,
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000287 StringRef BlacklistFile = StringRef(),
288 bool ZeroBaseShadow = false)
Alexey Samsonovdf624522012-11-29 18:14:24 +0000289 : FunctionPass(ID),
290 CheckInitOrder(CheckInitOrder || ClInitializers),
291 CheckUseAfterReturn(CheckUseAfterReturn || ClUseAfterReturn),
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000292 CheckLifetime(CheckLifetime || ClCheckLifetime),
293 BlacklistFile(BlacklistFile.empty() ? ClBlacklistFile
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000294 : BlacklistFile),
295 ZeroBaseShadow(ZeroBaseShadow) {}
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000296 virtual const char *getPassName() const {
297 return "AddressSanitizerFunctionPass";
298 }
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000299 void instrumentMop(Instruction *I);
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000300 void instrumentAddress(Instruction *OrigIns, Instruction *InsertBefore,
301 Value *Addr, uint32_t TypeSize, bool IsWrite,
302 Value *SizeArgument);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000303 Value *createSlowPathCmp(IRBuilder<> &IRB, Value *AddrLong,
304 Value *ShadowValue, uint32_t TypeSize);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000305 Instruction *generateCrashCode(Instruction *InsertBefore, Value *Addr,
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000306 bool IsWrite, size_t AccessSizeIndex,
307 Value *SizeArgument);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000308 bool instrumentMemIntrinsic(MemIntrinsic *MI);
309 void instrumentMemIntrinsicParam(Instruction *OrigIns, Value *Addr,
Kostya Serebryany874dae62012-07-16 16:15:40 +0000310 Value *Size,
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000311 Instruction *InsertBefore, bool IsWrite);
312 Value *memToShadow(Value *Shadow, IRBuilder<> &IRB);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000313 bool runOnFunction(Function &F);
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +0000314 bool maybeInsertAsanInitAtFunctionEntry(Function &F);
Alexey Samsonov1345d352013-01-16 13:23:28 +0000315 void emitShadowMapping(Module &M, IRBuilder<> &IRB) const;
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000316 virtual bool doInitialization(Module &M);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000317 static char ID; // Pass identification, replacement for typeid
318
319 private:
Kostya Serebryany4b929da2012-11-29 09:54:21 +0000320 void initializeCallbacks(Module &M);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000321
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000322 bool ShouldInstrumentGlobal(GlobalVariable *G);
Kostya Serebryany1cdc6e92011-11-18 01:41:06 +0000323 bool LooksLikeCodeInBug11395(Instruction *I);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000324 void FindDynamicInitializers(Module &M);
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000325 bool GlobalIsLinkerInitialized(GlobalVariable *G);
Bob Wilsonda4147c2013-11-15 07:16:09 +0000326 bool InjectCoverage(Function &F);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000327
Alexey Samsonovdf624522012-11-29 18:14:24 +0000328 bool CheckInitOrder;
329 bool CheckUseAfterReturn;
330 bool CheckLifetime;
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000331 SmallString<64> BlacklistFile;
332 bool ZeroBaseShadow;
333
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000334 LLVMContext *C;
Micah Villmowcdfe20b2012-10-08 16:38:25 +0000335 DataLayout *TD;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000336 int LongSize;
337 Type *IntptrTy;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000338 ShadowMapping Mapping;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000339 Function *AsanCtorFunction;
340 Function *AsanInitFunction;
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000341 Function *AsanHandleNoReturnFunc;
Bob Wilsonda4147c2013-11-15 07:16:09 +0000342 Function *AsanCovFunction;
Peter Collingbourne015370e2013-07-09 22:02:49 +0000343 OwningPtr<SpecialCaseList> BL;
Kostya Serebryany4273bb02012-07-16 14:09:42 +0000344 // This array is indexed by AccessIsWrite and log2(AccessSize).
345 Function *AsanErrorCallback[2][kNumberOfAccessSizes];
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000346 // This array is indexed by AccessIsWrite.
347 Function *AsanErrorCallbackSized[2];
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000348 InlineAsm *EmptyAsm;
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000349 SetOfDynamicallyInitializedGlobals DynamicallyInitializedGlobals;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000350
351 friend struct FunctionStackPoisoner;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000352};
Kostya Serebryany874dae62012-07-16 16:15:40 +0000353
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000354class AddressSanitizerModule : public ModulePass {
Kostya Serebryany20a79972012-11-22 03:18:50 +0000355 public:
Alexey Samsonov819eddc2013-03-14 12:38:58 +0000356 AddressSanitizerModule(bool CheckInitOrder = true,
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000357 StringRef BlacklistFile = StringRef(),
358 bool ZeroBaseShadow = false)
Alexey Samsonovdf624522012-11-29 18:14:24 +0000359 : ModulePass(ID),
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000360 CheckInitOrder(CheckInitOrder || ClInitializers),
361 BlacklistFile(BlacklistFile.empty() ? ClBlacklistFile
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000362 : BlacklistFile),
363 ZeroBaseShadow(ZeroBaseShadow) {}
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000364 bool runOnModule(Module &M);
365 static char ID; // Pass identification, replacement for typeid
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000366 virtual const char *getPassName() const {
367 return "AddressSanitizerModule";
368 }
Alexey Samsonov261177a2012-12-04 01:34:23 +0000369
Kostya Serebryany20a79972012-11-22 03:18:50 +0000370 private:
Alexey Samsonov788381b2012-12-25 12:28:20 +0000371 void initializeCallbacks(Module &M);
372
Kostya Serebryany20a79972012-11-22 03:18:50 +0000373 bool ShouldInstrumentGlobal(GlobalVariable *G);
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000374 void createInitializerPoisonCalls(Module &M, GlobalValue *ModuleName);
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000375 size_t MinRedzoneSizeForGlobal() const {
Alexey Samsonov1345d352013-01-16 13:23:28 +0000376 return RedzoneSizeForScale(Mapping.Scale);
377 }
Kostya Serebryany20a79972012-11-22 03:18:50 +0000378
Alexey Samsonovdf624522012-11-29 18:14:24 +0000379 bool CheckInitOrder;
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000380 SmallString<64> BlacklistFile;
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000381 bool ZeroBaseShadow;
382
Peter Collingbourne015370e2013-07-09 22:02:49 +0000383 OwningPtr<SpecialCaseList> BL;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000384 SetOfDynamicallyInitializedGlobals DynamicallyInitializedGlobals;
385 Type *IntptrTy;
386 LLVMContext *C;
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000387 DataLayout *TD;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000388 ShadowMapping Mapping;
Alexey Samsonov788381b2012-12-25 12:28:20 +0000389 Function *AsanPoisonGlobals;
390 Function *AsanUnpoisonGlobals;
391 Function *AsanRegisterGlobals;
392 Function *AsanUnregisterGlobals;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000393};
394
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000395// Stack poisoning does not play well with exception handling.
396// When an exception is thrown, we essentially bypass the code
397// that unpoisones the stack. This is why the run-time library has
398// to intercept __cxa_throw (as well as longjmp, etc) and unpoison the entire
399// stack in the interceptor. This however does not work inside the
400// actual function which catches the exception. Most likely because the
401// compiler hoists the load of the shadow value somewhere too high.
402// This causes asan to report a non-existing bug on 453.povray.
403// It sounds like an LLVM bug.
404struct FunctionStackPoisoner : public InstVisitor<FunctionStackPoisoner> {
405 Function &F;
406 AddressSanitizer &ASan;
407 DIBuilder DIB;
408 LLVMContext *C;
409 Type *IntptrTy;
410 Type *IntptrPtrTy;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000411 ShadowMapping Mapping;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000412
413 SmallVector<AllocaInst*, 16> AllocaVec;
414 SmallVector<Instruction*, 8> RetVec;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000415 unsigned StackAlignment;
416
Kostya Serebryany6805de52013-09-10 13:16:56 +0000417 Function *AsanStackMallocFunc[kMaxAsanStackMallocSizeClass + 1],
418 *AsanStackFreeFunc[kMaxAsanStackMallocSizeClass + 1];
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000419 Function *AsanPoisonStackMemoryFunc, *AsanUnpoisonStackMemoryFunc;
420
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000421 // Stores a place and arguments of poisoning/unpoisoning call for alloca.
422 struct AllocaPoisonCall {
423 IntrinsicInst *InsBefore;
Alexey Samsonova788b942013-11-18 14:53:55 +0000424 AllocaInst *AI;
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000425 uint64_t Size;
426 bool DoPoison;
427 };
428 SmallVector<AllocaPoisonCall, 8> AllocaPoisonCallVec;
429
430 // Maps Value to an AllocaInst from which the Value is originated.
431 typedef DenseMap<Value*, AllocaInst*> AllocaForValueMapTy;
432 AllocaForValueMapTy AllocaForValue;
433
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000434 FunctionStackPoisoner(Function &F, AddressSanitizer &ASan)
435 : F(F), ASan(ASan), DIB(*F.getParent()), C(ASan.C),
436 IntptrTy(ASan.IntptrTy), IntptrPtrTy(PointerType::get(IntptrTy, 0)),
Alexey Samsonov1345d352013-01-16 13:23:28 +0000437 Mapping(ASan.Mapping),
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000438 StackAlignment(1 << Mapping.Scale) {}
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000439
440 bool runOnFunction() {
441 if (!ClStack) return false;
442 // Collect alloca, ret, lifetime instructions etc.
443 for (df_iterator<BasicBlock*> DI = df_begin(&F.getEntryBlock()),
444 DE = df_end(&F.getEntryBlock()); DI != DE; ++DI) {
445 BasicBlock *BB = *DI;
446 visit(*BB);
447 }
448 if (AllocaVec.empty()) return false;
449
450 initializeCallbacks(*F.getParent());
451
452 poisonStack();
453
454 if (ClDebugStack) {
455 DEBUG(dbgs() << F);
456 }
457 return true;
458 }
459
460 // Finds all static Alloca instructions and puts
461 // poisoned red zones around all of them.
462 // Then unpoison everything back before the function returns.
463 void poisonStack();
464
465 // ----------------------- Visitors.
466 /// \brief Collect all Ret instructions.
467 void visitReturnInst(ReturnInst &RI) {
468 RetVec.push_back(&RI);
469 }
470
471 /// \brief Collect Alloca instructions we want (and can) handle.
472 void visitAllocaInst(AllocaInst &AI) {
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000473 if (!isInterestingAlloca(AI)) return;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000474
475 StackAlignment = std::max(StackAlignment, AI.getAlignment());
476 AllocaVec.push_back(&AI);
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000477 }
478
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000479 /// \brief Collect lifetime intrinsic calls to check for use-after-scope
480 /// errors.
481 void visitIntrinsicInst(IntrinsicInst &II) {
482 if (!ASan.CheckLifetime) return;
483 Intrinsic::ID ID = II.getIntrinsicID();
484 if (ID != Intrinsic::lifetime_start &&
485 ID != Intrinsic::lifetime_end)
486 return;
487 // Found lifetime intrinsic, add ASan instrumentation if necessary.
488 ConstantInt *Size = dyn_cast<ConstantInt>(II.getArgOperand(0));
489 // If size argument is undefined, don't do anything.
490 if (Size->isMinusOne()) return;
491 // Check that size doesn't saturate uint64_t and can
492 // be stored in IntptrTy.
493 const uint64_t SizeValue = Size->getValue().getLimitedValue();
494 if (SizeValue == ~0ULL ||
495 !ConstantInt::isValueValidForType(IntptrTy, SizeValue))
496 return;
497 // Find alloca instruction that corresponds to llvm.lifetime argument.
498 AllocaInst *AI = findAllocaForValue(II.getArgOperand(1));
499 if (!AI) return;
500 bool DoPoison = (ID == Intrinsic::lifetime_end);
Alexey Samsonova788b942013-11-18 14:53:55 +0000501 AllocaPoisonCall APC = {&II, AI, SizeValue, DoPoison};
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000502 AllocaPoisonCallVec.push_back(APC);
503 }
504
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000505 // ---------------------- Helpers.
506 void initializeCallbacks(Module &M);
507
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000508 // Check if we want (and can) handle this alloca.
Jakub Staszak23ec6a92013-08-09 20:53:48 +0000509 bool isInterestingAlloca(AllocaInst &AI) const {
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000510 return (!AI.isArrayAllocation() && AI.isStaticAlloca() &&
511 AI.getAllocatedType()->isSized() &&
512 // alloca() may be called with 0 size, ignore it.
513 getAllocaSizeInBytes(&AI) > 0);
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000514 }
515
Jakub Staszak23ec6a92013-08-09 20:53:48 +0000516 uint64_t getAllocaSizeInBytes(AllocaInst *AI) const {
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000517 Type *Ty = AI->getAllocatedType();
518 uint64_t SizeInBytes = ASan.TD->getTypeAllocSize(Ty);
519 return SizeInBytes;
520 }
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000521 /// Finds alloca where the value comes from.
522 AllocaInst *findAllocaForValue(Value *V);
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000523 void poisonRedZones(const ArrayRef<uint8_t> ShadowBytes, IRBuilder<> &IRB,
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000524 Value *ShadowBase, bool DoPoison);
Jakub Staszak23ec6a92013-08-09 20:53:48 +0000525 void poisonAlloca(Value *V, uint64_t Size, IRBuilder<> &IRB, bool DoPoison);
Kostya Serebryanybc86efb2013-09-17 12:14:50 +0000526
527 void SetShadowToStackAfterReturnInlined(IRBuilder<> &IRB, Value *ShadowBase,
528 int Size);
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000529};
530
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000531} // namespace
532
533char AddressSanitizer::ID = 0;
534INITIALIZE_PASS(AddressSanitizer, "asan",
535 "AddressSanitizer: detects use-after-free and out-of-bounds bugs.",
536 false, false)
Alexey Samsonovdf624522012-11-29 18:14:24 +0000537FunctionPass *llvm::createAddressSanitizerFunctionPass(
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000538 bool CheckInitOrder, bool CheckUseAfterReturn, bool CheckLifetime,
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000539 StringRef BlacklistFile, bool ZeroBaseShadow) {
Alexey Samsonovdf624522012-11-29 18:14:24 +0000540 return new AddressSanitizer(CheckInitOrder, CheckUseAfterReturn,
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000541 CheckLifetime, BlacklistFile, ZeroBaseShadow);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000542}
543
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000544char AddressSanitizerModule::ID = 0;
545INITIALIZE_PASS(AddressSanitizerModule, "asan-module",
546 "AddressSanitizer: detects use-after-free and out-of-bounds bugs."
547 "ModulePass", false, false)
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000548ModulePass *llvm::createAddressSanitizerModulePass(
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000549 bool CheckInitOrder, StringRef BlacklistFile, bool ZeroBaseShadow) {
550 return new AddressSanitizerModule(CheckInitOrder, BlacklistFile,
551 ZeroBaseShadow);
Alexander Potapenkoc94cf8f2012-01-23 11:22:43 +0000552}
553
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000554static size_t TypeSizeToSizeIndex(uint32_t TypeSize) {
Michael J. Spencerdf1ecbd72013-05-24 22:23:49 +0000555 size_t Res = countTrailingZeros(TypeSize / 8);
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000556 assert(Res < kNumberOfAccessSizes);
557 return Res;
558}
559
Bill Wendling58f8cef2013-08-06 22:52:42 +0000560// \brief Create a constant for Str so that we can pass it to the run-time lib.
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000561static GlobalVariable *createPrivateGlobalForString(
562 Module &M, StringRef Str, bool AllowMerging) {
Chris Lattnercf9e8f62012-02-05 02:29:43 +0000563 Constant *StrConst = ConstantDataArray::getString(M.getContext(), Str);
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000564 // For module-local strings that can be merged with another one we set the
565 // internal linkage and the unnamed_addr attribute.
566 // Non-mergeable strings are made linker_private to remove them from the
567 // symbol table. "private" linkage doesn't work for Darwin, where the
568 // "L"-prefixed globals end up in __TEXT,__const section
569 // (see http://llvm.org/bugs/show_bug.cgi?id=17976 for more info).
570 GlobalValue::LinkageTypes linkage =
571 AllowMerging ? GlobalValue::InternalLinkage
572 : GlobalValue::LinkerPrivateLinkage;
573 GlobalVariable *GV =
574 new GlobalVariable(M, StrConst->getType(), true,
575 linkage, StrConst, kAsanGenPrefix);
576 if (AllowMerging) GV->setUnnamedAddr(true);
Kostya Serebryany10cc12f2013-03-18 09:38:39 +0000577 GV->setAlignment(1); // Strings may not be merged w/o setting align 1.
578 return GV;
Kostya Serebryany139a9372012-11-20 14:16:08 +0000579}
580
581static bool GlobalWasGeneratedByAsan(GlobalVariable *G) {
582 return G->getName().find(kAsanGenPrefix) == 0;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000583}
584
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000585Value *AddressSanitizer::memToShadow(Value *Shadow, IRBuilder<> &IRB) {
586 // Shadow >> scale
Alexey Samsonov1345d352013-01-16 13:23:28 +0000587 Shadow = IRB.CreateLShr(Shadow, Mapping.Scale);
588 if (Mapping.Offset == 0)
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000589 return Shadow;
590 // (Shadow >> scale) | offset
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000591 if (Mapping.OrShadowOffset)
592 return IRB.CreateOr(Shadow, ConstantInt::get(IntptrTy, Mapping.Offset));
593 else
594 return IRB.CreateAdd(Shadow, ConstantInt::get(IntptrTy, Mapping.Offset));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000595}
596
Kostya Serebryany874dae62012-07-16 16:15:40 +0000597void AddressSanitizer::instrumentMemIntrinsicParam(
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000598 Instruction *OrigIns,
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000599 Value *Addr, Value *Size, Instruction *InsertBefore, bool IsWrite) {
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000600 IRBuilder<> IRB(InsertBefore);
601 if (Size->getType() != IntptrTy)
602 Size = IRB.CreateIntCast(Size, IntptrTy, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000603 // Check the first byte.
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000604 instrumentAddress(OrigIns, InsertBefore, Addr, 8, IsWrite, Size);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000605 // Check the last byte.
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000606 IRB.SetInsertPoint(InsertBefore);
607 Value *SizeMinusOne = IRB.CreateSub(Size, ConstantInt::get(IntptrTy, 1));
608 Value *AddrLong = IRB.CreatePointerCast(Addr, IntptrTy);
609 Value *AddrLast = IRB.CreateAdd(AddrLong, SizeMinusOne);
610 instrumentAddress(OrigIns, InsertBefore, AddrLast, 8, IsWrite, Size);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000611}
612
613// Instrument memset/memmove/memcpy
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000614bool AddressSanitizer::instrumentMemIntrinsic(MemIntrinsic *MI) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000615 Value *Dst = MI->getDest();
616 MemTransferInst *MemTran = dyn_cast<MemTransferInst>(MI);
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000617 Value *Src = MemTran ? MemTran->getSource() : 0;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000618 Value *Length = MI->getLength();
619
620 Constant *ConstLength = dyn_cast<Constant>(Length);
621 Instruction *InsertBefore = MI;
622 if (ConstLength) {
623 if (ConstLength->isNullValue()) return false;
624 } else {
625 // The size is not a constant so it could be zero -- check at run-time.
626 IRBuilder<> IRB(InsertBefore);
627
628 Value *Cmp = IRB.CreateICmpNE(Length,
Kostya Serebryanyeeaf6882012-07-02 11:42:29 +0000629 Constant::getNullValue(Length->getType()));
Evgeniy Stepanova9164e92013-12-19 13:29:56 +0000630 InsertBefore = SplitBlockAndInsertIfThen(Cmp, InsertBefore, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000631 }
632
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000633 instrumentMemIntrinsicParam(MI, Dst, Length, InsertBefore, true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000634 if (Src)
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000635 instrumentMemIntrinsicParam(MI, Src, Length, InsertBefore, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000636 return true;
637}
638
Kostya Serebryany90241602012-05-30 09:04:06 +0000639// If I is an interesting memory access, return the PointerOperand
640// and set IsWrite. Otherwise return NULL.
641static Value *isInterestingMemoryAccess(Instruction *I, bool *IsWrite) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000642 if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
Kostya Serebryany90241602012-05-30 09:04:06 +0000643 if (!ClInstrumentReads) return NULL;
644 *IsWrite = false;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000645 return LI->getPointerOperand();
646 }
Kostya Serebryany90241602012-05-30 09:04:06 +0000647 if (StoreInst *SI = dyn_cast<StoreInst>(I)) {
648 if (!ClInstrumentWrites) return NULL;
649 *IsWrite = true;
650 return SI->getPointerOperand();
651 }
652 if (AtomicRMWInst *RMW = dyn_cast<AtomicRMWInst>(I)) {
653 if (!ClInstrumentAtomics) return NULL;
654 *IsWrite = true;
655 return RMW->getPointerOperand();
656 }
657 if (AtomicCmpXchgInst *XCHG = dyn_cast<AtomicCmpXchgInst>(I)) {
658 if (!ClInstrumentAtomics) return NULL;
659 *IsWrite = true;
660 return XCHG->getPointerOperand();
661 }
662 return NULL;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000663}
664
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000665bool AddressSanitizer::GlobalIsLinkerInitialized(GlobalVariable *G) {
666 // If a global variable does not have dynamic initialization we don't
667 // have to instrument it. However, if a global does not have initializer
668 // at all, we assume it has dynamic initializer (in other TU).
669 return G->hasInitializer() && !DynamicallyInitializedGlobals.Contains(G);
670}
671
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000672void AddressSanitizer::instrumentMop(Instruction *I) {
Axel Naumann4a127062012-09-17 14:20:57 +0000673 bool IsWrite = false;
Kostya Serebryany90241602012-05-30 09:04:06 +0000674 Value *Addr = isInterestingMemoryAccess(I, &IsWrite);
675 assert(Addr);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000676 if (ClOpt && ClOptGlobals) {
677 if (GlobalVariable *G = dyn_cast<GlobalVariable>(Addr)) {
678 // If initialization order checking is disabled, a simple access to a
679 // dynamically initialized global is always valid.
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000680 if (!CheckInitOrder || GlobalIsLinkerInitialized(G)) {
681 NumOptimizedAccessesToGlobalVar++;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000682 return;
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000683 }
684 }
685 ConstantExpr *CE = dyn_cast<ConstantExpr>(Addr);
686 if (CE && CE->isGEPWithNoNotionalOverIndexing()) {
687 if (GlobalVariable *G = dyn_cast<GlobalVariable>(CE->getOperand(0))) {
688 if (CE->getOperand(1)->isNullValue() && GlobalIsLinkerInitialized(G)) {
689 NumOptimizedAccessesToGlobalArray++;
690 return;
691 }
692 }
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000693 }
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000694 }
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000695
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000696 Type *OrigPtrTy = Addr->getType();
697 Type *OrigTy = cast<PointerType>(OrigPtrTy)->getElementType();
698
699 assert(OrigTy->isSized());
Kostya Serebryany7ca384b2013-02-18 13:47:02 +0000700 uint32_t TypeSize = TD->getTypeStoreSizeInBits(OrigTy);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000701
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000702 assert((TypeSize % 8) == 0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000703
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000704 if (IsWrite)
705 NumInstrumentedWrites++;
706 else
707 NumInstrumentedReads++;
708
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000709 // Instrument a 1-, 2-, 4-, 8-, or 16- byte access with one check.
710 if (TypeSize == 8 || TypeSize == 16 ||
711 TypeSize == 32 || TypeSize == 64 || TypeSize == 128)
712 return instrumentAddress(I, I, Addr, TypeSize, IsWrite, 0);
713 // Instrument unusual size (but still multiple of 8).
714 // We can not do it with a single check, so we do 1-byte check for the first
715 // and the last bytes. We call __asan_report_*_n(addr, real_size) to be able
716 // to report the actual access size.
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000717 IRBuilder<> IRB(I);
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000718 Value *LastByte = IRB.CreateIntToPtr(
719 IRB.CreateAdd(IRB.CreatePointerCast(Addr, IntptrTy),
720 ConstantInt::get(IntptrTy, TypeSize / 8 - 1)),
721 OrigPtrTy);
722 Value *Size = ConstantInt::get(IntptrTy, TypeSize / 8);
723 instrumentAddress(I, I, Addr, 8, IsWrite, Size);
724 instrumentAddress(I, I, LastByte, 8, IsWrite, Size);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000725}
726
Alexander Potapenko056e27e2012-04-23 10:47:31 +0000727// Validate the result of Module::getOrInsertFunction called for an interface
728// function of AddressSanitizer. If the instrumented module defines a function
729// with the same name, their prototypes must match, otherwise
730// getOrInsertFunction returns a bitcast.
Kostya Serebryany20a79972012-11-22 03:18:50 +0000731static Function *checkInterfaceFunction(Constant *FuncOrBitcast) {
Alexander Potapenko056e27e2012-04-23 10:47:31 +0000732 if (isa<Function>(FuncOrBitcast)) return cast<Function>(FuncOrBitcast);
733 FuncOrBitcast->dump();
734 report_fatal_error("trying to redefine an AddressSanitizer "
735 "interface function");
736}
737
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000738Instruction *AddressSanitizer::generateCrashCode(
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000739 Instruction *InsertBefore, Value *Addr,
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000740 bool IsWrite, size_t AccessSizeIndex, Value *SizeArgument) {
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000741 IRBuilder<> IRB(InsertBefore);
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000742 CallInst *Call = SizeArgument
743 ? IRB.CreateCall2(AsanErrorCallbackSized[IsWrite], Addr, SizeArgument)
744 : IRB.CreateCall(AsanErrorCallback[IsWrite][AccessSizeIndex], Addr);
745
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000746 // We don't do Call->setDoesNotReturn() because the BB already has
747 // UnreachableInst at the end.
748 // This EmptyAsm is required to avoid callback merge.
749 IRB.CreateCall(EmptyAsm);
Kostya Serebryany3411f2e2012-01-06 18:09:21 +0000750 return Call;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000751}
752
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000753Value *AddressSanitizer::createSlowPathCmp(IRBuilder<> &IRB, Value *AddrLong,
Kostya Serebryany874dae62012-07-16 16:15:40 +0000754 Value *ShadowValue,
755 uint32_t TypeSize) {
Alexey Samsonov1345d352013-01-16 13:23:28 +0000756 size_t Granularity = 1 << Mapping.Scale;
Kostya Serebryany874dae62012-07-16 16:15:40 +0000757 // Addr & (Granularity - 1)
758 Value *LastAccessedByte = IRB.CreateAnd(
759 AddrLong, ConstantInt::get(IntptrTy, Granularity - 1));
760 // (Addr & (Granularity - 1)) + size - 1
761 if (TypeSize / 8 > 1)
762 LastAccessedByte = IRB.CreateAdd(
763 LastAccessedByte, ConstantInt::get(IntptrTy, TypeSize / 8 - 1));
764 // (uint8_t) ((Addr & (Granularity-1)) + size - 1)
765 LastAccessedByte = IRB.CreateIntCast(
Kostya Serebryany1e575ab2012-08-15 08:58:58 +0000766 LastAccessedByte, ShadowValue->getType(), false);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000767 // ((uint8_t) ((Addr & (Granularity-1)) + size - 1)) >= ShadowValue
768 return IRB.CreateICmpSGE(LastAccessedByte, ShadowValue);
769}
770
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000771void AddressSanitizer::instrumentAddress(Instruction *OrigIns,
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000772 Instruction *InsertBefore,
773 Value *Addr, uint32_t TypeSize,
774 bool IsWrite, Value *SizeArgument) {
775 IRBuilder<> IRB(InsertBefore);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000776 Value *AddrLong = IRB.CreatePointerCast(Addr, IntptrTy);
777
778 Type *ShadowTy = IntegerType::get(
Alexey Samsonov1345d352013-01-16 13:23:28 +0000779 *C, std::max(8U, TypeSize >> Mapping.Scale));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000780 Type *ShadowPtrTy = PointerType::get(ShadowTy, 0);
781 Value *ShadowPtr = memToShadow(AddrLong, IRB);
782 Value *CmpVal = Constant::getNullValue(ShadowTy);
783 Value *ShadowValue = IRB.CreateLoad(
784 IRB.CreateIntToPtr(ShadowPtr, ShadowPtrTy));
785
786 Value *Cmp = IRB.CreateICmpNE(ShadowValue, CmpVal);
Kostya Serebryany0f7a80d2012-08-13 14:08:46 +0000787 size_t AccessSizeIndex = TypeSizeToSizeIndex(TypeSize);
Alexey Samsonov1345d352013-01-16 13:23:28 +0000788 size_t Granularity = 1 << Mapping.Scale;
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000789 TerminatorInst *CrashTerm = 0;
790
Kostya Serebryany1e575ab2012-08-15 08:58:58 +0000791 if (ClAlwaysSlowPath || (TypeSize < 8 * Granularity)) {
Evgeniy Stepanov8eb77d82012-10-19 10:48:31 +0000792 TerminatorInst *CheckTerm =
Evgeniy Stepanova9164e92013-12-19 13:29:56 +0000793 SplitBlockAndInsertIfThen(Cmp, InsertBefore, false);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000794 assert(dyn_cast<BranchInst>(CheckTerm)->isUnconditional());
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000795 BasicBlock *NextBB = CheckTerm->getSuccessor(0);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000796 IRB.SetInsertPoint(CheckTerm);
797 Value *Cmp2 = createSlowPathCmp(IRB, AddrLong, ShadowValue, TypeSize);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000798 BasicBlock *CrashBlock =
799 BasicBlock::Create(*C, "", NextBB->getParent(), NextBB);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000800 CrashTerm = new UnreachableInst(*C, CrashBlock);
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000801 BranchInst *NewTerm = BranchInst::Create(CrashBlock, NextBB, Cmp2);
802 ReplaceInstWithInst(CheckTerm, NewTerm);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000803 } else {
Evgeniy Stepanova9164e92013-12-19 13:29:56 +0000804 CrashTerm = SplitBlockAndInsertIfThen(Cmp, InsertBefore, true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000805 }
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000806
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000807 Instruction *Crash = generateCrashCode(
808 CrashTerm, AddrLong, IsWrite, AccessSizeIndex, SizeArgument);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000809 Crash->setDebugLoc(OrigIns->getDebugLoc());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000810}
811
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000812void AddressSanitizerModule::createInitializerPoisonCalls(
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000813 Module &M, GlobalValue *ModuleName) {
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000814 // We do all of our poisoning and unpoisoning within _GLOBAL__I_a.
815 Function *GlobalInit = M.getFunction("_GLOBAL__I_a");
816 // If that function is not present, this TU contains no globals, or they have
817 // all been optimized away
818 if (!GlobalInit)
819 return;
820
821 // Set up the arguments to our poison/unpoison functions.
822 IRBuilder<> IRB(GlobalInit->begin()->getFirstInsertionPt());
823
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000824 // Add a call to poison all external globals before the given function starts.
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000825 Value *ModuleNameAddr = ConstantExpr::getPointerCast(ModuleName, IntptrTy);
826 IRB.CreateCall(AsanPoisonGlobals, ModuleNameAddr);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000827
828 // Add calls to unpoison all globals before each return instruction.
829 for (Function::iterator I = GlobalInit->begin(), E = GlobalInit->end();
830 I != E; ++I) {
831 if (ReturnInst *RI = dyn_cast<ReturnInst>(I->getTerminator())) {
832 CallInst::Create(AsanUnpoisonGlobals, "", RI);
833 }
834 }
835}
836
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000837bool AddressSanitizerModule::ShouldInstrumentGlobal(GlobalVariable *G) {
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000838 Type *Ty = cast<PointerType>(G->getType())->getElementType();
Kostya Serebryany20343352012-10-17 13:40:06 +0000839 DEBUG(dbgs() << "GLOBAL: " << *G << "\n");
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000840
Kostya Serebryany2fa38f82012-09-05 07:29:56 +0000841 if (BL->isIn(*G)) return false;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000842 if (!Ty->isSized()) return false;
843 if (!G->hasInitializer()) return false;
Kostya Serebryany139a9372012-11-20 14:16:08 +0000844 if (GlobalWasGeneratedByAsan(G)) return false; // Our own global.
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000845 // Touch only those globals that will not be defined in other modules.
846 // Don't handle ODR type linkages since other modules may be built w/o asan.
847 if (G->getLinkage() != GlobalVariable::ExternalLinkage &&
848 G->getLinkage() != GlobalVariable::PrivateLinkage &&
849 G->getLinkage() != GlobalVariable::InternalLinkage)
850 return false;
851 // Two problems with thread-locals:
852 // - The address of the main thread's copy can't be computed at link-time.
853 // - Need to poison all copies, not just the main thread's one.
854 if (G->isThreadLocal())
855 return false;
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000856 // For now, just ignore this Global if the alignment is large.
857 if (G->getAlignment() > MinRedzoneSizeForGlobal()) return false;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000858
859 // Ignore all the globals with the names starting with "\01L_OBJC_".
860 // Many of those are put into the .cstring section. The linker compresses
861 // that section by removing the spare \0s after the string terminator, so
862 // our redzones get broken.
863 if ((G->getName().find("\01L_OBJC_") == 0) ||
864 (G->getName().find("\01l_OBJC_") == 0)) {
865 DEBUG(dbgs() << "Ignoring \\01L_OBJC_* global: " << *G);
866 return false;
867 }
868
869 if (G->hasSection()) {
870 StringRef Section(G->getSection());
871 // Ignore the globals from the __OBJC section. The ObjC runtime assumes
872 // those conform to /usr/lib/objc/runtime.h, so we can't add redzones to
873 // them.
874 if ((Section.find("__OBJC,") == 0) ||
875 (Section.find("__DATA, __objc_") == 0)) {
876 DEBUG(dbgs() << "Ignoring ObjC runtime global: " << *G);
877 return false;
878 }
879 // See http://code.google.com/p/address-sanitizer/issues/detail?id=32
880 // Constant CFString instances are compiled in the following way:
881 // -- the string buffer is emitted into
882 // __TEXT,__cstring,cstring_literals
883 // -- the constant NSConstantString structure referencing that buffer
884 // is placed into __DATA,__cfstring
885 // Therefore there's no point in placing redzones into __DATA,__cfstring.
886 // Moreover, it causes the linker to crash on OS X 10.7
887 if (Section.find("__DATA,__cfstring") == 0) {
888 DEBUG(dbgs() << "Ignoring CFString: " << *G);
889 return false;
890 }
891 }
892
893 return true;
894}
895
Alexey Samsonov788381b2012-12-25 12:28:20 +0000896void AddressSanitizerModule::initializeCallbacks(Module &M) {
897 IRBuilder<> IRB(*C);
898 // Declare our poisoning and unpoisoning functions.
899 AsanPoisonGlobals = checkInterfaceFunction(M.getOrInsertFunction(
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000900 kAsanPoisonGlobalsName, IRB.getVoidTy(), IntptrTy, NULL));
Alexey Samsonov788381b2012-12-25 12:28:20 +0000901 AsanPoisonGlobals->setLinkage(Function::ExternalLinkage);
902 AsanUnpoisonGlobals = checkInterfaceFunction(M.getOrInsertFunction(
903 kAsanUnpoisonGlobalsName, IRB.getVoidTy(), NULL));
904 AsanUnpoisonGlobals->setLinkage(Function::ExternalLinkage);
905 // Declare functions that register/unregister globals.
906 AsanRegisterGlobals = checkInterfaceFunction(M.getOrInsertFunction(
907 kAsanRegisterGlobalsName, IRB.getVoidTy(),
908 IntptrTy, IntptrTy, NULL));
909 AsanRegisterGlobals->setLinkage(Function::ExternalLinkage);
910 AsanUnregisterGlobals = checkInterfaceFunction(M.getOrInsertFunction(
911 kAsanUnregisterGlobalsName,
912 IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
913 AsanUnregisterGlobals->setLinkage(Function::ExternalLinkage);
914}
915
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000916// This function replaces all global variables with new variables that have
917// trailing redzones. It also creates a function that poisons
918// redzones and inserts this function into llvm.global_ctors.
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000919bool AddressSanitizerModule::runOnModule(Module &M) {
920 if (!ClGlobals) return false;
921 TD = getAnalysisIfAvailable<DataLayout>();
922 if (!TD)
923 return false;
Alexey Samsonove4b5fb82013-08-12 11:46:09 +0000924 BL.reset(SpecialCaseList::createOrDie(BlacklistFile));
Alexey Samsonov9a956e82012-11-29 18:27:01 +0000925 if (BL->isIn(M)) return false;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000926 C = &(M.getContext());
Alexey Samsonov1345d352013-01-16 13:23:28 +0000927 int LongSize = TD->getPointerSizeInBits();
928 IntptrTy = Type::getIntNTy(*C, LongSize);
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000929 Mapping = getShadowMapping(M, LongSize, ZeroBaseShadow);
Alexey Samsonov788381b2012-12-25 12:28:20 +0000930 initializeCallbacks(M);
931 DynamicallyInitializedGlobals.Init(M);
Kostya Serebryany20a79972012-11-22 03:18:50 +0000932
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000933 SmallVector<GlobalVariable *, 16> GlobalsToChange;
934
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000935 for (Module::GlobalListType::iterator G = M.global_begin(),
936 E = M.global_end(); G != E; ++G) {
937 if (ShouldInstrumentGlobal(G))
938 GlobalsToChange.push_back(G);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000939 }
940
941 size_t n = GlobalsToChange.size();
942 if (n == 0) return false;
943
944 // A global is described by a structure
945 // size_t beg;
946 // size_t size;
947 // size_t size_with_redzone;
948 // const char *name;
Kostya Serebryanybd016bb2013-03-18 08:05:29 +0000949 // const char *module_name;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000950 // size_t has_dynamic_init;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000951 // We initialize an array of such structures and pass it to a run-time call.
952 StructType *GlobalStructTy = StructType::get(IntptrTy, IntptrTy,
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000953 IntptrTy, IntptrTy,
Kostya Serebryanybd016bb2013-03-18 08:05:29 +0000954 IntptrTy, IntptrTy, NULL);
Rafael Espindola44fee4e2013-10-01 13:32:03 +0000955 SmallVector<Constant *, 16> Initializers(n);
Kostya Serebryany20a79972012-11-22 03:18:50 +0000956
957 Function *CtorFunc = M.getFunction(kAsanModuleCtorName);
958 assert(CtorFunc);
959 IRBuilder<> IRB(CtorFunc->getEntryBlock().getTerminator());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000960
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000961 bool HasDynamicallyInitializedGlobals = false;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000962
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000963 // We shouldn't merge same module names, as this string serves as unique
964 // module ID in runtime.
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000965 GlobalVariable *ModuleName = createPrivateGlobalForString(
966 M, M.getModuleIdentifier(), /*AllowMerging*/false);
Kostya Serebryanybd016bb2013-03-18 08:05:29 +0000967
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000968 for (size_t i = 0; i < n; i++) {
Kostya Serebryanye35d59a2013-01-24 10:43:50 +0000969 static const uint64_t kMaxGlobalRedzone = 1 << 18;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000970 GlobalVariable *G = GlobalsToChange[i];
971 PointerType *PtrTy = cast<PointerType>(G->getType());
972 Type *Ty = PtrTy->getElementType();
Kostya Serebryany84a7f2e82012-03-21 15:28:50 +0000973 uint64_t SizeInBytes = TD->getTypeAllocSize(Ty);
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000974 uint64_t MinRZ = MinRedzoneSizeForGlobal();
Kostya Serebryany87191f62013-01-24 10:35:40 +0000975 // MinRZ <= RZ <= kMaxGlobalRedzone
976 // and trying to make RZ to be ~ 1/4 of SizeInBytes.
Kostya Serebryanye35d59a2013-01-24 10:43:50 +0000977 uint64_t RZ = std::max(MinRZ,
Kostya Serebryany87191f62013-01-24 10:35:40 +0000978 std::min(kMaxGlobalRedzone,
979 (SizeInBytes / MinRZ / 4) * MinRZ));
980 uint64_t RightRedzoneSize = RZ;
981 // Round up to MinRZ
982 if (SizeInBytes % MinRZ)
983 RightRedzoneSize += MinRZ - (SizeInBytes % MinRZ);
984 assert(((RightRedzoneSize + SizeInBytes) % MinRZ) == 0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000985 Type *RightRedZoneTy = ArrayType::get(IRB.getInt8Ty(), RightRedzoneSize);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000986 // Determine whether this global should be poisoned in initialization.
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000987 bool GlobalHasDynamicInitializer =
988 DynamicallyInitializedGlobals.Contains(G);
Kostya Serebryany2fa38f82012-09-05 07:29:56 +0000989 // Don't check initialization order if this global is blacklisted.
Peter Collingbourne49062a92013-07-09 22:03:17 +0000990 GlobalHasDynamicInitializer &= !BL->isIn(*G, "init");
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000991
992 StructType *NewTy = StructType::get(Ty, RightRedZoneTy, NULL);
993 Constant *NewInitializer = ConstantStruct::get(
994 NewTy, G->getInitializer(),
995 Constant::getNullValue(RightRedZoneTy), NULL);
996
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000997 GlobalVariable *Name =
998 createPrivateGlobalForString(M, G->getName(), /*AllowMerging*/true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000999
1000 // Create a new global variable with enough space for a redzone.
Bill Wendling58f8cef2013-08-06 22:52:42 +00001001 GlobalValue::LinkageTypes Linkage = G->getLinkage();
1002 if (G->isConstant() && Linkage == GlobalValue::PrivateLinkage)
1003 Linkage = GlobalValue::InternalLinkage;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001004 GlobalVariable *NewGlobal = new GlobalVariable(
Bill Wendling58f8cef2013-08-06 22:52:42 +00001005 M, NewTy, G->isConstant(), Linkage,
Hans Wennborgcbe34b42012-06-23 11:37:03 +00001006 NewInitializer, "", G, G->getThreadLocalMode());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001007 NewGlobal->copyAttributesFrom(G);
Kostya Serebryany87191f62013-01-24 10:35:40 +00001008 NewGlobal->setAlignment(MinRZ);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001009
1010 Value *Indices2[2];
1011 Indices2[0] = IRB.getInt32(0);
1012 Indices2[1] = IRB.getInt32(0);
1013
1014 G->replaceAllUsesWith(
Kostya Serebryany7471d132012-01-28 04:27:16 +00001015 ConstantExpr::getGetElementPtr(NewGlobal, Indices2, true));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001016 NewGlobal->takeName(G);
1017 G->eraseFromParent();
1018
1019 Initializers[i] = ConstantStruct::get(
1020 GlobalStructTy,
1021 ConstantExpr::getPointerCast(NewGlobal, IntptrTy),
1022 ConstantInt::get(IntptrTy, SizeInBytes),
1023 ConstantInt::get(IntptrTy, SizeInBytes + RightRedzoneSize),
1024 ConstantExpr::getPointerCast(Name, IntptrTy),
Kostya Serebryanybd016bb2013-03-18 08:05:29 +00001025 ConstantExpr::getPointerCast(ModuleName, IntptrTy),
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001026 ConstantInt::get(IntptrTy, GlobalHasDynamicInitializer),
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001027 NULL);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001028
1029 // Populate the first and last globals declared in this TU.
Alexey Samsonove1e26bf2013-03-26 13:05:41 +00001030 if (CheckInitOrder && GlobalHasDynamicInitializer)
1031 HasDynamicallyInitializedGlobals = true;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001032
Kostya Serebryany20343352012-10-17 13:40:06 +00001033 DEBUG(dbgs() << "NEW GLOBAL: " << *NewGlobal << "\n");
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001034 }
1035
1036 ArrayType *ArrayOfGlobalStructTy = ArrayType::get(GlobalStructTy, n);
1037 GlobalVariable *AllGlobals = new GlobalVariable(
Bill Wendling58f8cef2013-08-06 22:52:42 +00001038 M, ArrayOfGlobalStructTy, false, GlobalVariable::InternalLinkage,
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001039 ConstantArray::get(ArrayOfGlobalStructTy, Initializers), "");
1040
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001041 // Create calls for poisoning before initializers run and unpoisoning after.
Alexey Samsonove1e26bf2013-03-26 13:05:41 +00001042 if (CheckInitOrder && HasDynamicallyInitializedGlobals)
1043 createInitializerPoisonCalls(M, ModuleName);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001044 IRB.CreateCall2(AsanRegisterGlobals,
1045 IRB.CreatePointerCast(AllGlobals, IntptrTy),
1046 ConstantInt::get(IntptrTy, n));
1047
Kostya Serebryanycd1aba82011-12-15 21:59:03 +00001048 // We also need to unregister globals at the end, e.g. when a shared library
1049 // gets closed.
1050 Function *AsanDtorFunction = Function::Create(
1051 FunctionType::get(Type::getVoidTy(*C), false),
1052 GlobalValue::InternalLinkage, kAsanModuleDtorName, &M);
1053 BasicBlock *AsanDtorBB = BasicBlock::Create(*C, "", AsanDtorFunction);
1054 IRBuilder<> IRB_Dtor(ReturnInst::Create(*C, AsanDtorBB));
Kostya Serebryanycd1aba82011-12-15 21:59:03 +00001055 IRB_Dtor.CreateCall2(AsanUnregisterGlobals,
1056 IRB.CreatePointerCast(AllGlobals, IntptrTy),
1057 ConstantInt::get(IntptrTy, n));
1058 appendToGlobalDtors(M, AsanDtorFunction, kAsanCtorAndCtorPriority);
1059
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001060 DEBUG(dbgs() << M);
1061 return true;
1062}
1063
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001064void AddressSanitizer::initializeCallbacks(Module &M) {
1065 IRBuilder<> IRB(*C);
Kostya Serebryany4273bb02012-07-16 14:09:42 +00001066 // Create __asan_report* callbacks.
1067 for (size_t AccessIsWrite = 0; AccessIsWrite <= 1; AccessIsWrite++) {
1068 for (size_t AccessSizeIndex = 0; AccessSizeIndex < kNumberOfAccessSizes;
1069 AccessSizeIndex++) {
1070 // IsWrite and TypeSize are encoded in the function name.
1071 std::string FunctionName = std::string(kAsanReportErrorTemplate) +
1072 (AccessIsWrite ? "store" : "load") + itostr(1 << AccessSizeIndex);
Kostya Serebryany986b8da2012-07-17 11:04:12 +00001073 // If we are merging crash callbacks, they have two parameters.
Kostya Serebryany157a5152012-11-07 12:42:18 +00001074 AsanErrorCallback[AccessIsWrite][AccessSizeIndex] =
1075 checkInterfaceFunction(M.getOrInsertFunction(
1076 FunctionName, IRB.getVoidTy(), IntptrTy, NULL));
Kostya Serebryany4273bb02012-07-16 14:09:42 +00001077 }
1078 }
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +00001079 AsanErrorCallbackSized[0] = checkInterfaceFunction(M.getOrInsertFunction(
1080 kAsanReportLoadN, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
1081 AsanErrorCallbackSized[1] = checkInterfaceFunction(M.getOrInsertFunction(
1082 kAsanReportStoreN, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001083
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001084 AsanHandleNoReturnFunc = checkInterfaceFunction(M.getOrInsertFunction(
1085 kAsanHandleNoReturnName, IRB.getVoidTy(), NULL));
Bob Wilsonda4147c2013-11-15 07:16:09 +00001086 AsanCovFunction = checkInterfaceFunction(M.getOrInsertFunction(
1087 kAsanCovName, IRB.getVoidTy(), IntptrTy, NULL));
Kostya Serebryanyf02c6062012-07-20 09:54:50 +00001088 // We insert an empty inline asm after __asan_report* to avoid callback merge.
1089 EmptyAsm = InlineAsm::get(FunctionType::get(IRB.getVoidTy(), false),
1090 StringRef(""), StringRef(""),
1091 /*hasSideEffects=*/true);
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001092}
1093
Alexey Samsonov1345d352013-01-16 13:23:28 +00001094void AddressSanitizer::emitShadowMapping(Module &M, IRBuilder<> &IRB) const {
Alexey Samsonov347bcd32013-01-17 11:12:32 +00001095 // Tell the values of mapping offset and scale to the run-time.
1096 GlobalValue *asan_mapping_offset =
1097 new GlobalVariable(M, IntptrTy, true, GlobalValue::LinkOnceODRLinkage,
1098 ConstantInt::get(IntptrTy, Mapping.Offset),
1099 kAsanMappingOffsetName);
1100 // Read the global, otherwise it may be optimized away.
1101 IRB.CreateLoad(asan_mapping_offset, true);
Alexey Samsonov1345d352013-01-16 13:23:28 +00001102
Alexey Samsonov347bcd32013-01-17 11:12:32 +00001103 GlobalValue *asan_mapping_scale =
1104 new GlobalVariable(M, IntptrTy, true, GlobalValue::LinkOnceODRLinkage,
1105 ConstantInt::get(IntptrTy, Mapping.Scale),
1106 kAsanMappingScaleName);
1107 // Read the global, otherwise it may be optimized away.
1108 IRB.CreateLoad(asan_mapping_scale, true);
Alexey Samsonov1345d352013-01-16 13:23:28 +00001109}
1110
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001111// virtual
1112bool AddressSanitizer::doInitialization(Module &M) {
1113 // Initialize the private fields. No one has accessed them before.
1114 TD = getAnalysisIfAvailable<DataLayout>();
1115
1116 if (!TD)
1117 return false;
Alexey Samsonove4b5fb82013-08-12 11:46:09 +00001118 BL.reset(SpecialCaseList::createOrDie(BlacklistFile));
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001119 DynamicallyInitializedGlobals.Init(M);
1120
1121 C = &(M.getContext());
1122 LongSize = TD->getPointerSizeInBits();
1123 IntptrTy = Type::getIntNTy(*C, LongSize);
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001124
1125 AsanCtorFunction = Function::Create(
1126 FunctionType::get(Type::getVoidTy(*C), false),
1127 GlobalValue::InternalLinkage, kAsanModuleCtorName, &M);
1128 BasicBlock *AsanCtorBB = BasicBlock::Create(*C, "", AsanCtorFunction);
1129 // call __asan_init in the module ctor.
1130 IRBuilder<> IRB(ReturnInst::Create(*C, AsanCtorBB));
1131 AsanInitFunction = checkInterfaceFunction(
1132 M.getOrInsertFunction(kAsanInitName, IRB.getVoidTy(), NULL));
1133 AsanInitFunction->setLinkage(Function::ExternalLinkage);
1134 IRB.CreateCall(AsanInitFunction);
Kostya Serebryany4273bb02012-07-16 14:09:42 +00001135
Alexey Samsonov347bcd32013-01-17 11:12:32 +00001136 Mapping = getShadowMapping(M, LongSize, ZeroBaseShadow);
Alexey Samsonov1345d352013-01-16 13:23:28 +00001137 emitShadowMapping(M, IRB);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001138
Kostya Serebryanycd1aba82011-12-15 21:59:03 +00001139 appendToGlobalCtors(M, AsanCtorFunction, kAsanCtorAndCtorPriority);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001140 return true;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001141}
1142
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +00001143bool AddressSanitizer::maybeInsertAsanInitAtFunctionEntry(Function &F) {
1144 // For each NSObject descendant having a +load method, this method is invoked
1145 // by the ObjC runtime before any of the static constructors is called.
1146 // Therefore we need to instrument such methods with a call to __asan_init
1147 // at the beginning in order to initialize our runtime before any access to
1148 // the shadow memory.
1149 // We cannot just ignore these methods, because they may call other
1150 // instrumented functions.
1151 if (F.getName().find(" load]") != std::string::npos) {
1152 IRBuilder<> IRB(F.begin()->begin());
1153 IRB.CreateCall(AsanInitFunction);
1154 return true;
1155 }
1156 return false;
1157}
1158
Bob Wilsonda4147c2013-11-15 07:16:09 +00001159// Poor man's coverage that works with ASan.
1160// We create a Guard boolean variable with the same linkage
1161// as the function and inject this code into the entry block:
1162// if (*Guard) {
1163// __sanitizer_cov(&F);
1164// *Guard = 1;
1165// }
1166// The accesses to Guard are atomic. The rest of the logic is
1167// in __sanitizer_cov (it's fine to call it more than once).
1168//
1169// This coverage implementation provides very limited data:
1170// it only tells if a given function was ever executed.
1171// No counters, no per-basic-block or per-edge data.
1172// But for many use cases this is what we need and the added slowdown
1173// is negligible. This simple implementation will probably be obsoleted
1174// by the upcoming Clang-based coverage implementation.
1175// By having it here and now we hope to
1176// a) get the functionality to users earlier and
1177// b) collect usage statistics to help improve Clang coverage design.
1178bool AddressSanitizer::InjectCoverage(Function &F) {
1179 if (!ClCoverage) return false;
Reid Kleckner30b2a9a2013-12-10 21:49:28 +00001180
1181 // Skip static allocas at the top of the entry block so they don't become
1182 // dynamic when we split the block. If we used our optimized stack layout,
1183 // then there will only be one alloca and it will come first.
1184 BasicBlock &Entry = F.getEntryBlock();
1185 BasicBlock::iterator IP = Entry.getFirstInsertionPt(), BE = Entry.end();
1186 for (; IP != BE; ++IP) {
1187 AllocaInst *AI = dyn_cast<AllocaInst>(IP);
1188 if (!AI || !AI->isStaticAlloca())
1189 break;
1190 }
1191
1192 IRBuilder<> IRB(IP);
Bob Wilsonda4147c2013-11-15 07:16:09 +00001193 Type *Int8Ty = IRB.getInt8Ty();
1194 GlobalVariable *Guard = new GlobalVariable(
Kostya Serebryany0604c622013-11-15 09:52:05 +00001195 *F.getParent(), Int8Ty, false, GlobalValue::PrivateLinkage,
Bob Wilsonda4147c2013-11-15 07:16:09 +00001196 Constant::getNullValue(Int8Ty), "__asan_gen_cov_" + F.getName());
1197 LoadInst *Load = IRB.CreateLoad(Guard);
1198 Load->setAtomic(Monotonic);
1199 Load->setAlignment(1);
1200 Value *Cmp = IRB.CreateICmpEQ(Constant::getNullValue(Int8Ty), Load);
Evgeniy Stepanova9164e92013-12-19 13:29:56 +00001201 Instruction *Ins = SplitBlockAndInsertIfThen(Cmp, IP, false);
Bob Wilsonda4147c2013-11-15 07:16:09 +00001202 IRB.SetInsertPoint(Ins);
1203 // We pass &F to __sanitizer_cov. We could avoid this and rely on
1204 // GET_CALLER_PC, but having the PC of the first instruction is just nice.
1205 IRB.CreateCall(AsanCovFunction, IRB.CreatePointerCast(&F, IntptrTy));
1206 StoreInst *Store = IRB.CreateStore(ConstantInt::get(Int8Ty, 1), Guard);
1207 Store->setAtomic(Monotonic);
1208 Store->setAlignment(1);
1209 return true;
1210}
1211
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001212bool AddressSanitizer::runOnFunction(Function &F) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001213 if (BL->isIn(F)) return false;
1214 if (&F == AsanCtorFunction) return false;
Kostya Serebryany6b5b58d2013-03-18 07:33:49 +00001215 if (F.getLinkage() == GlobalValue::AvailableExternallyLinkage) return false;
Kostya Serebryany20343352012-10-17 13:40:06 +00001216 DEBUG(dbgs() << "ASAN instrumenting:\n" << F << "\n");
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001217 initializeCallbacks(*F.getParent());
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +00001218
Kostya Serebryanycf880b92013-02-26 06:58:09 +00001219 // If needed, insert __asan_init before checking for SanitizeAddress attr.
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +00001220 maybeInsertAsanInitAtFunctionEntry(F);
1221
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001222 if (!F.hasFnAttribute(Attribute::SanitizeAddress))
Bill Wendlingc9b22d72012-10-09 07:45:08 +00001223 return false;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001224
1225 if (!ClDebugFunc.empty() && ClDebugFunc != F.getName())
1226 return false;
Bill Wendlingc9b22d72012-10-09 07:45:08 +00001227
1228 // We want to instrument every address only once per basic block (unless there
1229 // are calls between uses).
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001230 SmallSet<Value*, 16> TempsToInstrument;
1231 SmallVector<Instruction*, 16> ToInstrument;
Kostya Serebryany154a54d2012-02-08 21:36:17 +00001232 SmallVector<Instruction*, 8> NoReturnCalls;
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001233 int NumAllocas = 0;
Kostya Serebryany90241602012-05-30 09:04:06 +00001234 bool IsWrite;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001235
1236 // Fill the set of memory operations to instrument.
1237 for (Function::iterator FI = F.begin(), FE = F.end();
1238 FI != FE; ++FI) {
1239 TempsToInstrument.clear();
Kostya Serebryanyc387ca72012-06-28 09:34:41 +00001240 int NumInsnsPerBB = 0;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001241 for (BasicBlock::iterator BI = FI->begin(), BE = FI->end();
1242 BI != BE; ++BI) {
Kostya Serebryany687d0782012-01-11 18:15:23 +00001243 if (LooksLikeCodeInBug11395(BI)) return false;
Kostya Serebryany90241602012-05-30 09:04:06 +00001244 if (Value *Addr = isInterestingMemoryAccess(BI, &IsWrite)) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001245 if (ClOpt && ClOptSameTemp) {
1246 if (!TempsToInstrument.insert(Addr))
1247 continue; // We've seen this temp in the current BB.
1248 }
1249 } else if (isa<MemIntrinsic>(BI) && ClMemIntrin) {
1250 // ok, take it.
1251 } else {
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001252 if (isa<AllocaInst>(BI))
1253 NumAllocas++;
Kostya Serebryany699ac282013-02-20 12:35:15 +00001254 CallSite CS(BI);
1255 if (CS) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001256 // A call inside BB.
1257 TempsToInstrument.clear();
Kostya Serebryany699ac282013-02-20 12:35:15 +00001258 if (CS.doesNotReturn())
1259 NoReturnCalls.push_back(CS.getInstruction());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001260 }
1261 continue;
1262 }
1263 ToInstrument.push_back(BI);
Kostya Serebryanyc387ca72012-06-28 09:34:41 +00001264 NumInsnsPerBB++;
1265 if (NumInsnsPerBB >= ClMaxInsnsToInstrumentPerBB)
1266 break;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001267 }
1268 }
1269
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001270 Function *UninstrumentedDuplicate = 0;
1271 bool LikelyToInstrument =
1272 !NoReturnCalls.empty() || !ToInstrument.empty() || (NumAllocas > 0);
1273 if (ClKeepUninstrumented && LikelyToInstrument) {
1274 ValueToValueMapTy VMap;
1275 UninstrumentedDuplicate = CloneFunction(&F, VMap, false);
1276 UninstrumentedDuplicate->removeFnAttr(Attribute::SanitizeAddress);
1277 UninstrumentedDuplicate->setName("NOASAN_" + F.getName());
1278 F.getParent()->getFunctionList().push_back(UninstrumentedDuplicate);
1279 }
1280
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001281 // Instrument.
1282 int NumInstrumented = 0;
1283 for (size_t i = 0, n = ToInstrument.size(); i != n; i++) {
1284 Instruction *Inst = ToInstrument[i];
1285 if (ClDebugMin < 0 || ClDebugMax < 0 ||
1286 (NumInstrumented >= ClDebugMin && NumInstrumented <= ClDebugMax)) {
Kostya Serebryany90241602012-05-30 09:04:06 +00001287 if (isInterestingMemoryAccess(Inst, &IsWrite))
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001288 instrumentMop(Inst);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001289 else
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001290 instrumentMemIntrinsic(cast<MemIntrinsic>(Inst));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001291 }
1292 NumInstrumented++;
1293 }
1294
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001295 FunctionStackPoisoner FSP(F, *this);
1296 bool ChangedStack = FSP.runOnFunction();
Kostya Serebryany154a54d2012-02-08 21:36:17 +00001297
1298 // We must unpoison the stack before every NoReturn call (throw, _exit, etc).
1299 // See e.g. http://code.google.com/p/address-sanitizer/issues/detail?id=37
1300 for (size_t i = 0, n = NoReturnCalls.size(); i != n; i++) {
1301 Instruction *CI = NoReturnCalls[i];
1302 IRBuilder<> IRB(CI);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001303 IRB.CreateCall(AsanHandleNoReturnFunc);
Kostya Serebryany154a54d2012-02-08 21:36:17 +00001304 }
1305
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001306 bool res = NumInstrumented > 0 || ChangedStack || !NoReturnCalls.empty();
Bob Wilsonda4147c2013-11-15 07:16:09 +00001307
1308 if (InjectCoverage(F))
1309 res = true;
1310
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001311 DEBUG(dbgs() << "ASAN done instrumenting: " << res << " " << F << "\n");
1312
1313 if (ClKeepUninstrumented) {
1314 if (!res) {
1315 // No instrumentation is done, no need for the duplicate.
1316 if (UninstrumentedDuplicate)
1317 UninstrumentedDuplicate->eraseFromParent();
1318 } else {
1319 // The function was instrumented. We must have the duplicate.
1320 assert(UninstrumentedDuplicate);
1321 UninstrumentedDuplicate->setSection("NOASAN");
1322 assert(!F.hasSection());
1323 F.setSection("ASAN");
1324 }
1325 }
1326
1327 return res;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001328}
1329
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001330// Workaround for bug 11395: we don't want to instrument stack in functions
1331// with large assembly blobs (32-bit only), otherwise reg alloc may crash.
1332// FIXME: remove once the bug 11395 is fixed.
1333bool AddressSanitizer::LooksLikeCodeInBug11395(Instruction *I) {
1334 if (LongSize != 32) return false;
1335 CallInst *CI = dyn_cast<CallInst>(I);
1336 if (!CI || !CI->isInlineAsm()) return false;
1337 if (CI->getNumArgOperands() <= 5) return false;
1338 // We have inline assembly with quite a few arguments.
1339 return true;
1340}
1341
1342void FunctionStackPoisoner::initializeCallbacks(Module &M) {
1343 IRBuilder<> IRB(*C);
Kostya Serebryany6805de52013-09-10 13:16:56 +00001344 for (int i = 0; i <= kMaxAsanStackMallocSizeClass; i++) {
1345 std::string Suffix = itostr(i);
1346 AsanStackMallocFunc[i] = checkInterfaceFunction(
1347 M.getOrInsertFunction(kAsanStackMallocNameTemplate + Suffix, IntptrTy,
1348 IntptrTy, IntptrTy, NULL));
1349 AsanStackFreeFunc[i] = checkInterfaceFunction(M.getOrInsertFunction(
1350 kAsanStackFreeNameTemplate + Suffix, IRB.getVoidTy(), IntptrTy,
1351 IntptrTy, IntptrTy, NULL));
1352 }
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001353 AsanPoisonStackMemoryFunc = checkInterfaceFunction(M.getOrInsertFunction(
1354 kAsanPoisonStackMemoryName, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
1355 AsanUnpoisonStackMemoryFunc = checkInterfaceFunction(M.getOrInsertFunction(
1356 kAsanUnpoisonStackMemoryName, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
1357}
1358
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001359void
1360FunctionStackPoisoner::poisonRedZones(const ArrayRef<uint8_t> ShadowBytes,
1361 IRBuilder<> &IRB, Value *ShadowBase,
1362 bool DoPoison) {
1363 size_t n = ShadowBytes.size();
Kostya Serebryanyff7bde12013-12-23 09:24:36 +00001364 size_t i = 0;
1365 // We need to (un)poison n bytes of stack shadow. Poison as many as we can
1366 // using 64-bit stores (if we are on 64-bit arch), then poison the rest
1367 // with 32-bit stores, then with 16-byte stores, then with 8-byte stores.
1368 for (size_t LargeStoreSizeInBytes = ASan.LongSize / 8;
1369 LargeStoreSizeInBytes != 0; LargeStoreSizeInBytes /= 2) {
1370 for (; i + LargeStoreSizeInBytes - 1 < n; i += LargeStoreSizeInBytes) {
1371 uint64_t Val = 0;
1372 for (size_t j = 0; j < LargeStoreSizeInBytes; j++) {
1373 if (ASan.TD->isLittleEndian())
1374 Val |= (uint64_t)ShadowBytes[i + j] << (8 * j);
1375 else
1376 Val = (Val << 8) | ShadowBytes[i + j];
1377 }
1378 if (!Val) continue;
1379 Value *Ptr = IRB.CreateAdd(ShadowBase, ConstantInt::get(IntptrTy, i));
1380 Type *StoreTy = Type::getIntNTy(*C, LargeStoreSizeInBytes * 8);
1381 Value *Poison = ConstantInt::get(StoreTy, DoPoison ? Val : 0);
1382 IRB.CreateStore(Poison, IRB.CreateIntToPtr(Ptr, StoreTy->getPointerTo()));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001383 }
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001384 }
1385}
1386
Kostya Serebryany6805de52013-09-10 13:16:56 +00001387// Fake stack allocator (asan_fake_stack.h) has 11 size classes
1388// for every power of 2 from kMinStackMallocSize to kMaxAsanStackMallocSizeClass
1389static int StackMallocSizeClass(uint64_t LocalStackSize) {
1390 assert(LocalStackSize <= kMaxStackMallocSize);
1391 uint64_t MaxSize = kMinStackMallocSize;
1392 for (int i = 0; ; i++, MaxSize *= 2)
1393 if (LocalStackSize <= MaxSize)
1394 return i;
1395 llvm_unreachable("impossible LocalStackSize");
1396}
1397
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001398// Set Size bytes starting from ShadowBase to kAsanStackAfterReturnMagic.
1399// We can not use MemSet intrinsic because it may end up calling the actual
1400// memset. Size is a multiple of 8.
1401// Currently this generates 8-byte stores on x86_64; it may be better to
1402// generate wider stores.
1403void FunctionStackPoisoner::SetShadowToStackAfterReturnInlined(
1404 IRBuilder<> &IRB, Value *ShadowBase, int Size) {
1405 assert(!(Size % 8));
1406 assert(kAsanStackAfterReturnMagic == 0xf5);
1407 for (int i = 0; i < Size; i += 8) {
1408 Value *p = IRB.CreateAdd(ShadowBase, ConstantInt::get(IntptrTy, i));
1409 IRB.CreateStore(ConstantInt::get(IRB.getInt64Ty(), 0xf5f5f5f5f5f5f5f5ULL),
1410 IRB.CreateIntToPtr(p, IRB.getInt64Ty()->getPointerTo()));
1411 }
1412}
1413
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001414void FunctionStackPoisoner::poisonStack() {
Kostya Serebryany6805de52013-09-10 13:16:56 +00001415 int StackMallocIdx = -1;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001416
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001417 assert(AllocaVec.size() > 0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001418 Instruction *InsBefore = AllocaVec[0];
1419 IRBuilder<> IRB(InsBefore);
1420
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001421 SmallVector<ASanStackVariableDescription, 16> SVD;
1422 SVD.reserve(AllocaVec.size());
1423 for (size_t i = 0, n = AllocaVec.size(); i < n; i++) {
1424 AllocaInst *AI = AllocaVec[i];
1425 ASanStackVariableDescription D = { AI->getName().data(),
1426 getAllocaSizeInBytes(AI),
1427 AI->getAlignment(), AI, 0};
1428 SVD.push_back(D);
1429 }
1430 // Minimal header size (left redzone) is 4 pointers,
1431 // i.e. 32 bytes on 64-bit platforms and 16 bytes in 32-bit platforms.
1432 size_t MinHeaderSize = ASan.LongSize / 2;
1433 ASanStackFrameLayout L;
1434 ComputeASanStackFrameLayout(SVD, 1UL << Mapping.Scale, MinHeaderSize, &L);
1435 DEBUG(dbgs() << L.DescriptionString << " --- " << L.FrameSize << "\n");
1436 uint64_t LocalStackSize = L.FrameSize;
1437 bool DoStackMalloc =
1438 ASan.CheckUseAfterReturn && LocalStackSize <= kMaxStackMallocSize;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001439
1440 Type *ByteArrayTy = ArrayType::get(IRB.getInt8Ty(), LocalStackSize);
1441 AllocaInst *MyAlloca =
1442 new AllocaInst(ByteArrayTy, "MyAlloca", InsBefore);
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001443 assert((ClRealignStack & (ClRealignStack - 1)) == 0);
1444 size_t FrameAlignment = std::max(L.FrameAlignment, (size_t)ClRealignStack);
1445 MyAlloca->setAlignment(FrameAlignment);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001446 assert(MyAlloca->isStaticAlloca());
1447 Value *OrigStackBase = IRB.CreatePointerCast(MyAlloca, IntptrTy);
1448 Value *LocalStackBase = OrigStackBase;
1449
1450 if (DoStackMalloc) {
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001451 // LocalStackBase = OrigStackBase
1452 // if (__asan_option_detect_stack_use_after_return)
1453 // LocalStackBase = __asan_stack_malloc_N(LocalStackBase, OrigStackBase);
Kostya Serebryany6805de52013-09-10 13:16:56 +00001454 StackMallocIdx = StackMallocSizeClass(LocalStackSize);
1455 assert(StackMallocIdx <= kMaxAsanStackMallocSizeClass);
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001456 Constant *OptionDetectUAR = F.getParent()->getOrInsertGlobal(
1457 kAsanOptionDetectUAR, IRB.getInt32Ty());
1458 Value *Cmp = IRB.CreateICmpNE(IRB.CreateLoad(OptionDetectUAR),
1459 Constant::getNullValue(IRB.getInt32Ty()));
Evgeniy Stepanova9164e92013-12-19 13:29:56 +00001460 Instruction *Term = SplitBlockAndInsertIfThen(Cmp, InsBefore, false);
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001461 BasicBlock *CmpBlock = cast<Instruction>(Cmp)->getParent();
1462 IRBuilder<> IRBIf(Term);
1463 LocalStackBase = IRBIf.CreateCall2(
1464 AsanStackMallocFunc[StackMallocIdx],
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001465 ConstantInt::get(IntptrTy, LocalStackSize), OrigStackBase);
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001466 BasicBlock *SetBlock = cast<Instruction>(LocalStackBase)->getParent();
1467 IRB.SetInsertPoint(InsBefore);
1468 PHINode *Phi = IRB.CreatePHI(IntptrTy, 2);
1469 Phi->addIncoming(OrigStackBase, CmpBlock);
1470 Phi->addIncoming(LocalStackBase, SetBlock);
1471 LocalStackBase = Phi;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001472 }
1473
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001474 // Insert poison calls for lifetime intrinsics for alloca.
1475 bool HavePoisonedAllocas = false;
1476 for (size_t i = 0, n = AllocaPoisonCallVec.size(); i < n; i++) {
1477 const AllocaPoisonCall &APC = AllocaPoisonCallVec[i];
Alexey Samsonova788b942013-11-18 14:53:55 +00001478 assert(APC.InsBefore);
1479 assert(APC.AI);
1480 IRBuilder<> IRB(APC.InsBefore);
1481 poisonAlloca(APC.AI, APC.Size, IRB, APC.DoPoison);
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001482 HavePoisonedAllocas |= APC.DoPoison;
1483 }
1484
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001485 // Replace Alloca instructions with base+offset.
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001486 for (size_t i = 0, n = SVD.size(); i < n; i++) {
1487 AllocaInst *AI = SVD[i].AI;
Alexey Samsonov261177a2012-12-04 01:34:23 +00001488 Value *NewAllocaPtr = IRB.CreateIntToPtr(
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001489 IRB.CreateAdd(LocalStackBase,
1490 ConstantInt::get(IntptrTy, SVD[i].Offset)),
1491 AI->getType());
Alexey Samsonov3d43b632012-12-12 14:31:53 +00001492 replaceDbgDeclareForAlloca(AI, NewAllocaPtr, DIB);
Alexey Samsonov261177a2012-12-04 01:34:23 +00001493 AI->replaceAllUsesWith(NewAllocaPtr);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001494 }
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001495
Kostya Serebryanycdd35a92013-03-22 10:37:20 +00001496 // The left-most redzone has enough space for at least 4 pointers.
1497 // Write the Magic value to redzone[0].
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001498 Value *BasePlus0 = IRB.CreateIntToPtr(LocalStackBase, IntptrPtrTy);
1499 IRB.CreateStore(ConstantInt::get(IntptrTy, kCurrentStackFrameMagic),
1500 BasePlus0);
Kostya Serebryanycdd35a92013-03-22 10:37:20 +00001501 // Write the frame description constant to redzone[1].
1502 Value *BasePlus1 = IRB.CreateIntToPtr(
1503 IRB.CreateAdd(LocalStackBase, ConstantInt::get(IntptrTy, ASan.LongSize/8)),
1504 IntptrPtrTy);
Alexey Samsonov9bdb63a2012-11-02 12:20:34 +00001505 GlobalVariable *StackDescriptionGlobal =
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +00001506 createPrivateGlobalForString(*F.getParent(), L.DescriptionString,
1507 /*AllowMerging*/true);
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001508 Value *Description = IRB.CreatePointerCast(StackDescriptionGlobal,
1509 IntptrTy);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001510 IRB.CreateStore(Description, BasePlus1);
Kostya Serebryanycdd35a92013-03-22 10:37:20 +00001511 // Write the PC to redzone[2].
1512 Value *BasePlus2 = IRB.CreateIntToPtr(
1513 IRB.CreateAdd(LocalStackBase, ConstantInt::get(IntptrTy,
1514 2 * ASan.LongSize/8)),
1515 IntptrPtrTy);
1516 IRB.CreateStore(IRB.CreatePointerCast(&F, IntptrTy), BasePlus2);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001517
1518 // Poison the stack redzones at the entry.
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001519 Value *ShadowBase = ASan.memToShadow(LocalStackBase, IRB);
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001520 poisonRedZones(L.ShadowBytes, IRB, ShadowBase, true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001521
Kostya Serebryany530e2072013-12-23 14:15:08 +00001522 // (Un)poison the stack before all ret instructions.
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001523 for (size_t i = 0, n = RetVec.size(); i < n; i++) {
1524 Instruction *Ret = RetVec[i];
1525 IRBuilder<> IRBRet(Ret);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001526 // Mark the current frame as retired.
1527 IRBRet.CreateStore(ConstantInt::get(IntptrTy, kRetiredStackFrameMagic),
1528 BasePlus0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001529 if (DoStackMalloc) {
Kostya Serebryany6805de52013-09-10 13:16:56 +00001530 assert(StackMallocIdx >= 0);
Kostya Serebryany530e2072013-12-23 14:15:08 +00001531 // if LocalStackBase != OrigStackBase:
1532 // // In use-after-return mode, poison the whole stack frame.
1533 // if StackMallocIdx <= 4
1534 // // For small sizes inline the whole thing:
1535 // memset(ShadowBase, kAsanStackAfterReturnMagic, ShadowSize);
1536 // **SavedFlagPtr(LocalStackBase) = 0
1537 // else
1538 // __asan_stack_free_N(LocalStackBase, OrigStackBase)
1539 // else
1540 // <This is not a fake stack; unpoison the redzones>
1541 Value *Cmp = IRBRet.CreateICmpNE(LocalStackBase, OrigStackBase);
1542 TerminatorInst *ThenTerm, *ElseTerm;
1543 SplitBlockAndInsertIfThenElse(Cmp, Ret, &ThenTerm, &ElseTerm);
1544
1545 IRBuilder<> IRBPoison(ThenTerm);
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001546 if (StackMallocIdx <= 4) {
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001547 int ClassSize = kMinStackMallocSize << StackMallocIdx;
1548 SetShadowToStackAfterReturnInlined(IRBPoison, ShadowBase,
1549 ClassSize >> Mapping.Scale);
1550 Value *SavedFlagPtrPtr = IRBPoison.CreateAdd(
1551 LocalStackBase,
1552 ConstantInt::get(IntptrTy, ClassSize - ASan.LongSize / 8));
1553 Value *SavedFlagPtr = IRBPoison.CreateLoad(
1554 IRBPoison.CreateIntToPtr(SavedFlagPtrPtr, IntptrPtrTy));
1555 IRBPoison.CreateStore(
1556 Constant::getNullValue(IRBPoison.getInt8Ty()),
1557 IRBPoison.CreateIntToPtr(SavedFlagPtr, IRBPoison.getInt8PtrTy()));
1558 } else {
1559 // For larger frames call __asan_stack_free_*.
Kostya Serebryany530e2072013-12-23 14:15:08 +00001560 IRBPoison.CreateCall3(AsanStackFreeFunc[StackMallocIdx], LocalStackBase,
1561 ConstantInt::get(IntptrTy, LocalStackSize),
1562 OrigStackBase);
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001563 }
Kostya Serebryany530e2072013-12-23 14:15:08 +00001564
1565 IRBuilder<> IRBElse(ElseTerm);
1566 poisonRedZones(L.ShadowBytes, IRBElse, ShadowBase, false);
Alexey Samsonov261177a2012-12-04 01:34:23 +00001567 } else if (HavePoisonedAllocas) {
1568 // If we poisoned some allocas in llvm.lifetime analysis,
1569 // unpoison whole stack frame now.
1570 assert(LocalStackBase == OrigStackBase);
1571 poisonAlloca(LocalStackBase, LocalStackSize, IRBRet, false);
Kostya Serebryany530e2072013-12-23 14:15:08 +00001572 } else {
1573 poisonRedZones(L.ShadowBytes, IRBRet, ShadowBase, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001574 }
1575 }
1576
Kostya Serebryany09959942012-10-19 06:20:53 +00001577 // We are done. Remove the old unused alloca instructions.
1578 for (size_t i = 0, n = AllocaVec.size(); i < n; i++)
1579 AllocaVec[i]->eraseFromParent();
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001580}
Alexey Samsonov261177a2012-12-04 01:34:23 +00001581
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001582void FunctionStackPoisoner::poisonAlloca(Value *V, uint64_t Size,
Jakub Staszak23ec6a92013-08-09 20:53:48 +00001583 IRBuilder<> &IRB, bool DoPoison) {
Alexey Samsonov261177a2012-12-04 01:34:23 +00001584 // For now just insert the call to ASan runtime.
1585 Value *AddrArg = IRB.CreatePointerCast(V, IntptrTy);
1586 Value *SizeArg = ConstantInt::get(IntptrTy, Size);
1587 IRB.CreateCall2(DoPoison ? AsanPoisonStackMemoryFunc
1588 : AsanUnpoisonStackMemoryFunc,
1589 AddrArg, SizeArg);
1590}
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001591
1592// Handling llvm.lifetime intrinsics for a given %alloca:
1593// (1) collect all llvm.lifetime.xxx(%size, %value) describing the alloca.
1594// (2) if %size is constant, poison memory for llvm.lifetime.end (to detect
1595// invalid accesses) and unpoison it for llvm.lifetime.start (the memory
1596// could be poisoned by previous llvm.lifetime.end instruction, as the
1597// variable may go in and out of scope several times, e.g. in loops).
1598// (3) if we poisoned at least one %alloca in a function,
1599// unpoison the whole stack frame at function exit.
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001600
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001601AllocaInst *FunctionStackPoisoner::findAllocaForValue(Value *V) {
1602 if (AllocaInst *AI = dyn_cast<AllocaInst>(V))
1603 // We're intested only in allocas we can handle.
1604 return isInterestingAlloca(*AI) ? AI : 0;
1605 // See if we've already calculated (or started to calculate) alloca for a
1606 // given value.
1607 AllocaForValueMapTy::iterator I = AllocaForValue.find(V);
1608 if (I != AllocaForValue.end())
1609 return I->second;
1610 // Store 0 while we're calculating alloca for value V to avoid
1611 // infinite recursion if the value references itself.
1612 AllocaForValue[V] = 0;
1613 AllocaInst *Res = 0;
1614 if (CastInst *CI = dyn_cast<CastInst>(V))
1615 Res = findAllocaForValue(CI->getOperand(0));
1616 else if (PHINode *PN = dyn_cast<PHINode>(V)) {
1617 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
1618 Value *IncValue = PN->getIncomingValue(i);
1619 // Allow self-referencing phi-nodes.
1620 if (IncValue == PN) continue;
1621 AllocaInst *IncValueAI = findAllocaForValue(IncValue);
1622 // AI for incoming values should exist and should all be equal.
1623 if (IncValueAI == 0 || (Res != 0 && IncValueAI != Res))
1624 return 0;
1625 Res = IncValueAI;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001626 }
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001627 }
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001628 if (Res != 0)
1629 AllocaForValue[V] = Res;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001630 return Res;
1631}