blob: c03075c9ea06baf4101a53e9c0b53f25d767df28 [file] [log] [blame]
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001//===-- AddressSanitizer.cpp - memory error detector ------------*- C++ -*-===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file is a part of AddressSanitizer, an address sanity checker.
11// Details of the algorithm:
12// http://code.google.com/p/address-sanitizer/wiki/AddressSanitizerAlgorithm
13//
14//===----------------------------------------------------------------------===//
15
16#define DEBUG_TYPE "asan"
17
Chandler Carruthed0881b2012-12-03 16:50:05 +000018#include "llvm/Transforms/Instrumentation.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000019#include "llvm/ADT/ArrayRef.h"
Alexey Samsonov29dd7f22012-12-27 08:50:58 +000020#include "llvm/ADT/DenseMap.h"
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +000021#include "llvm/ADT/DepthFirstIterator.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000022#include "llvm/ADT/OwningPtr.h"
23#include "llvm/ADT/SmallSet.h"
24#include "llvm/ADT/SmallString.h"
25#include "llvm/ADT/SmallVector.h"
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +000026#include "llvm/ADT/Statistic.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000027#include "llvm/ADT/StringExtras.h"
Evgeniy Stepanov617232f2012-05-23 11:52:12 +000028#include "llvm/ADT/Triple.h"
Alexey Samsonov3d43b632012-12-12 14:31:53 +000029#include "llvm/DIBuilder.h"
Chandler Carruth9fb823b2013-01-02 11:36:10 +000030#include "llvm/IR/DataLayout.h"
31#include "llvm/IR/Function.h"
32#include "llvm/IR/IRBuilder.h"
33#include "llvm/IR/InlineAsm.h"
34#include "llvm/IR/IntrinsicInst.h"
35#include "llvm/IR/LLVMContext.h"
36#include "llvm/IR/Module.h"
37#include "llvm/IR/Type.h"
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +000038#include "llvm/InstVisitor.h"
Kostya Serebryany699ac282013-02-20 12:35:15 +000039#include "llvm/Support/CallSite.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000040#include "llvm/Support/CommandLine.h"
41#include "llvm/Support/DataTypes.h"
42#include "llvm/Support/Debug.h"
Kostya Serebryany9e62b302013-06-03 14:46:56 +000043#include "llvm/Support/Endian.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000044#include "llvm/Support/system_error.h"
Kostya Serebryany4fb78012013-12-06 09:00:17 +000045#include "llvm/Transforms/Utils/ASanStackFrameLayout.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000046#include "llvm/Transforms/Utils/BasicBlockUtils.h"
Kostya Serebryany9f5213f2013-06-26 09:18:17 +000047#include "llvm/Transforms/Utils/Cloning.h"
Alexey Samsonov3d43b632012-12-12 14:31:53 +000048#include "llvm/Transforms/Utils/Local.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000049#include "llvm/Transforms/Utils/ModuleUtils.h"
Peter Collingbourne015370e2013-07-09 22:02:49 +000050#include "llvm/Transforms/Utils/SpecialCaseList.h"
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000051#include <algorithm>
Chandler Carruthed0881b2012-12-03 16:50:05 +000052#include <string>
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +000053
54using namespace llvm;
55
// Default parameters of the shadow mapping
//   Shadow = (Mem >> Scale) + Offset.
static const uint64_t kDefaultShadowScale = 3;
static const uint64_t kDefaultShadowOffset32 = 1ULL << 29;
static const uint64_t kDefaultShadowOffset64 = 1ULL << 44;
// Short 64-bit offset; small enough to fit below 2G.
static const uint64_t kDefaultShort64bitShadowOffset = 0x7FFF8000;
// Target-specific shadow offsets.
static const uint64_t kPPC64_ShadowOffset64 = 1ULL << 41;
static const uint64_t kMIPS32_ShadowOffset32 = 0x0aaa8000;

// Stack-malloc size bounds and stack frame magic values.
static const size_t kMinStackMallocSize = 1 << 6;   // 64B
static const size_t kMaxStackMallocSize = 1 << 16;  // 64K
static const uintptr_t kCurrentStackFrameMagic = 0x41B58AB3;
static const uintptr_t kRetiredStackFrameMagic = 0x45E0360E;
67
// Names of the module constructor/destructor emitted by the pass, and the
// priority they are registered with.
static const char *const kAsanModuleCtorName = "asan.module_ctor";
static const char *const kAsanModuleDtorName = "asan.module_dtor";
static const int kAsanCtorAndCtorPriority = 1;

// Names (or name prefixes) of the run-time library entry points.
static const char *const kAsanReportErrorTemplate = "__asan_report_";
static const char *const kAsanReportLoadN = "__asan_report_load_n";
static const char *const kAsanReportStoreN = "__asan_report_store_n";
static const char *const kAsanRegisterGlobalsName = "__asan_register_globals";
static const char *const kAsanUnregisterGlobalsName =
    "__asan_unregister_globals";
static const char *const kAsanPoisonGlobalsName = "__asan_before_dynamic_init";
static const char *const kAsanUnpoisonGlobalsName = "__asan_after_dynamic_init";
static const char *const kAsanInitName = "__asan_init_v3";
static const char *const kAsanCovName = "__sanitizer_cov";
static const char *const kAsanHandleNoReturnName = "__asan_handle_no_return";
static const char *const kAsanMappingOffsetName = "__asan_mapping_offset";
static const char *const kAsanMappingScaleName = "__asan_mapping_scale";

// Stack malloc/free callbacks are named <template><size class>.
static const int kMaxAsanStackMallocSizeClass = 10;
static const char *const kAsanStackMallocNameTemplate = "__asan_stack_malloc_";
static const char *const kAsanStackFreeNameTemplate = "__asan_stack_free_";
static const char *const kAsanGenPrefix = "__asan_gen_";
static const char *const kAsanPoisonStackMemoryName =
    "__asan_poison_stack_memory";
static const char *const kAsanUnpoisonStackMemoryName =
    "__asan_unpoison_stack_memory";

static const char *const kAsanOptionDetectUAR =
    "__asan_option_detect_stack_use_after_return";

// Only defined in builds with assertions enabled.
#ifndef NDEBUG
static const int kAsanStackAfterReturnMagic = 0xf5;
#endif

// Access sizes are powers of two: 1, 2, 4, 8, 16.
static const size_t kNumberOfAccessSizes = 5;
102
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000103// Command-line flags.
104
105// This flag may need to be replaced with -f[no-]asan-reads.
106static cl::opt<bool> ClInstrumentReads("asan-instrument-reads",
107 cl::desc("instrument read instructions"), cl::Hidden, cl::init(true));
108static cl::opt<bool> ClInstrumentWrites("asan-instrument-writes",
109 cl::desc("instrument write instructions"), cl::Hidden, cl::init(true));
Kostya Serebryany90241602012-05-30 09:04:06 +0000110static cl::opt<bool> ClInstrumentAtomics("asan-instrument-atomics",
111 cl::desc("instrument atomic instructions (rmw, cmpxchg)"),
112 cl::Hidden, cl::init(true));
Kostya Serebryany1e575ab2012-08-15 08:58:58 +0000113static cl::opt<bool> ClAlwaysSlowPath("asan-always-slow-path",
114 cl::desc("use instrumentation with slow path for all accesses"),
115 cl::Hidden, cl::init(false));
Kostya Serebryany874dae62012-07-16 16:15:40 +0000116// This flag limits the number of instructions to be instrumented
Kostya Serebryanyc387ca72012-06-28 09:34:41 +0000117// in any given BB. Normally, this should be set to unlimited (INT_MAX),
118// but due to http://llvm.org/bugs/show_bug.cgi?id=12652 we temporary
119// set it to 10000.
120static cl::opt<int> ClMaxInsnsToInstrumentPerBB("asan-max-ins-per-bb",
121 cl::init(10000),
122 cl::desc("maximal number of instructions to instrument in any given BB"),
123 cl::Hidden);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000124// This flag may need to be replaced with -f[no]asan-stack.
125static cl::opt<bool> ClStack("asan-stack",
126 cl::desc("Handle stack memory"), cl::Hidden, cl::init(true));
127// This flag may need to be replaced with -f[no]asan-use-after-return.
128static cl::opt<bool> ClUseAfterReturn("asan-use-after-return",
129 cl::desc("Check return-after-free"), cl::Hidden, cl::init(false));
130// This flag may need to be replaced with -f[no]asan-globals.
131static cl::opt<bool> ClGlobals("asan-globals",
132 cl::desc("Handle global objects"), cl::Hidden, cl::init(true));
Bob Wilsonda4147c2013-11-15 07:16:09 +0000133static cl::opt<bool> ClCoverage("asan-coverage",
134 cl::desc("ASan coverage"), cl::Hidden, cl::init(false));
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000135static cl::opt<bool> ClInitializers("asan-initialization-order",
136 cl::desc("Handle C++ initializer order"), cl::Hidden, cl::init(false));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000137static cl::opt<bool> ClMemIntrin("asan-memintrin",
138 cl::desc("Handle memset/memcpy/memmove"), cl::Hidden, cl::init(true));
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000139static cl::opt<unsigned> ClRealignStack("asan-realign-stack",
140 cl::desc("Realign stack to the value of this flag (power of two)"),
141 cl::Hidden, cl::init(32));
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000142static cl::opt<std::string> ClBlacklistFile("asan-blacklist",
143 cl::desc("File containing the list of objects to ignore "
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000144 "during instrumentation"), cl::Hidden);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000145
Kostya Serebryany9f5213f2013-06-26 09:18:17 +0000146// This is an experimental feature that will allow to choose between
147// instrumented and non-instrumented code at link-time.
148// If this option is on, just before instrumenting a function we create its
149// clone; if the function is not changed by asan the clone is deleted.
150// If we end up with a clone, we put the instrumented function into a section
151// called "ASAN" and the uninstrumented function into a section called "NOASAN".
152//
153// This is still a prototype, we need to figure out a way to keep two copies of
154// a function so that the linker can easily choose one of them.
155static cl::opt<bool> ClKeepUninstrumented("asan-keep-uninstrumented-functions",
156 cl::desc("Keep uninstrumented copies of functions"),
157 cl::Hidden, cl::init(false));
158
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000159// These flags allow to change the shadow mapping.
160// The shadow mapping looks like
161// Shadow = (Mem >> scale) + (1 << offset_log)
162static cl::opt<int> ClMappingScale("asan-mapping-scale",
163 cl::desc("scale of asan shadow mapping"), cl::Hidden, cl::init(0));
164static cl::opt<int> ClMappingOffsetLog("asan-mapping-offset-log",
165 cl::desc("offset of asan shadow mapping"), cl::Hidden, cl::init(-1));
Kostya Serebryanyc5f44bc2013-02-11 14:36:01 +0000166static cl::opt<bool> ClShort64BitOffset("asan-short-64bit-mapping-offset",
167 cl::desc("Use short immediate constant as the mapping offset for 64bit"),
Kostya Serebryanybe733372013-02-12 11:11:02 +0000168 cl::Hidden, cl::init(true));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000169
170// Optimization flags. Not user visible, used mostly for testing
171// and benchmarking the tool.
172static cl::opt<bool> ClOpt("asan-opt",
173 cl::desc("Optimize instrumentation"), cl::Hidden, cl::init(true));
174static cl::opt<bool> ClOptSameTemp("asan-opt-same-temp",
175 cl::desc("Instrument the same temp just once"), cl::Hidden,
176 cl::init(true));
177static cl::opt<bool> ClOptGlobals("asan-opt-globals",
178 cl::desc("Don't instrument scalar globals"), cl::Hidden, cl::init(true));
179
Alexey Samsonovdf624522012-11-29 18:14:24 +0000180static cl::opt<bool> ClCheckLifetime("asan-check-lifetime",
181 cl::desc("Use llvm.lifetime intrinsics to insert extra checks"),
182 cl::Hidden, cl::init(false));
183
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000184// Debug flags.
185static cl::opt<int> ClDebug("asan-debug", cl::desc("debug"), cl::Hidden,
186 cl::init(0));
187static cl::opt<int> ClDebugStack("asan-debug-stack", cl::desc("debug stack"),
188 cl::Hidden, cl::init(0));
189static cl::opt<std::string> ClDebugFunc("asan-debug-func",
190 cl::Hidden, cl::desc("Debug func"));
191static cl::opt<int> ClDebugMin("asan-debug-min", cl::desc("Debug min inst"),
192 cl::Hidden, cl::init(-1));
193static cl::opt<int> ClDebugMax("asan-debug-max", cl::desc("Debug man inst"),
194 cl::Hidden, cl::init(-1));
195
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000196STATISTIC(NumInstrumentedReads, "Number of instrumented reads");
197STATISTIC(NumInstrumentedWrites, "Number of instrumented writes");
198STATISTIC(NumOptimizedAccessesToGlobalArray,
199 "Number of optimized accesses to global arrays");
200STATISTIC(NumOptimizedAccessesToGlobalVar,
201 "Number of optimized accesses to global vars");
202
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000203namespace {
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000204/// A set of dynamically initialized globals extracted from metadata.
205class SetOfDynamicallyInitializedGlobals {
206 public:
207 void Init(Module& M) {
208 // Clang generates metadata identifying all dynamically initialized globals.
209 NamedMDNode *DynamicGlobals =
210 M.getNamedMetadata("llvm.asan.dynamically_initialized_globals");
211 if (!DynamicGlobals)
212 return;
213 for (int i = 0, n = DynamicGlobals->getNumOperands(); i < n; ++i) {
214 MDNode *MDN = DynamicGlobals->getOperand(i);
215 assert(MDN->getNumOperands() == 1);
216 Value *VG = MDN->getOperand(0);
217 // The optimizer may optimize away a global entirely, in which case we
218 // cannot instrument access to it.
219 if (!VG)
220 continue;
221 DynInitGlobals.insert(cast<GlobalVariable>(VG));
222 }
223 }
224 bool Contains(GlobalVariable *G) { return DynInitGlobals.count(G) != 0; }
225 private:
226 SmallSet<GlobalValue*, 32> DynInitGlobals;
227};
228
/// Parameters of the shadow mapping, which follows the rule:
///   shadow = (mem >> Scale) ADD-or-OR Offset.
struct ShadowMapping {
  /// Right-shift applied to the application address.
  int Scale;
  /// Constant combined with the shifted address.
  uint64_t Offset;
  /// Selects between the OR and ADD forms of the rule above.
  bool OrShadowOffset;
};
236
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000237static ShadowMapping getShadowMapping(const Module &M, int LongSize) {
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000238 llvm::Triple TargetTriple(M.getTargetTriple());
239 bool IsAndroid = TargetTriple.getEnvironment() == llvm::Triple::Android;
Alexander Potapenko259e8122013-02-12 12:41:12 +0000240 bool IsMacOSX = TargetTriple.getOS() == llvm::Triple::MacOSX;
Bill Schmidt0a9170d2013-07-26 01:35:43 +0000241 bool IsPPC64 = TargetTriple.getArch() == llvm::Triple::ppc64 ||
242 TargetTriple.getArch() == llvm::Triple::ppc64le;
Kostya Serebryanybe733372013-02-12 11:11:02 +0000243 bool IsX86_64 = TargetTriple.getArch() == llvm::Triple::x86_64;
Kostya Serebryany9e62b302013-06-03 14:46:56 +0000244 bool IsMIPS32 = TargetTriple.getArch() == llvm::Triple::mips ||
245 TargetTriple.getArch() == llvm::Triple::mipsel;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000246
247 ShadowMapping Mapping;
248
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000249 // OR-ing shadow offset if more efficient (at least on x86),
250 // but on ppc64 we have to use add since the shadow offset is not neccesary
251 // 1/8-th of the address space.
Kostya Serebryanyc5f44bc2013-02-11 14:36:01 +0000252 Mapping.OrShadowOffset = !IsPPC64 && !ClShort64BitOffset;
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000253
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000254 Mapping.Offset = IsAndroid ? 0 :
Kostya Serebryany9e62b302013-06-03 14:46:56 +0000255 (LongSize == 32 ?
256 (IsMIPS32 ? kMIPS32_ShadowOffset32 : kDefaultShadowOffset32) :
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000257 IsPPC64 ? kPPC64_ShadowOffset64 : kDefaultShadowOffset64);
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000258 if (!IsAndroid && ClShort64BitOffset && IsX86_64 && !IsMacOSX) {
Kostya Serebryanybe733372013-02-12 11:11:02 +0000259 assert(LongSize == 64);
Kostya Serebryanyc5f44bc2013-02-11 14:36:01 +0000260 Mapping.Offset = kDefaultShort64bitShadowOffset;
Kostya Serebryanycaf11af2013-02-13 05:14:12 +0000261 }
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000262 if (!IsAndroid && ClMappingOffsetLog >= 0) {
Alexey Samsonov1345d352013-01-16 13:23:28 +0000263 // Zero offset log is the special case.
264 Mapping.Offset = (ClMappingOffsetLog == 0) ? 0 : 1ULL << ClMappingOffsetLog;
265 }
266
267 Mapping.Scale = kDefaultShadowScale;
268 if (ClMappingScale) {
269 Mapping.Scale = ClMappingScale;
270 }
271
272 return Mapping;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000273}
274
/// Returns the redzone size, in bytes, for the given shadow mapping scale.
///
/// The redzone used for stack and globals is at least 32 bytes; for scales
/// 6 and 7 it has to be 64 and 128 bytes respectively.
static size_t RedzoneSizeForScale(int MappingScale) {
  const unsigned MinRedzone = 32U;
  const unsigned Granularity = 1U << MappingScale;
  return Granularity > MinRedzone ? Granularity : MinRedzone;
}
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000280
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000281/// AddressSanitizer: instrument the code in module to find memory bugs.
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000282struct AddressSanitizer : public FunctionPass {
Alexey Samsonov819eddc2013-03-14 12:38:58 +0000283 AddressSanitizer(bool CheckInitOrder = true,
Alexey Samsonovdf624522012-11-29 18:14:24 +0000284 bool CheckUseAfterReturn = false,
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000285 bool CheckLifetime = false,
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000286 StringRef BlacklistFile = StringRef())
Alexey Samsonovdf624522012-11-29 18:14:24 +0000287 : FunctionPass(ID),
288 CheckInitOrder(CheckInitOrder || ClInitializers),
289 CheckUseAfterReturn(CheckUseAfterReturn || ClUseAfterReturn),
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000290 CheckLifetime(CheckLifetime || ClCheckLifetime),
291 BlacklistFile(BlacklistFile.empty() ? ClBlacklistFile
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000292 : BlacklistFile) {}
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000293 virtual const char *getPassName() const {
294 return "AddressSanitizerFunctionPass";
295 }
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000296 void instrumentMop(Instruction *I);
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000297 void instrumentAddress(Instruction *OrigIns, Instruction *InsertBefore,
298 Value *Addr, uint32_t TypeSize, bool IsWrite,
299 Value *SizeArgument);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000300 Value *createSlowPathCmp(IRBuilder<> &IRB, Value *AddrLong,
301 Value *ShadowValue, uint32_t TypeSize);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000302 Instruction *generateCrashCode(Instruction *InsertBefore, Value *Addr,
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000303 bool IsWrite, size_t AccessSizeIndex,
304 Value *SizeArgument);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000305 bool instrumentMemIntrinsic(MemIntrinsic *MI);
306 void instrumentMemIntrinsicParam(Instruction *OrigIns, Value *Addr,
Kostya Serebryany874dae62012-07-16 16:15:40 +0000307 Value *Size,
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000308 Instruction *InsertBefore, bool IsWrite);
309 Value *memToShadow(Value *Shadow, IRBuilder<> &IRB);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000310 bool runOnFunction(Function &F);
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +0000311 bool maybeInsertAsanInitAtFunctionEntry(Function &F);
Alexey Samsonov1345d352013-01-16 13:23:28 +0000312 void emitShadowMapping(Module &M, IRBuilder<> &IRB) const;
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000313 virtual bool doInitialization(Module &M);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000314 static char ID; // Pass identification, replacement for typeid
315
316 private:
Kostya Serebryany4b929da2012-11-29 09:54:21 +0000317 void initializeCallbacks(Module &M);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000318
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000319 bool ShouldInstrumentGlobal(GlobalVariable *G);
Kostya Serebryany1cdc6e92011-11-18 01:41:06 +0000320 bool LooksLikeCodeInBug11395(Instruction *I);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000321 void FindDynamicInitializers(Module &M);
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000322 bool GlobalIsLinkerInitialized(GlobalVariable *G);
Bob Wilsonda4147c2013-11-15 07:16:09 +0000323 bool InjectCoverage(Function &F);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000324
Alexey Samsonovdf624522012-11-29 18:14:24 +0000325 bool CheckInitOrder;
326 bool CheckUseAfterReturn;
327 bool CheckLifetime;
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000328 SmallString<64> BlacklistFile;
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000329
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000330 LLVMContext *C;
Micah Villmowcdfe20b2012-10-08 16:38:25 +0000331 DataLayout *TD;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000332 int LongSize;
333 Type *IntptrTy;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000334 ShadowMapping Mapping;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000335 Function *AsanCtorFunction;
336 Function *AsanInitFunction;
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000337 Function *AsanHandleNoReturnFunc;
Bob Wilsonda4147c2013-11-15 07:16:09 +0000338 Function *AsanCovFunction;
Peter Collingbourne015370e2013-07-09 22:02:49 +0000339 OwningPtr<SpecialCaseList> BL;
Kostya Serebryany4273bb02012-07-16 14:09:42 +0000340 // This array is indexed by AccessIsWrite and log2(AccessSize).
341 Function *AsanErrorCallback[2][kNumberOfAccessSizes];
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000342 // This array is indexed by AccessIsWrite.
343 Function *AsanErrorCallbackSized[2];
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000344 InlineAsm *EmptyAsm;
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000345 SetOfDynamicallyInitializedGlobals DynamicallyInitializedGlobals;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000346
347 friend struct FunctionStackPoisoner;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000348};
Kostya Serebryany874dae62012-07-16 16:15:40 +0000349
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000350class AddressSanitizerModule : public ModulePass {
Kostya Serebryany20a79972012-11-22 03:18:50 +0000351 public:
Alexey Samsonov819eddc2013-03-14 12:38:58 +0000352 AddressSanitizerModule(bool CheckInitOrder = true,
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000353 StringRef BlacklistFile = StringRef())
Alexey Samsonovdf624522012-11-29 18:14:24 +0000354 : ModulePass(ID),
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000355 CheckInitOrder(CheckInitOrder || ClInitializers),
356 BlacklistFile(BlacklistFile.empty() ? ClBlacklistFile
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000357 : BlacklistFile) {}
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000358 bool runOnModule(Module &M);
359 static char ID; // Pass identification, replacement for typeid
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000360 virtual const char *getPassName() const {
361 return "AddressSanitizerModule";
362 }
Alexey Samsonov261177a2012-12-04 01:34:23 +0000363
Kostya Serebryany20a79972012-11-22 03:18:50 +0000364 private:
Alexey Samsonov788381b2012-12-25 12:28:20 +0000365 void initializeCallbacks(Module &M);
366
Kostya Serebryany20a79972012-11-22 03:18:50 +0000367 bool ShouldInstrumentGlobal(GlobalVariable *G);
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000368 void createInitializerPoisonCalls(Module &M, GlobalValue *ModuleName);
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000369 size_t MinRedzoneSizeForGlobal() const {
Alexey Samsonov1345d352013-01-16 13:23:28 +0000370 return RedzoneSizeForScale(Mapping.Scale);
371 }
Kostya Serebryany20a79972012-11-22 03:18:50 +0000372
Alexey Samsonovdf624522012-11-29 18:14:24 +0000373 bool CheckInitOrder;
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000374 SmallString<64> BlacklistFile;
Alexey Samsonov347bcd32013-01-17 11:12:32 +0000375
Peter Collingbourne015370e2013-07-09 22:02:49 +0000376 OwningPtr<SpecialCaseList> BL;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000377 SetOfDynamicallyInitializedGlobals DynamicallyInitializedGlobals;
378 Type *IntptrTy;
379 LLVMContext *C;
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000380 DataLayout *TD;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000381 ShadowMapping Mapping;
Alexey Samsonov788381b2012-12-25 12:28:20 +0000382 Function *AsanPoisonGlobals;
383 Function *AsanUnpoisonGlobals;
384 Function *AsanRegisterGlobals;
385 Function *AsanUnregisterGlobals;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000386};
387
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000388// Stack poisoning does not play well with exception handling.
389// When an exception is thrown, we essentially bypass the code
390// that unpoisones the stack. This is why the run-time library has
391// to intercept __cxa_throw (as well as longjmp, etc) and unpoison the entire
392// stack in the interceptor. This however does not work inside the
393// actual function which catches the exception. Most likely because the
394// compiler hoists the load of the shadow value somewhere too high.
395// This causes asan to report a non-existing bug on 453.povray.
396// It sounds like an LLVM bug.
397struct FunctionStackPoisoner : public InstVisitor<FunctionStackPoisoner> {
398 Function &F;
399 AddressSanitizer &ASan;
400 DIBuilder DIB;
401 LLVMContext *C;
402 Type *IntptrTy;
403 Type *IntptrPtrTy;
Alexey Samsonov1345d352013-01-16 13:23:28 +0000404 ShadowMapping Mapping;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000405
406 SmallVector<AllocaInst*, 16> AllocaVec;
407 SmallVector<Instruction*, 8> RetVec;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000408 unsigned StackAlignment;
409
Kostya Serebryany6805de52013-09-10 13:16:56 +0000410 Function *AsanStackMallocFunc[kMaxAsanStackMallocSizeClass + 1],
411 *AsanStackFreeFunc[kMaxAsanStackMallocSizeClass + 1];
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000412 Function *AsanPoisonStackMemoryFunc, *AsanUnpoisonStackMemoryFunc;
413
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000414 // Stores a place and arguments of poisoning/unpoisoning call for alloca.
415 struct AllocaPoisonCall {
416 IntrinsicInst *InsBefore;
Alexey Samsonova788b942013-11-18 14:53:55 +0000417 AllocaInst *AI;
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000418 uint64_t Size;
419 bool DoPoison;
420 };
421 SmallVector<AllocaPoisonCall, 8> AllocaPoisonCallVec;
422
423 // Maps Value to an AllocaInst from which the Value is originated.
424 typedef DenseMap<Value*, AllocaInst*> AllocaForValueMapTy;
425 AllocaForValueMapTy AllocaForValue;
426
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000427 FunctionStackPoisoner(Function &F, AddressSanitizer &ASan)
428 : F(F), ASan(ASan), DIB(*F.getParent()), C(ASan.C),
429 IntptrTy(ASan.IntptrTy), IntptrPtrTy(PointerType::get(IntptrTy, 0)),
Alexey Samsonov1345d352013-01-16 13:23:28 +0000430 Mapping(ASan.Mapping),
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000431 StackAlignment(1 << Mapping.Scale) {}
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000432
433 bool runOnFunction() {
434 if (!ClStack) return false;
435 // Collect alloca, ret, lifetime instructions etc.
436 for (df_iterator<BasicBlock*> DI = df_begin(&F.getEntryBlock()),
437 DE = df_end(&F.getEntryBlock()); DI != DE; ++DI) {
438 BasicBlock *BB = *DI;
439 visit(*BB);
440 }
441 if (AllocaVec.empty()) return false;
442
443 initializeCallbacks(*F.getParent());
444
445 poisonStack();
446
447 if (ClDebugStack) {
448 DEBUG(dbgs() << F);
449 }
450 return true;
451 }
452
453 // Finds all static Alloca instructions and puts
454 // poisoned red zones around all of them.
455 // Then unpoison everything back before the function returns.
456 void poisonStack();
457
458 // ----------------------- Visitors.
459 /// \brief Collect all Ret instructions.
460 void visitReturnInst(ReturnInst &RI) {
461 RetVec.push_back(&RI);
462 }
463
464 /// \brief Collect Alloca instructions we want (and can) handle.
465 void visitAllocaInst(AllocaInst &AI) {
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000466 if (!isInterestingAlloca(AI)) return;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000467
468 StackAlignment = std::max(StackAlignment, AI.getAlignment());
469 AllocaVec.push_back(&AI);
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000470 }
471
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000472 /// \brief Collect lifetime intrinsic calls to check for use-after-scope
473 /// errors.
474 void visitIntrinsicInst(IntrinsicInst &II) {
475 if (!ASan.CheckLifetime) return;
476 Intrinsic::ID ID = II.getIntrinsicID();
477 if (ID != Intrinsic::lifetime_start &&
478 ID != Intrinsic::lifetime_end)
479 return;
480 // Found lifetime intrinsic, add ASan instrumentation if necessary.
481 ConstantInt *Size = dyn_cast<ConstantInt>(II.getArgOperand(0));
482 // If size argument is undefined, don't do anything.
483 if (Size->isMinusOne()) return;
484 // Check that size doesn't saturate uint64_t and can
485 // be stored in IntptrTy.
486 const uint64_t SizeValue = Size->getValue().getLimitedValue();
487 if (SizeValue == ~0ULL ||
488 !ConstantInt::isValueValidForType(IntptrTy, SizeValue))
489 return;
490 // Find alloca instruction that corresponds to llvm.lifetime argument.
491 AllocaInst *AI = findAllocaForValue(II.getArgOperand(1));
492 if (!AI) return;
493 bool DoPoison = (ID == Intrinsic::lifetime_end);
Alexey Samsonova788b942013-11-18 14:53:55 +0000494 AllocaPoisonCall APC = {&II, AI, SizeValue, DoPoison};
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000495 AllocaPoisonCallVec.push_back(APC);
496 }
497
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000498 // ---------------------- Helpers.
499 void initializeCallbacks(Module &M);
500
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000501 // Check if we want (and can) handle this alloca.
Jakub Staszak23ec6a92013-08-09 20:53:48 +0000502 bool isInterestingAlloca(AllocaInst &AI) const {
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000503 return (!AI.isArrayAllocation() && AI.isStaticAlloca() &&
504 AI.getAllocatedType()->isSized() &&
505 // alloca() may be called with 0 size, ignore it.
506 getAllocaSizeInBytes(&AI) > 0);
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000507 }
508
Jakub Staszak23ec6a92013-08-09 20:53:48 +0000509 uint64_t getAllocaSizeInBytes(AllocaInst *AI) const {
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000510 Type *Ty = AI->getAllocatedType();
511 uint64_t SizeInBytes = ASan.TD->getTypeAllocSize(Ty);
512 return SizeInBytes;
513 }
Alexey Samsonov29dd7f22012-12-27 08:50:58 +0000514 /// Finds alloca where the value comes from.
515 AllocaInst *findAllocaForValue(Value *V);
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000516 void poisonRedZones(const ArrayRef<uint8_t> ShadowBytes, IRBuilder<> &IRB,
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000517 Value *ShadowBase, bool DoPoison);
Jakub Staszak23ec6a92013-08-09 20:53:48 +0000518 void poisonAlloca(Value *V, uint64_t Size, IRBuilder<> &IRB, bool DoPoison);
Kostya Serebryanybc86efb2013-09-17 12:14:50 +0000519
520 void SetShadowToStackAfterReturnInlined(IRBuilder<> &IRB, Value *ShadowBase,
521 int Size);
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +0000522};
523
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000524} // namespace
525
526char AddressSanitizer::ID = 0;
527INITIALIZE_PASS(AddressSanitizer, "asan",
528 "AddressSanitizer: detects use-after-free and out-of-bounds bugs.",
529 false, false)
Alexey Samsonovdf624522012-11-29 18:14:24 +0000530FunctionPass *llvm::createAddressSanitizerFunctionPass(
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000531 bool CheckInitOrder, bool CheckUseAfterReturn, bool CheckLifetime,
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000532 StringRef BlacklistFile) {
Alexey Samsonovdf624522012-11-29 18:14:24 +0000533 return new AddressSanitizer(CheckInitOrder, CheckUseAfterReturn,
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000534 CheckLifetime, BlacklistFile);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000535}
536
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000537char AddressSanitizerModule::ID = 0;
538INITIALIZE_PASS(AddressSanitizerModule, "asan-module",
539 "AddressSanitizer: detects use-after-free and out-of-bounds bugs."
540 "ModulePass", false, false)
Alexey Samsonovef51c3f2012-12-03 19:09:26 +0000541ModulePass *llvm::createAddressSanitizerModulePass(
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000542 bool CheckInitOrder, StringRef BlacklistFile) {
543 return new AddressSanitizerModule(CheckInitOrder, BlacklistFile);
Alexander Potapenkoc94cf8f2012-01-23 11:22:43 +0000544}
545
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000546static size_t TypeSizeToSizeIndex(uint32_t TypeSize) {
Michael J. Spencerdf1ecbd72013-05-24 22:23:49 +0000547 size_t Res = countTrailingZeros(TypeSize / 8);
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000548 assert(Res < kNumberOfAccessSizes);
549 return Res;
550}
551
Bill Wendling58f8cef2013-08-06 22:52:42 +0000552// \brief Create a constant for Str so that we can pass it to the run-time lib.
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000553static GlobalVariable *createPrivateGlobalForString(
554 Module &M, StringRef Str, bool AllowMerging) {
Chris Lattnercf9e8f62012-02-05 02:29:43 +0000555 Constant *StrConst = ConstantDataArray::getString(M.getContext(), Str);
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000556 // For module-local strings that can be merged with another one we set the
Alexander Potapenko4f0335f2013-12-25 16:46:27 +0000557 // private linkage and the unnamed_addr attribute.
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000558 // Non-mergeable strings are made linker_private to remove them from the
559 // symbol table. "private" linkage doesn't work for Darwin, where the
560 // "L"-prefixed globals end up in __TEXT,__const section
561 // (see http://llvm.org/bugs/show_bug.cgi?id=17976 for more info).
562 GlobalValue::LinkageTypes linkage =
Alexander Potapenko4f0335f2013-12-25 16:46:27 +0000563 AllowMerging ? GlobalValue::PrivateLinkage
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000564 : GlobalValue::LinkerPrivateLinkage;
565 GlobalVariable *GV =
566 new GlobalVariable(M, StrConst->getType(), true,
567 linkage, StrConst, kAsanGenPrefix);
568 if (AllowMerging) GV->setUnnamedAddr(true);
Kostya Serebryany10cc12f2013-03-18 09:38:39 +0000569 GV->setAlignment(1); // Strings may not be merged w/o setting align 1.
570 return GV;
Kostya Serebryany139a9372012-11-20 14:16:08 +0000571}
572
573static bool GlobalWasGeneratedByAsan(GlobalVariable *G) {
574 return G->getName().find(kAsanGenPrefix) == 0;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000575}
576
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000577Value *AddressSanitizer::memToShadow(Value *Shadow, IRBuilder<> &IRB) {
578 // Shadow >> scale
Alexey Samsonov1345d352013-01-16 13:23:28 +0000579 Shadow = IRB.CreateLShr(Shadow, Mapping.Scale);
580 if (Mapping.Offset == 0)
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000581 return Shadow;
582 // (Shadow >> scale) | offset
Kostya Serebryany4766fe62013-01-23 12:54:55 +0000583 if (Mapping.OrShadowOffset)
584 return IRB.CreateOr(Shadow, ConstantInt::get(IntptrTy, Mapping.Offset));
585 else
586 return IRB.CreateAdd(Shadow, ConstantInt::get(IntptrTy, Mapping.Offset));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000587}
588
Kostya Serebryany874dae62012-07-16 16:15:40 +0000589void AddressSanitizer::instrumentMemIntrinsicParam(
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000590 Instruction *OrigIns,
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000591 Value *Addr, Value *Size, Instruction *InsertBefore, bool IsWrite) {
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000592 IRBuilder<> IRB(InsertBefore);
593 if (Size->getType() != IntptrTy)
594 Size = IRB.CreateIntCast(Size, IntptrTy, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000595 // Check the first byte.
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000596 instrumentAddress(OrigIns, InsertBefore, Addr, 8, IsWrite, Size);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000597 // Check the last byte.
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000598 IRB.SetInsertPoint(InsertBefore);
599 Value *SizeMinusOne = IRB.CreateSub(Size, ConstantInt::get(IntptrTy, 1));
600 Value *AddrLong = IRB.CreatePointerCast(Addr, IntptrTy);
601 Value *AddrLast = IRB.CreateAdd(AddrLong, SizeMinusOne);
602 instrumentAddress(OrigIns, InsertBefore, AddrLast, 8, IsWrite, Size);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000603}
604
605// Instrument memset/memmove/memcpy
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000606bool AddressSanitizer::instrumentMemIntrinsic(MemIntrinsic *MI) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000607 Value *Dst = MI->getDest();
608 MemTransferInst *MemTran = dyn_cast<MemTransferInst>(MI);
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000609 Value *Src = MemTran ? MemTran->getSource() : 0;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000610 Value *Length = MI->getLength();
611
612 Constant *ConstLength = dyn_cast<Constant>(Length);
613 Instruction *InsertBefore = MI;
614 if (ConstLength) {
615 if (ConstLength->isNullValue()) return false;
616 } else {
617 // The size is not a constant so it could be zero -- check at run-time.
618 IRBuilder<> IRB(InsertBefore);
619
620 Value *Cmp = IRB.CreateICmpNE(Length,
Kostya Serebryanyeeaf6882012-07-02 11:42:29 +0000621 Constant::getNullValue(Length->getType()));
Evgeniy Stepanova9164e92013-12-19 13:29:56 +0000622 InsertBefore = SplitBlockAndInsertIfThen(Cmp, InsertBefore, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000623 }
624
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000625 instrumentMemIntrinsicParam(MI, Dst, Length, InsertBefore, true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000626 if (Src)
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000627 instrumentMemIntrinsicParam(MI, Src, Length, InsertBefore, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000628 return true;
629}
630
Kostya Serebryany90241602012-05-30 09:04:06 +0000631// If I is an interesting memory access, return the PointerOperand
632// and set IsWrite. Otherwise return NULL.
633static Value *isInterestingMemoryAccess(Instruction *I, bool *IsWrite) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000634 if (LoadInst *LI = dyn_cast<LoadInst>(I)) {
Kostya Serebryany90241602012-05-30 09:04:06 +0000635 if (!ClInstrumentReads) return NULL;
636 *IsWrite = false;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000637 return LI->getPointerOperand();
638 }
Kostya Serebryany90241602012-05-30 09:04:06 +0000639 if (StoreInst *SI = dyn_cast<StoreInst>(I)) {
640 if (!ClInstrumentWrites) return NULL;
641 *IsWrite = true;
642 return SI->getPointerOperand();
643 }
644 if (AtomicRMWInst *RMW = dyn_cast<AtomicRMWInst>(I)) {
645 if (!ClInstrumentAtomics) return NULL;
646 *IsWrite = true;
647 return RMW->getPointerOperand();
648 }
649 if (AtomicCmpXchgInst *XCHG = dyn_cast<AtomicCmpXchgInst>(I)) {
650 if (!ClInstrumentAtomics) return NULL;
651 *IsWrite = true;
652 return XCHG->getPointerOperand();
653 }
654 return NULL;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000655}
656
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000657bool AddressSanitizer::GlobalIsLinkerInitialized(GlobalVariable *G) {
658 // If a global variable does not have dynamic initialization we don't
659 // have to instrument it. However, if a global does not have initializer
660 // at all, we assume it has dynamic initializer (in other TU).
661 return G->hasInitializer() && !DynamicallyInitializedGlobals.Contains(G);
662}
663
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000664void AddressSanitizer::instrumentMop(Instruction *I) {
Axel Naumann4a127062012-09-17 14:20:57 +0000665 bool IsWrite = false;
Kostya Serebryany90241602012-05-30 09:04:06 +0000666 Value *Addr = isInterestingMemoryAccess(I, &IsWrite);
667 assert(Addr);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000668 if (ClOpt && ClOptGlobals) {
669 if (GlobalVariable *G = dyn_cast<GlobalVariable>(Addr)) {
670 // If initialization order checking is disabled, a simple access to a
671 // dynamically initialized global is always valid.
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000672 if (!CheckInitOrder || GlobalIsLinkerInitialized(G)) {
673 NumOptimizedAccessesToGlobalVar++;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000674 return;
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000675 }
676 }
677 ConstantExpr *CE = dyn_cast<ConstantExpr>(Addr);
678 if (CE && CE->isGEPWithNoNotionalOverIndexing()) {
679 if (GlobalVariable *G = dyn_cast<GlobalVariable>(CE->getOperand(0))) {
680 if (CE->getOperand(1)->isNullValue() && GlobalIsLinkerInitialized(G)) {
681 NumOptimizedAccessesToGlobalArray++;
682 return;
683 }
684 }
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000685 }
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000686 }
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000687
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000688 Type *OrigPtrTy = Addr->getType();
689 Type *OrigTy = cast<PointerType>(OrigPtrTy)->getElementType();
690
691 assert(OrigTy->isSized());
Kostya Serebryany7ca384b2013-02-18 13:47:02 +0000692 uint32_t TypeSize = TD->getTypeStoreSizeInBits(OrigTy);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000693
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000694 assert((TypeSize % 8) == 0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000695
Kostya Serebryanyd3d23be2013-10-16 14:06:14 +0000696 if (IsWrite)
697 NumInstrumentedWrites++;
698 else
699 NumInstrumentedReads++;
700
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000701 // Instrument a 1-, 2-, 4-, 8-, or 16- byte access with one check.
702 if (TypeSize == 8 || TypeSize == 16 ||
703 TypeSize == 32 || TypeSize == 64 || TypeSize == 128)
704 return instrumentAddress(I, I, Addr, TypeSize, IsWrite, 0);
705 // Instrument unusual size (but still multiple of 8).
706 // We can not do it with a single check, so we do 1-byte check for the first
707 // and the last bytes. We call __asan_report_*_n(addr, real_size) to be able
708 // to report the actual access size.
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000709 IRBuilder<> IRB(I);
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000710 Value *LastByte = IRB.CreateIntToPtr(
711 IRB.CreateAdd(IRB.CreatePointerCast(Addr, IntptrTy),
712 ConstantInt::get(IntptrTy, TypeSize / 8 - 1)),
713 OrigPtrTy);
714 Value *Size = ConstantInt::get(IntptrTy, TypeSize / 8);
715 instrumentAddress(I, I, Addr, 8, IsWrite, Size);
716 instrumentAddress(I, I, LastByte, 8, IsWrite, Size);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000717}
718
Alexander Potapenko056e27e2012-04-23 10:47:31 +0000719// Validate the result of Module::getOrInsertFunction called for an interface
720// function of AddressSanitizer. If the instrumented module defines a function
721// with the same name, their prototypes must match, otherwise
722// getOrInsertFunction returns a bitcast.
Kostya Serebryany20a79972012-11-22 03:18:50 +0000723static Function *checkInterfaceFunction(Constant *FuncOrBitcast) {
Alexander Potapenko056e27e2012-04-23 10:47:31 +0000724 if (isa<Function>(FuncOrBitcast)) return cast<Function>(FuncOrBitcast);
725 FuncOrBitcast->dump();
726 report_fatal_error("trying to redefine an AddressSanitizer "
727 "interface function");
728}
729
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000730Instruction *AddressSanitizer::generateCrashCode(
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000731 Instruction *InsertBefore, Value *Addr,
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000732 bool IsWrite, size_t AccessSizeIndex, Value *SizeArgument) {
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000733 IRBuilder<> IRB(InsertBefore);
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000734 CallInst *Call = SizeArgument
735 ? IRB.CreateCall2(AsanErrorCallbackSized[IsWrite], Addr, SizeArgument)
736 : IRB.CreateCall(AsanErrorCallback[IsWrite][AccessSizeIndex], Addr);
737
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000738 // We don't do Call->setDoesNotReturn() because the BB already has
739 // UnreachableInst at the end.
740 // This EmptyAsm is required to avoid callback merge.
741 IRB.CreateCall(EmptyAsm);
Kostya Serebryany3411f2e2012-01-06 18:09:21 +0000742 return Call;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000743}
744
Kostya Serebryanyc4ce5df2012-07-16 17:12:07 +0000745Value *AddressSanitizer::createSlowPathCmp(IRBuilder<> &IRB, Value *AddrLong,
Kostya Serebryany874dae62012-07-16 16:15:40 +0000746 Value *ShadowValue,
747 uint32_t TypeSize) {
Alexey Samsonov1345d352013-01-16 13:23:28 +0000748 size_t Granularity = 1 << Mapping.Scale;
Kostya Serebryany874dae62012-07-16 16:15:40 +0000749 // Addr & (Granularity - 1)
750 Value *LastAccessedByte = IRB.CreateAnd(
751 AddrLong, ConstantInt::get(IntptrTy, Granularity - 1));
752 // (Addr & (Granularity - 1)) + size - 1
753 if (TypeSize / 8 > 1)
754 LastAccessedByte = IRB.CreateAdd(
755 LastAccessedByte, ConstantInt::get(IntptrTy, TypeSize / 8 - 1));
756 // (uint8_t) ((Addr & (Granularity-1)) + size - 1)
757 LastAccessedByte = IRB.CreateIntCast(
Kostya Serebryany1e575ab2012-08-15 08:58:58 +0000758 LastAccessedByte, ShadowValue->getType(), false);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000759 // ((uint8_t) ((Addr & (Granularity-1)) + size - 1)) >= ShadowValue
760 return IRB.CreateICmpSGE(LastAccessedByte, ShadowValue);
761}
762
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000763void AddressSanitizer::instrumentAddress(Instruction *OrigIns,
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000764 Instruction *InsertBefore,
765 Value *Addr, uint32_t TypeSize,
766 bool IsWrite, Value *SizeArgument) {
767 IRBuilder<> IRB(InsertBefore);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000768 Value *AddrLong = IRB.CreatePointerCast(Addr, IntptrTy);
769
770 Type *ShadowTy = IntegerType::get(
Alexey Samsonov1345d352013-01-16 13:23:28 +0000771 *C, std::max(8U, TypeSize >> Mapping.Scale));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000772 Type *ShadowPtrTy = PointerType::get(ShadowTy, 0);
773 Value *ShadowPtr = memToShadow(AddrLong, IRB);
774 Value *CmpVal = Constant::getNullValue(ShadowTy);
775 Value *ShadowValue = IRB.CreateLoad(
776 IRB.CreateIntToPtr(ShadowPtr, ShadowPtrTy));
777
778 Value *Cmp = IRB.CreateICmpNE(ShadowValue, CmpVal);
Kostya Serebryany0f7a80d2012-08-13 14:08:46 +0000779 size_t AccessSizeIndex = TypeSizeToSizeIndex(TypeSize);
Alexey Samsonov1345d352013-01-16 13:23:28 +0000780 size_t Granularity = 1 << Mapping.Scale;
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000781 TerminatorInst *CrashTerm = 0;
782
Kostya Serebryany1e575ab2012-08-15 08:58:58 +0000783 if (ClAlwaysSlowPath || (TypeSize < 8 * Granularity)) {
Evgeniy Stepanov8eb77d82012-10-19 10:48:31 +0000784 TerminatorInst *CheckTerm =
Evgeniy Stepanova9164e92013-12-19 13:29:56 +0000785 SplitBlockAndInsertIfThen(Cmp, InsertBefore, false);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000786 assert(dyn_cast<BranchInst>(CheckTerm)->isUnconditional());
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000787 BasicBlock *NextBB = CheckTerm->getSuccessor(0);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000788 IRB.SetInsertPoint(CheckTerm);
789 Value *Cmp2 = createSlowPathCmp(IRB, AddrLong, ShadowValue, TypeSize);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +0000790 BasicBlock *CrashBlock =
791 BasicBlock::Create(*C, "", NextBB->getParent(), NextBB);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000792 CrashTerm = new UnreachableInst(*C, CrashBlock);
Kostya Serebryanyf02c6062012-07-20 09:54:50 +0000793 BranchInst *NewTerm = BranchInst::Create(CrashBlock, NextBB, Cmp2);
794 ReplaceInstWithInst(CheckTerm, NewTerm);
Kostya Serebryany874dae62012-07-16 16:15:40 +0000795 } else {
Evgeniy Stepanova9164e92013-12-19 13:29:56 +0000796 CrashTerm = SplitBlockAndInsertIfThen(Cmp, InsertBefore, true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000797 }
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000798
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +0000799 Instruction *Crash = generateCrashCode(
800 CrashTerm, AddrLong, IsWrite, AccessSizeIndex, SizeArgument);
Kostya Serebryanyfda7a132012-08-14 14:04:51 +0000801 Crash->setDebugLoc(OrigIns->getDebugLoc());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000802}
803
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000804void AddressSanitizerModule::createInitializerPoisonCalls(
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000805 Module &M, GlobalValue *ModuleName) {
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000806 // We do all of our poisoning and unpoisoning within _GLOBAL__I_a.
807 Function *GlobalInit = M.getFunction("_GLOBAL__I_a");
808 // If that function is not present, this TU contains no globals, or they have
809 // all been optimized away
810 if (!GlobalInit)
811 return;
812
813 // Set up the arguments to our poison/unpoison functions.
814 IRBuilder<> IRB(GlobalInit->begin()->getFirstInsertionPt());
815
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000816 // Add a call to poison all external globals before the given function starts.
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000817 Value *ModuleNameAddr = ConstantExpr::getPointerCast(ModuleName, IntptrTy);
818 IRB.CreateCall(AsanPoisonGlobals, ModuleNameAddr);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000819
820 // Add calls to unpoison all globals before each return instruction.
821 for (Function::iterator I = GlobalInit->begin(), E = GlobalInit->end();
822 I != E; ++I) {
823 if (ReturnInst *RI = dyn_cast<ReturnInst>(I->getTerminator())) {
824 CallInst::Create(AsanUnpoisonGlobals, "", RI);
825 }
826 }
827}
828
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000829bool AddressSanitizerModule::ShouldInstrumentGlobal(GlobalVariable *G) {
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000830 Type *Ty = cast<PointerType>(G->getType())->getElementType();
Kostya Serebryany20343352012-10-17 13:40:06 +0000831 DEBUG(dbgs() << "GLOBAL: " << *G << "\n");
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000832
Kostya Serebryany2fa38f82012-09-05 07:29:56 +0000833 if (BL->isIn(*G)) return false;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000834 if (!Ty->isSized()) return false;
835 if (!G->hasInitializer()) return false;
Kostya Serebryany139a9372012-11-20 14:16:08 +0000836 if (GlobalWasGeneratedByAsan(G)) return false; // Our own global.
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000837 // Touch only those globals that will not be defined in other modules.
838 // Don't handle ODR type linkages since other modules may be built w/o asan.
839 if (G->getLinkage() != GlobalVariable::ExternalLinkage &&
840 G->getLinkage() != GlobalVariable::PrivateLinkage &&
841 G->getLinkage() != GlobalVariable::InternalLinkage)
842 return false;
843 // Two problems with thread-locals:
844 // - The address of the main thread's copy can't be computed at link-time.
845 // - Need to poison all copies, not just the main thread's one.
846 if (G->isThreadLocal())
847 return false;
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000848 // For now, just ignore this Global if the alignment is large.
849 if (G->getAlignment() > MinRedzoneSizeForGlobal()) return false;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000850
851 // Ignore all the globals with the names starting with "\01L_OBJC_".
852 // Many of those are put into the .cstring section. The linker compresses
853 // that section by removing the spare \0s after the string terminator, so
854 // our redzones get broken.
855 if ((G->getName().find("\01L_OBJC_") == 0) ||
856 (G->getName().find("\01l_OBJC_") == 0)) {
857 DEBUG(dbgs() << "Ignoring \\01L_OBJC_* global: " << *G);
858 return false;
859 }
860
861 if (G->hasSection()) {
862 StringRef Section(G->getSection());
863 // Ignore the globals from the __OBJC section. The ObjC runtime assumes
864 // those conform to /usr/lib/objc/runtime.h, so we can't add redzones to
865 // them.
866 if ((Section.find("__OBJC,") == 0) ||
867 (Section.find("__DATA, __objc_") == 0)) {
868 DEBUG(dbgs() << "Ignoring ObjC runtime global: " << *G);
869 return false;
870 }
871 // See http://code.google.com/p/address-sanitizer/issues/detail?id=32
872 // Constant CFString instances are compiled in the following way:
873 // -- the string buffer is emitted into
874 // __TEXT,__cstring,cstring_literals
875 // -- the constant NSConstantString structure referencing that buffer
876 // is placed into __DATA,__cfstring
877 // Therefore there's no point in placing redzones into __DATA,__cfstring.
878 // Moreover, it causes the linker to crash on OS X 10.7
879 if (Section.find("__DATA,__cfstring") == 0) {
880 DEBUG(dbgs() << "Ignoring CFString: " << *G);
881 return false;
882 }
883 }
884
885 return true;
886}
887
Alexey Samsonov788381b2012-12-25 12:28:20 +0000888void AddressSanitizerModule::initializeCallbacks(Module &M) {
889 IRBuilder<> IRB(*C);
890 // Declare our poisoning and unpoisoning functions.
891 AsanPoisonGlobals = checkInterfaceFunction(M.getOrInsertFunction(
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000892 kAsanPoisonGlobalsName, IRB.getVoidTy(), IntptrTy, NULL));
Alexey Samsonov788381b2012-12-25 12:28:20 +0000893 AsanPoisonGlobals->setLinkage(Function::ExternalLinkage);
894 AsanUnpoisonGlobals = checkInterfaceFunction(M.getOrInsertFunction(
895 kAsanUnpoisonGlobalsName, IRB.getVoidTy(), NULL));
896 AsanUnpoisonGlobals->setLinkage(Function::ExternalLinkage);
897 // Declare functions that register/unregister globals.
898 AsanRegisterGlobals = checkInterfaceFunction(M.getOrInsertFunction(
899 kAsanRegisterGlobalsName, IRB.getVoidTy(),
900 IntptrTy, IntptrTy, NULL));
901 AsanRegisterGlobals->setLinkage(Function::ExternalLinkage);
902 AsanUnregisterGlobals = checkInterfaceFunction(M.getOrInsertFunction(
903 kAsanUnregisterGlobalsName,
904 IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
905 AsanUnregisterGlobals->setLinkage(Function::ExternalLinkage);
906}
907
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000908// This function replaces all global variables with new variables that have
909// trailing redzones. It also creates a function that poisons
910// redzones and inserts this function into llvm.global_ctors.
Kostya Serebryanydfe9e792012-11-28 10:31:36 +0000911bool AddressSanitizerModule::runOnModule(Module &M) {
912 if (!ClGlobals) return false;
913 TD = getAnalysisIfAvailable<DataLayout>();
914 if (!TD)
915 return false;
Alexey Samsonove4b5fb82013-08-12 11:46:09 +0000916 BL.reset(SpecialCaseList::createOrDie(BlacklistFile));
Alexey Samsonov9a956e82012-11-29 18:27:01 +0000917 if (BL->isIn(M)) return false;
Kostya Serebryany20a79972012-11-22 03:18:50 +0000918 C = &(M.getContext());
Alexey Samsonov1345d352013-01-16 13:23:28 +0000919 int LongSize = TD->getPointerSizeInBits();
920 IntptrTy = Type::getIntNTy(*C, LongSize);
Evgeniy Stepanov13665362014-01-16 10:19:12 +0000921 Mapping = getShadowMapping(M, LongSize);
Alexey Samsonov788381b2012-12-25 12:28:20 +0000922 initializeCallbacks(M);
923 DynamicallyInitializedGlobals.Init(M);
Kostya Serebryany20a79972012-11-22 03:18:50 +0000924
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000925 SmallVector<GlobalVariable *, 16> GlobalsToChange;
926
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000927 for (Module::GlobalListType::iterator G = M.global_begin(),
928 E = M.global_end(); G != E; ++G) {
929 if (ShouldInstrumentGlobal(G))
930 GlobalsToChange.push_back(G);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000931 }
932
933 size_t n = GlobalsToChange.size();
934 if (n == 0) return false;
935
936 // A global is described by a structure
937 // size_t beg;
938 // size_t size;
939 // size_t size_with_redzone;
940 // const char *name;
Kostya Serebryanybd016bb2013-03-18 08:05:29 +0000941 // const char *module_name;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000942 // size_t has_dynamic_init;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000943 // We initialize an array of such structures and pass it to a run-time call.
944 StructType *GlobalStructTy = StructType::get(IntptrTy, IntptrTy,
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000945 IntptrTy, IntptrTy,
Kostya Serebryanybd016bb2013-03-18 08:05:29 +0000946 IntptrTy, IntptrTy, NULL);
Rafael Espindola44fee4e2013-10-01 13:32:03 +0000947 SmallVector<Constant *, 16> Initializers(n);
Kostya Serebryany20a79972012-11-22 03:18:50 +0000948
949 Function *CtorFunc = M.getFunction(kAsanModuleCtorName);
950 assert(CtorFunc);
951 IRBuilder<> IRB(CtorFunc->getEntryBlock().getTerminator());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000952
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000953 bool HasDynamicallyInitializedGlobals = false;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000954
Alexey Samsonove1e26bf2013-03-26 13:05:41 +0000955 // We shouldn't merge same module names, as this string serves as unique
956 // module ID in runtime.
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000957 GlobalVariable *ModuleName = createPrivateGlobalForString(
958 M, M.getModuleIdentifier(), /*AllowMerging*/false);
Kostya Serebryanybd016bb2013-03-18 08:05:29 +0000959
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000960 for (size_t i = 0; i < n; i++) {
Kostya Serebryanye35d59a2013-01-24 10:43:50 +0000961 static const uint64_t kMaxGlobalRedzone = 1 << 18;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000962 GlobalVariable *G = GlobalsToChange[i];
963 PointerType *PtrTy = cast<PointerType>(G->getType());
964 Type *Ty = PtrTy->getElementType();
Kostya Serebryany84a7f2e82012-03-21 15:28:50 +0000965 uint64_t SizeInBytes = TD->getTypeAllocSize(Ty);
Kostya Serebryany4fb78012013-12-06 09:00:17 +0000966 uint64_t MinRZ = MinRedzoneSizeForGlobal();
Kostya Serebryany87191f62013-01-24 10:35:40 +0000967 // MinRZ <= RZ <= kMaxGlobalRedzone
968 // and trying to make RZ to be ~ 1/4 of SizeInBytes.
Kostya Serebryanye35d59a2013-01-24 10:43:50 +0000969 uint64_t RZ = std::max(MinRZ,
Kostya Serebryany87191f62013-01-24 10:35:40 +0000970 std::min(kMaxGlobalRedzone,
971 (SizeInBytes / MinRZ / 4) * MinRZ));
972 uint64_t RightRedzoneSize = RZ;
973 // Round up to MinRZ
974 if (SizeInBytes % MinRZ)
975 RightRedzoneSize += MinRZ - (SizeInBytes % MinRZ);
976 assert(((RightRedzoneSize + SizeInBytes) % MinRZ) == 0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000977 Type *RightRedZoneTy = ArrayType::get(IRB.getInt8Ty(), RightRedzoneSize);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +0000978 // Determine whether this global should be poisoned in initialization.
Kostya Serebryanyb3bd6052012-11-20 13:00:01 +0000979 bool GlobalHasDynamicInitializer =
980 DynamicallyInitializedGlobals.Contains(G);
Kostya Serebryany2fa38f82012-09-05 07:29:56 +0000981 // Don't check initialization order if this global is blacklisted.
Peter Collingbourne49062a92013-07-09 22:03:17 +0000982 GlobalHasDynamicInitializer &= !BL->isIn(*G, "init");
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000983
984 StructType *NewTy = StructType::get(Ty, RightRedZoneTy, NULL);
985 Constant *NewInitializer = ConstantStruct::get(
986 NewTy, G->getInitializer(),
987 Constant::getNullValue(RightRedZoneTy), NULL);
988
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +0000989 GlobalVariable *Name =
990 createPrivateGlobalForString(M, G->getName(), /*AllowMerging*/true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000991
992 // Create a new global variable with enough space for a redzone.
Bill Wendling58f8cef2013-08-06 22:52:42 +0000993 GlobalValue::LinkageTypes Linkage = G->getLinkage();
994 if (G->isConstant() && Linkage == GlobalValue::PrivateLinkage)
995 Linkage = GlobalValue::InternalLinkage;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000996 GlobalVariable *NewGlobal = new GlobalVariable(
Bill Wendling58f8cef2013-08-06 22:52:42 +0000997 M, NewTy, G->isConstant(), Linkage,
Hans Wennborgcbe34b42012-06-23 11:37:03 +0000998 NewInitializer, "", G, G->getThreadLocalMode());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +0000999 NewGlobal->copyAttributesFrom(G);
Kostya Serebryany87191f62013-01-24 10:35:40 +00001000 NewGlobal->setAlignment(MinRZ);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001001
1002 Value *Indices2[2];
1003 Indices2[0] = IRB.getInt32(0);
1004 Indices2[1] = IRB.getInt32(0);
1005
1006 G->replaceAllUsesWith(
Kostya Serebryany7471d132012-01-28 04:27:16 +00001007 ConstantExpr::getGetElementPtr(NewGlobal, Indices2, true));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001008 NewGlobal->takeName(G);
1009 G->eraseFromParent();
1010
1011 Initializers[i] = ConstantStruct::get(
1012 GlobalStructTy,
1013 ConstantExpr::getPointerCast(NewGlobal, IntptrTy),
1014 ConstantInt::get(IntptrTy, SizeInBytes),
1015 ConstantInt::get(IntptrTy, SizeInBytes + RightRedzoneSize),
1016 ConstantExpr::getPointerCast(Name, IntptrTy),
Kostya Serebryanybd016bb2013-03-18 08:05:29 +00001017 ConstantExpr::getPointerCast(ModuleName, IntptrTy),
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001018 ConstantInt::get(IntptrTy, GlobalHasDynamicInitializer),
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001019 NULL);
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001020
1021 // Populate the first and last globals declared in this TU.
Alexey Samsonove1e26bf2013-03-26 13:05:41 +00001022 if (CheckInitOrder && GlobalHasDynamicInitializer)
1023 HasDynamicallyInitializedGlobals = true;
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001024
Kostya Serebryany20343352012-10-17 13:40:06 +00001025 DEBUG(dbgs() << "NEW GLOBAL: " << *NewGlobal << "\n");
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001026 }
1027
1028 ArrayType *ArrayOfGlobalStructTy = ArrayType::get(GlobalStructTy, n);
1029 GlobalVariable *AllGlobals = new GlobalVariable(
Bill Wendling58f8cef2013-08-06 22:52:42 +00001030 M, ArrayOfGlobalStructTy, false, GlobalVariable::InternalLinkage,
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001031 ConstantArray::get(ArrayOfGlobalStructTy, Initializers), "");
1032
Kostya Serebryanyf4be0192012-08-21 08:24:25 +00001033 // Create calls for poisoning before initializers run and unpoisoning after.
Alexey Samsonove1e26bf2013-03-26 13:05:41 +00001034 if (CheckInitOrder && HasDynamicallyInitializedGlobals)
1035 createInitializerPoisonCalls(M, ModuleName);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001036 IRB.CreateCall2(AsanRegisterGlobals,
1037 IRB.CreatePointerCast(AllGlobals, IntptrTy),
1038 ConstantInt::get(IntptrTy, n));
1039
Kostya Serebryanycd1aba82011-12-15 21:59:03 +00001040 // We also need to unregister globals at the end, e.g. when a shared library
1041 // gets closed.
1042 Function *AsanDtorFunction = Function::Create(
1043 FunctionType::get(Type::getVoidTy(*C), false),
1044 GlobalValue::InternalLinkage, kAsanModuleDtorName, &M);
1045 BasicBlock *AsanDtorBB = BasicBlock::Create(*C, "", AsanDtorFunction);
1046 IRBuilder<> IRB_Dtor(ReturnInst::Create(*C, AsanDtorBB));
Kostya Serebryanycd1aba82011-12-15 21:59:03 +00001047 IRB_Dtor.CreateCall2(AsanUnregisterGlobals,
1048 IRB.CreatePointerCast(AllGlobals, IntptrTy),
1049 ConstantInt::get(IntptrTy, n));
1050 appendToGlobalDtors(M, AsanDtorFunction, kAsanCtorAndCtorPriority);
1051
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001052 DEBUG(dbgs() << M);
1053 return true;
1054}
1055
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001056void AddressSanitizer::initializeCallbacks(Module &M) {
1057 IRBuilder<> IRB(*C);
Kostya Serebryany4273bb02012-07-16 14:09:42 +00001058 // Create __asan_report* callbacks.
1059 for (size_t AccessIsWrite = 0; AccessIsWrite <= 1; AccessIsWrite++) {
1060 for (size_t AccessSizeIndex = 0; AccessSizeIndex < kNumberOfAccessSizes;
1061 AccessSizeIndex++) {
1062 // IsWrite and TypeSize are encoded in the function name.
1063 std::string FunctionName = std::string(kAsanReportErrorTemplate) +
1064 (AccessIsWrite ? "store" : "load") + itostr(1 << AccessSizeIndex);
Kostya Serebryany986b8da2012-07-17 11:04:12 +00001065 // If we are merging crash callbacks, they have two parameters.
Kostya Serebryany157a5152012-11-07 12:42:18 +00001066 AsanErrorCallback[AccessIsWrite][AccessSizeIndex] =
1067 checkInterfaceFunction(M.getOrInsertFunction(
1068 FunctionName, IRB.getVoidTy(), IntptrTy, NULL));
Kostya Serebryany4273bb02012-07-16 14:09:42 +00001069 }
1070 }
Kostya Serebryany3ece9bea2013-02-19 11:29:21 +00001071 AsanErrorCallbackSized[0] = checkInterfaceFunction(M.getOrInsertFunction(
1072 kAsanReportLoadN, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
1073 AsanErrorCallbackSized[1] = checkInterfaceFunction(M.getOrInsertFunction(
1074 kAsanReportStoreN, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001075
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001076 AsanHandleNoReturnFunc = checkInterfaceFunction(M.getOrInsertFunction(
1077 kAsanHandleNoReturnName, IRB.getVoidTy(), NULL));
Bob Wilsonda4147c2013-11-15 07:16:09 +00001078 AsanCovFunction = checkInterfaceFunction(M.getOrInsertFunction(
1079 kAsanCovName, IRB.getVoidTy(), IntptrTy, NULL));
Kostya Serebryanyf02c6062012-07-20 09:54:50 +00001080 // We insert an empty inline asm after __asan_report* to avoid callback merge.
1081 EmptyAsm = InlineAsm::get(FunctionType::get(IRB.getVoidTy(), false),
1082 StringRef(""), StringRef(""),
1083 /*hasSideEffects=*/true);
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001084}
1085
Alexey Samsonov1345d352013-01-16 13:23:28 +00001086void AddressSanitizer::emitShadowMapping(Module &M, IRBuilder<> &IRB) const {
Alexey Samsonov347bcd32013-01-17 11:12:32 +00001087 // Tell the values of mapping offset and scale to the run-time.
1088 GlobalValue *asan_mapping_offset =
1089 new GlobalVariable(M, IntptrTy, true, GlobalValue::LinkOnceODRLinkage,
1090 ConstantInt::get(IntptrTy, Mapping.Offset),
1091 kAsanMappingOffsetName);
1092 // Read the global, otherwise it may be optimized away.
1093 IRB.CreateLoad(asan_mapping_offset, true);
Alexey Samsonov1345d352013-01-16 13:23:28 +00001094
Alexey Samsonov347bcd32013-01-17 11:12:32 +00001095 GlobalValue *asan_mapping_scale =
1096 new GlobalVariable(M, IntptrTy, true, GlobalValue::LinkOnceODRLinkage,
1097 ConstantInt::get(IntptrTy, Mapping.Scale),
1098 kAsanMappingScaleName);
1099 // Read the global, otherwise it may be optimized away.
1100 IRB.CreateLoad(asan_mapping_scale, true);
Alexey Samsonov1345d352013-01-16 13:23:28 +00001101}
1102
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001103// virtual
1104bool AddressSanitizer::doInitialization(Module &M) {
1105 // Initialize the private fields. No one has accessed them before.
1106 TD = getAnalysisIfAvailable<DataLayout>();
1107
1108 if (!TD)
1109 return false;
Alexey Samsonove4b5fb82013-08-12 11:46:09 +00001110 BL.reset(SpecialCaseList::createOrDie(BlacklistFile));
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001111 DynamicallyInitializedGlobals.Init(M);
1112
1113 C = &(M.getContext());
1114 LongSize = TD->getPointerSizeInBits();
1115 IntptrTy = Type::getIntNTy(*C, LongSize);
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001116
1117 AsanCtorFunction = Function::Create(
1118 FunctionType::get(Type::getVoidTy(*C), false),
1119 GlobalValue::InternalLinkage, kAsanModuleCtorName, &M);
1120 BasicBlock *AsanCtorBB = BasicBlock::Create(*C, "", AsanCtorFunction);
1121 // call __asan_init in the module ctor.
1122 IRBuilder<> IRB(ReturnInst::Create(*C, AsanCtorBB));
1123 AsanInitFunction = checkInterfaceFunction(
1124 M.getOrInsertFunction(kAsanInitName, IRB.getVoidTy(), NULL));
1125 AsanInitFunction->setLinkage(Function::ExternalLinkage);
1126 IRB.CreateCall(AsanInitFunction);
Kostya Serebryany4273bb02012-07-16 14:09:42 +00001127
Evgeniy Stepanov13665362014-01-16 10:19:12 +00001128 Mapping = getShadowMapping(M, LongSize);
Alexey Samsonov1345d352013-01-16 13:23:28 +00001129 emitShadowMapping(M, IRB);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001130
Kostya Serebryanycd1aba82011-12-15 21:59:03 +00001131 appendToGlobalCtors(M, AsanCtorFunction, kAsanCtorAndCtorPriority);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001132 return true;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001133}
1134
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +00001135bool AddressSanitizer::maybeInsertAsanInitAtFunctionEntry(Function &F) {
1136 // For each NSObject descendant having a +load method, this method is invoked
1137 // by the ObjC runtime before any of the static constructors is called.
1138 // Therefore we need to instrument such methods with a call to __asan_init
1139 // at the beginning in order to initialize our runtime before any access to
1140 // the shadow memory.
1141 // We cannot just ignore these methods, because they may call other
1142 // instrumented functions.
1143 if (F.getName().find(" load]") != std::string::npos) {
1144 IRBuilder<> IRB(F.begin()->begin());
1145 IRB.CreateCall(AsanInitFunction);
1146 return true;
1147 }
1148 return false;
1149}
1150
Bob Wilsonda4147c2013-11-15 07:16:09 +00001151// Poor man's coverage that works with ASan.
1152// We create a Guard boolean variable with the same linkage
1153// as the function and inject this code into the entry block:
1154// if (*Guard) {
1155// __sanitizer_cov(&F);
1156// *Guard = 1;
1157// }
1158// The accesses to Guard are atomic. The rest of the logic is
1159// in __sanitizer_cov (it's fine to call it more than once).
1160//
1161// This coverage implementation provides very limited data:
1162// it only tells if a given function was ever executed.
1163// No counters, no per-basic-block or per-edge data.
1164// But for many use cases this is what we need and the added slowdown
1165// is negligible. This simple implementation will probably be obsoleted
1166// by the upcoming Clang-based coverage implementation.
1167// By having it here and now we hope to
1168// a) get the functionality to users earlier and
1169// b) collect usage statistics to help improve Clang coverage design.
1170bool AddressSanitizer::InjectCoverage(Function &F) {
1171 if (!ClCoverage) return false;
Reid Kleckner30b2a9a2013-12-10 21:49:28 +00001172
1173 // Skip static allocas at the top of the entry block so they don't become
1174 // dynamic when we split the block. If we used our optimized stack layout,
1175 // then there will only be one alloca and it will come first.
1176 BasicBlock &Entry = F.getEntryBlock();
1177 BasicBlock::iterator IP = Entry.getFirstInsertionPt(), BE = Entry.end();
1178 for (; IP != BE; ++IP) {
1179 AllocaInst *AI = dyn_cast<AllocaInst>(IP);
1180 if (!AI || !AI->isStaticAlloca())
1181 break;
1182 }
1183
1184 IRBuilder<> IRB(IP);
Bob Wilsonda4147c2013-11-15 07:16:09 +00001185 Type *Int8Ty = IRB.getInt8Ty();
1186 GlobalVariable *Guard = new GlobalVariable(
Kostya Serebryany0604c622013-11-15 09:52:05 +00001187 *F.getParent(), Int8Ty, false, GlobalValue::PrivateLinkage,
Bob Wilsonda4147c2013-11-15 07:16:09 +00001188 Constant::getNullValue(Int8Ty), "__asan_gen_cov_" + F.getName());
1189 LoadInst *Load = IRB.CreateLoad(Guard);
1190 Load->setAtomic(Monotonic);
1191 Load->setAlignment(1);
1192 Value *Cmp = IRB.CreateICmpEQ(Constant::getNullValue(Int8Ty), Load);
Evgeniy Stepanova9164e92013-12-19 13:29:56 +00001193 Instruction *Ins = SplitBlockAndInsertIfThen(Cmp, IP, false);
Bob Wilsonda4147c2013-11-15 07:16:09 +00001194 IRB.SetInsertPoint(Ins);
1195 // We pass &F to __sanitizer_cov. We could avoid this and rely on
1196 // GET_CALLER_PC, but having the PC of the first instruction is just nice.
1197 IRB.CreateCall(AsanCovFunction, IRB.CreatePointerCast(&F, IntptrTy));
1198 StoreInst *Store = IRB.CreateStore(ConstantInt::get(Int8Ty, 1), Guard);
1199 Store->setAtomic(Monotonic);
1200 Store->setAlignment(1);
1201 return true;
1202}
1203
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001204bool AddressSanitizer::runOnFunction(Function &F) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001205 if (BL->isIn(F)) return false;
1206 if (&F == AsanCtorFunction) return false;
Kostya Serebryany6b5b58d2013-03-18 07:33:49 +00001207 if (F.getLinkage() == GlobalValue::AvailableExternallyLinkage) return false;
Kostya Serebryany20343352012-10-17 13:40:06 +00001208 DEBUG(dbgs() << "ASAN instrumenting:\n" << F << "\n");
Kostya Serebryany4b929da2012-11-29 09:54:21 +00001209 initializeCallbacks(*F.getParent());
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +00001210
Kostya Serebryanycf880b92013-02-26 06:58:09 +00001211 // If needed, insert __asan_init before checking for SanitizeAddress attr.
Kostya Serebryany22ddcfd2012-01-30 23:50:10 +00001212 maybeInsertAsanInitAtFunctionEntry(F);
1213
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001214 if (!F.hasFnAttribute(Attribute::SanitizeAddress))
Bill Wendlingc9b22d72012-10-09 07:45:08 +00001215 return false;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001216
1217 if (!ClDebugFunc.empty() && ClDebugFunc != F.getName())
1218 return false;
Bill Wendlingc9b22d72012-10-09 07:45:08 +00001219
1220 // We want to instrument every address only once per basic block (unless there
1221 // are calls between uses).
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001222 SmallSet<Value*, 16> TempsToInstrument;
1223 SmallVector<Instruction*, 16> ToInstrument;
Kostya Serebryany154a54d2012-02-08 21:36:17 +00001224 SmallVector<Instruction*, 8> NoReturnCalls;
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001225 int NumAllocas = 0;
Kostya Serebryany90241602012-05-30 09:04:06 +00001226 bool IsWrite;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001227
1228 // Fill the set of memory operations to instrument.
1229 for (Function::iterator FI = F.begin(), FE = F.end();
1230 FI != FE; ++FI) {
1231 TempsToInstrument.clear();
Kostya Serebryanyc387ca72012-06-28 09:34:41 +00001232 int NumInsnsPerBB = 0;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001233 for (BasicBlock::iterator BI = FI->begin(), BE = FI->end();
1234 BI != BE; ++BI) {
Kostya Serebryany687d0782012-01-11 18:15:23 +00001235 if (LooksLikeCodeInBug11395(BI)) return false;
Kostya Serebryany90241602012-05-30 09:04:06 +00001236 if (Value *Addr = isInterestingMemoryAccess(BI, &IsWrite)) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001237 if (ClOpt && ClOptSameTemp) {
1238 if (!TempsToInstrument.insert(Addr))
1239 continue; // We've seen this temp in the current BB.
1240 }
1241 } else if (isa<MemIntrinsic>(BI) && ClMemIntrin) {
1242 // ok, take it.
1243 } else {
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001244 if (isa<AllocaInst>(BI))
1245 NumAllocas++;
Kostya Serebryany699ac282013-02-20 12:35:15 +00001246 CallSite CS(BI);
1247 if (CS) {
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001248 // A call inside BB.
1249 TempsToInstrument.clear();
Kostya Serebryany699ac282013-02-20 12:35:15 +00001250 if (CS.doesNotReturn())
1251 NoReturnCalls.push_back(CS.getInstruction());
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001252 }
1253 continue;
1254 }
1255 ToInstrument.push_back(BI);
Kostya Serebryanyc387ca72012-06-28 09:34:41 +00001256 NumInsnsPerBB++;
1257 if (NumInsnsPerBB >= ClMaxInsnsToInstrumentPerBB)
1258 break;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001259 }
1260 }
1261
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001262 Function *UninstrumentedDuplicate = 0;
1263 bool LikelyToInstrument =
1264 !NoReturnCalls.empty() || !ToInstrument.empty() || (NumAllocas > 0);
1265 if (ClKeepUninstrumented && LikelyToInstrument) {
1266 ValueToValueMapTy VMap;
1267 UninstrumentedDuplicate = CloneFunction(&F, VMap, false);
1268 UninstrumentedDuplicate->removeFnAttr(Attribute::SanitizeAddress);
1269 UninstrumentedDuplicate->setName("NOASAN_" + F.getName());
1270 F.getParent()->getFunctionList().push_back(UninstrumentedDuplicate);
1271 }
1272
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001273 // Instrument.
1274 int NumInstrumented = 0;
1275 for (size_t i = 0, n = ToInstrument.size(); i != n; i++) {
1276 Instruction *Inst = ToInstrument[i];
1277 if (ClDebugMin < 0 || ClDebugMax < 0 ||
1278 (NumInstrumented >= ClDebugMin && NumInstrumented <= ClDebugMax)) {
Kostya Serebryany90241602012-05-30 09:04:06 +00001279 if (isInterestingMemoryAccess(Inst, &IsWrite))
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001280 instrumentMop(Inst);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001281 else
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001282 instrumentMemIntrinsic(cast<MemIntrinsic>(Inst));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001283 }
1284 NumInstrumented++;
1285 }
1286
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001287 FunctionStackPoisoner FSP(F, *this);
1288 bool ChangedStack = FSP.runOnFunction();
Kostya Serebryany154a54d2012-02-08 21:36:17 +00001289
1290 // We must unpoison the stack before every NoReturn call (throw, _exit, etc).
1291 // See e.g. http://code.google.com/p/address-sanitizer/issues/detail?id=37
1292 for (size_t i = 0, n = NoReturnCalls.size(); i != n; i++) {
1293 Instruction *CI = NoReturnCalls[i];
1294 IRBuilder<> IRB(CI);
Kostya Serebryanyb0e25062012-10-15 14:20:06 +00001295 IRB.CreateCall(AsanHandleNoReturnFunc);
Kostya Serebryany154a54d2012-02-08 21:36:17 +00001296 }
1297
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001298 bool res = NumInstrumented > 0 || ChangedStack || !NoReturnCalls.empty();
Bob Wilsonda4147c2013-11-15 07:16:09 +00001299
1300 if (InjectCoverage(F))
1301 res = true;
1302
Kostya Serebryany9f5213f2013-06-26 09:18:17 +00001303 DEBUG(dbgs() << "ASAN done instrumenting: " << res << " " << F << "\n");
1304
1305 if (ClKeepUninstrumented) {
1306 if (!res) {
1307 // No instrumentation is done, no need for the duplicate.
1308 if (UninstrumentedDuplicate)
1309 UninstrumentedDuplicate->eraseFromParent();
1310 } else {
1311 // The function was instrumented. We must have the duplicate.
1312 assert(UninstrumentedDuplicate);
1313 UninstrumentedDuplicate->setSection("NOASAN");
1314 assert(!F.hasSection());
1315 F.setSection("ASAN");
1316 }
1317 }
1318
1319 return res;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001320}
1321
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001322// Workaround for bug 11395: we don't want to instrument stack in functions
1323// with large assembly blobs (32-bit only), otherwise reg alloc may crash.
1324// FIXME: remove once the bug 11395 is fixed.
1325bool AddressSanitizer::LooksLikeCodeInBug11395(Instruction *I) {
1326 if (LongSize != 32) return false;
1327 CallInst *CI = dyn_cast<CallInst>(I);
1328 if (!CI || !CI->isInlineAsm()) return false;
1329 if (CI->getNumArgOperands() <= 5) return false;
1330 // We have inline assembly with quite a few arguments.
1331 return true;
1332}
1333
1334void FunctionStackPoisoner::initializeCallbacks(Module &M) {
1335 IRBuilder<> IRB(*C);
Kostya Serebryany6805de52013-09-10 13:16:56 +00001336 for (int i = 0; i <= kMaxAsanStackMallocSizeClass; i++) {
1337 std::string Suffix = itostr(i);
1338 AsanStackMallocFunc[i] = checkInterfaceFunction(
1339 M.getOrInsertFunction(kAsanStackMallocNameTemplate + Suffix, IntptrTy,
1340 IntptrTy, IntptrTy, NULL));
1341 AsanStackFreeFunc[i] = checkInterfaceFunction(M.getOrInsertFunction(
1342 kAsanStackFreeNameTemplate + Suffix, IRB.getVoidTy(), IntptrTy,
1343 IntptrTy, IntptrTy, NULL));
1344 }
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001345 AsanPoisonStackMemoryFunc = checkInterfaceFunction(M.getOrInsertFunction(
1346 kAsanPoisonStackMemoryName, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
1347 AsanUnpoisonStackMemoryFunc = checkInterfaceFunction(M.getOrInsertFunction(
1348 kAsanUnpoisonStackMemoryName, IRB.getVoidTy(), IntptrTy, IntptrTy, NULL));
1349}
1350
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001351void
1352FunctionStackPoisoner::poisonRedZones(const ArrayRef<uint8_t> ShadowBytes,
1353 IRBuilder<> &IRB, Value *ShadowBase,
1354 bool DoPoison) {
1355 size_t n = ShadowBytes.size();
Kostya Serebryanyff7bde12013-12-23 09:24:36 +00001356 size_t i = 0;
1357 // We need to (un)poison n bytes of stack shadow. Poison as many as we can
1358 // using 64-bit stores (if we are on 64-bit arch), then poison the rest
1359 // with 32-bit stores, then with 16-byte stores, then with 8-byte stores.
1360 for (size_t LargeStoreSizeInBytes = ASan.LongSize / 8;
1361 LargeStoreSizeInBytes != 0; LargeStoreSizeInBytes /= 2) {
1362 for (; i + LargeStoreSizeInBytes - 1 < n; i += LargeStoreSizeInBytes) {
1363 uint64_t Val = 0;
1364 for (size_t j = 0; j < LargeStoreSizeInBytes; j++) {
1365 if (ASan.TD->isLittleEndian())
1366 Val |= (uint64_t)ShadowBytes[i + j] << (8 * j);
1367 else
1368 Val = (Val << 8) | ShadowBytes[i + j];
1369 }
1370 if (!Val) continue;
1371 Value *Ptr = IRB.CreateAdd(ShadowBase, ConstantInt::get(IntptrTy, i));
1372 Type *StoreTy = Type::getIntNTy(*C, LargeStoreSizeInBytes * 8);
1373 Value *Poison = ConstantInt::get(StoreTy, DoPoison ? Val : 0);
1374 IRB.CreateStore(Poison, IRB.CreateIntToPtr(Ptr, StoreTy->getPointerTo()));
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001375 }
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001376 }
1377}
1378
Kostya Serebryany6805de52013-09-10 13:16:56 +00001379// Fake stack allocator (asan_fake_stack.h) has 11 size classes
1380// for every power of 2 from kMinStackMallocSize to kMaxAsanStackMallocSizeClass
1381static int StackMallocSizeClass(uint64_t LocalStackSize) {
1382 assert(LocalStackSize <= kMaxStackMallocSize);
1383 uint64_t MaxSize = kMinStackMallocSize;
1384 for (int i = 0; ; i++, MaxSize *= 2)
1385 if (LocalStackSize <= MaxSize)
1386 return i;
1387 llvm_unreachable("impossible LocalStackSize");
1388}
1389
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001390// Set Size bytes starting from ShadowBase to kAsanStackAfterReturnMagic.
1391// We can not use MemSet intrinsic because it may end up calling the actual
1392// memset. Size is a multiple of 8.
1393// Currently this generates 8-byte stores on x86_64; it may be better to
1394// generate wider stores.
1395void FunctionStackPoisoner::SetShadowToStackAfterReturnInlined(
1396 IRBuilder<> &IRB, Value *ShadowBase, int Size) {
1397 assert(!(Size % 8));
1398 assert(kAsanStackAfterReturnMagic == 0xf5);
1399 for (int i = 0; i < Size; i += 8) {
1400 Value *p = IRB.CreateAdd(ShadowBase, ConstantInt::get(IntptrTy, i));
1401 IRB.CreateStore(ConstantInt::get(IRB.getInt64Ty(), 0xf5f5f5f5f5f5f5f5ULL),
1402 IRB.CreateIntToPtr(p, IRB.getInt64Ty()->getPointerTo()));
1403 }
1404}
1405
// Rewrites the stack frame of the function:
//  * lays out all allocas from AllocaVec inside one byte-array alloca
//    ("MyAlloca") using ComputeASanStackFrameLayout, and replaces every
//    original alloca with base+offset into it;
//  * when ASan.CheckUseAfterReturn is set and the frame is not larger than
//    kMaxStackMallocSize, emits a run-time check of the kAsanOptionDetectUAR
//    global and, if it is non-zero, takes the frame base from
//    AsanStackMallocFunc[size class] instead of the real stack;
//  * stores the frame magic, the frame description string and the function
//    address into the first three pointer-sized slots of the frame;
//  * poisons the redzones on entry and, before every instruction in RetVec,
//    marks the frame as retired and (un)poisons the shadow;
//  * finally erases the original allocas.
// Requires AllocaVec to be non-empty.
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001406void FunctionStackPoisoner::poisonStack() {
Kostya Serebryany6805de52013-09-10 13:16:56 +00001407 int StackMallocIdx = -1;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001408
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001409 assert(AllocaVec.size() > 0);
// All set-up code is inserted in front of the first collected alloca.
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001410 Instruction *InsBefore = AllocaVec[0];
1411 IRBuilder<> IRB(InsBefore);
1412
// Describe every alloca (name, size, alignment) for the layout computation.
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001413 SmallVector<ASanStackVariableDescription, 16> SVD;
1414 SVD.reserve(AllocaVec.size());
1415 for (size_t i = 0, n = AllocaVec.size(); i < n; i++) {
1416 AllocaInst *AI = AllocaVec[i];
1417 ASanStackVariableDescription D = { AI->getName().data(),
1418 getAllocaSizeInBytes(AI),
1419 AI->getAlignment(), AI, 0};
1420 SVD.push_back(D);
1421 }
1422 // Minimal header size (left redzone) is 4 pointers,
1423 // i.e. 32 bytes on 64-bit platforms and 16 bytes in 32-bit platforms.
1424 size_t MinHeaderSize = ASan.LongSize / 2;
1425 ASanStackFrameLayout L;
1426 ComputeASanStackFrameLayout(SVD, 1UL << Mapping.Scale, MinHeaderSize, &L);
1427 DEBUG(dbgs() << L.DescriptionString << " --- " << L.FrameSize << "\n");
1428 uint64_t LocalStackSize = L.FrameSize;
// The fake stack is only considered for frames that fit a size class.
1429 bool DoStackMalloc =
1430 ASan.CheckUseAfterReturn && LocalStackSize <= kMaxStackMallocSize;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001431
// One byte array of the whole frame size replaces the individual allocas.
1432 Type *ByteArrayTy = ArrayType::get(IRB.getInt8Ty(), LocalStackSize);
1433 AllocaInst *MyAlloca =
1434 new AllocaInst(ByteArrayTy, "MyAlloca", InsBefore);
// ClRealignStack must be a power of two (or zero).
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001435 assert((ClRealignStack & (ClRealignStack - 1)) == 0);
1436 size_t FrameAlignment = std::max(L.FrameAlignment, (size_t)ClRealignStack);
1437 MyAlloca->setAlignment(FrameAlignment);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001438 assert(MyAlloca->isStaticAlloca());
1439 Value *OrigStackBase = IRB.CreatePointerCast(MyAlloca, IntptrTy);
1440 Value *LocalStackBase = OrigStackBase;
1441
1442 if (DoStackMalloc) {
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001443 // LocalStackBase = OrigStackBase
1444 // if (__asan_option_detect_stack_use_after_return)
1445 // LocalStackBase = __asan_stack_malloc_N(LocalStackSize, OrigStackBase);
Kostya Serebryany6805de52013-09-10 13:16:56 +00001446 StackMallocIdx = StackMallocSizeClass(LocalStackSize);
1447 assert(StackMallocIdx <= kMaxAsanStackMallocSizeClass);
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001448 Constant *OptionDetectUAR = F.getParent()->getOrInsertGlobal(
1449 kAsanOptionDetectUAR, IRB.getInt32Ty());
1450 Value *Cmp = IRB.CreateICmpNE(IRB.CreateLoad(OptionDetectUAR),
1451 Constant::getNullValue(IRB.getInt32Ty()));
Evgeniy Stepanova9164e92013-12-19 13:29:56 +00001452 Instruction *Term = SplitBlockAndInsertIfThen(Cmp, InsBefore, false);
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001453 BasicBlock *CmpBlock = cast<Instruction>(Cmp)->getParent();
1454 IRBuilder<> IRBIf(Term);
1455 LocalStackBase = IRBIf.CreateCall2(
1456 AsanStackMallocFunc[StackMallocIdx],
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001457 ConstantInt::get(IntptrTy, LocalStackSize), OrigStackBase);
Kostya Serebryanyf3223822013-09-18 14:07:14 +00001458 BasicBlock *SetBlock = cast<Instruction>(LocalStackBase)->getParent();
// Merge the two possible frame bases (real stack vs. run-time allocated)
// with a PHI in the block that now starts at InsBefore.
1459 IRB.SetInsertPoint(InsBefore);
1460 PHINode *Phi = IRB.CreatePHI(IntptrTy, 2);
1461 Phi->addIncoming(OrigStackBase, CmpBlock);
1462 Phi->addIncoming(LocalStackBase, SetBlock);
1463 LocalStackBase = Phi;
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001464 }
1465
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001466 // Insert poison calls for lifetime intrinsics for alloca.
1467 bool HavePoisonedAllocas = false;
1468 for (size_t i = 0, n = AllocaPoisonCallVec.size(); i < n; i++) {
1469 const AllocaPoisonCall &APC = AllocaPoisonCallVec[i];
Alexey Samsonova788b942013-11-18 14:53:55 +00001470 assert(APC.InsBefore);
1471 assert(APC.AI);
1472 IRBuilder<> IRB(APC.InsBefore);
1473 poisonAlloca(APC.AI, APC.Size, IRB, APC.DoPoison);
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001474 HavePoisonedAllocas |= APC.DoPoison;
1475 }
1476
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001477 // Replace Alloca instructions with base+offset.
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001478 for (size_t i = 0, n = SVD.size(); i < n; i++) {
1479 AllocaInst *AI = SVD[i].AI;
Alexey Samsonov261177a2012-12-04 01:34:23 +00001480 Value *NewAllocaPtr = IRB.CreateIntToPtr(
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001481 IRB.CreateAdd(LocalStackBase,
1482 ConstantInt::get(IntptrTy, SVD[i].Offset)),
1483 AI->getType());
Alexey Samsonov3d43b632012-12-12 14:31:53 +00001484 replaceDbgDeclareForAlloca(AI, NewAllocaPtr, DIB);
Alexey Samsonov261177a2012-12-04 01:34:23 +00001485 AI->replaceAllUsesWith(NewAllocaPtr);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001486 }
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001487
Kostya Serebryanycdd35a92013-03-22 10:37:20 +00001488 // The left-most redzone has enough space for at least 4 pointers.
1489 // Write the Magic value to redzone[0].
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001490 Value *BasePlus0 = IRB.CreateIntToPtr(LocalStackBase, IntptrPtrTy);
1491 IRB.CreateStore(ConstantInt::get(IntptrTy, kCurrentStackFrameMagic),
1492 BasePlus0);
Kostya Serebryanycdd35a92013-03-22 10:37:20 +00001493 // Write the frame description constant to redzone[1].
1494 Value *BasePlus1 = IRB.CreateIntToPtr(
1495 IRB.CreateAdd(LocalStackBase, ConstantInt::get(IntptrTy, ASan.LongSize/8)),
1496 IntptrPtrTy);
Alexey Samsonov9bdb63a2012-11-02 12:20:34 +00001497 GlobalVariable *StackDescriptionGlobal =
Alexander Potapenkodaf96ae2013-12-25 14:22:15 +00001498 createPrivateGlobalForString(*F.getParent(), L.DescriptionString,
1499 /*AllowMerging*/true);
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001500 Value *Description = IRB.CreatePointerCast(StackDescriptionGlobal,
1501 IntptrTy);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001502 IRB.CreateStore(Description, BasePlus1);
Kostya Serebryanycdd35a92013-03-22 10:37:20 +00001503 // Write the PC to redzone[2].
1504 Value *BasePlus2 = IRB.CreateIntToPtr(
1505 IRB.CreateAdd(LocalStackBase, ConstantInt::get(IntptrTy,
1506 2 * ASan.LongSize/8)),
1507 IntptrPtrTy);
1508 IRB.CreateStore(IRB.CreatePointerCast(&F, IntptrTy), BasePlus2);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001509
1510 // Poison the stack redzones at the entry.
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001511 Value *ShadowBase = ASan.memToShadow(LocalStackBase, IRB);
Kostya Serebryany4fb78012013-12-06 09:00:17 +00001512 poisonRedZones(L.ShadowBytes, IRB, ShadowBase, true);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001513
Kostya Serebryany530e2072013-12-23 14:15:08 +00001514 // (Un)poison the stack before all ret instructions.
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001515 for (size_t i = 0, n = RetVec.size(); i < n; i++) {
1516 Instruction *Ret = RetVec[i];
1517 IRBuilder<> IRBRet(Ret);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001518 // Mark the current frame as retired.
1519 IRBRet.CreateStore(ConstantInt::get(IntptrTy, kRetiredStackFrameMagic),
1520 BasePlus0);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001521 if (DoStackMalloc) {
Kostya Serebryany6805de52013-09-10 13:16:56 +00001522 assert(StackMallocIdx >= 0);
Kostya Serebryany530e2072013-12-23 14:15:08 +00001523 // if LocalStackBase != OrigStackBase:
1524 // // In use-after-return mode, poison the whole stack frame.
1525 // if StackMallocIdx <= 4
1526 // // For small sizes inline the whole thing:
1527 // memset(ShadowBase, kAsanStackAfterReturnMagic, ShadowSize);
1528 // **SavedFlagPtr(LocalStackBase) = 0
1529 // else
1530 // __asan_stack_free_N(LocalStackBase, LocalStackSize, OrigStackBase)
1531 // else
1532 // <This is not a fake stack; unpoison the redzones>
1533 Value *Cmp = IRBRet.CreateICmpNE(LocalStackBase, OrigStackBase);
1534 TerminatorInst *ThenTerm, *ElseTerm;
1535 SplitBlockAndInsertIfThenElse(Cmp, Ret, &ThenTerm, &ElseTerm);
1536
1537 IRBuilder<> IRBPoison(ThenTerm);
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001538 if (StackMallocIdx <= 4) {
// The whole size class (not just LocalStackSize) is marked in the shadow.
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001539 int ClassSize = kMinStackMallocSize << StackMallocIdx;
1540 SetShadowToStackAfterReturnInlined(IRBPoison, ShadowBase,
1541 ClassSize >> Mapping.Scale);
// The last pointer-sized slot of the class-sized frame holds a pointer;
// load it and store a zero byte through it.
1542 Value *SavedFlagPtrPtr = IRBPoison.CreateAdd(
1543 LocalStackBase,
1544 ConstantInt::get(IntptrTy, ClassSize - ASan.LongSize / 8));
1545 Value *SavedFlagPtr = IRBPoison.CreateLoad(
1546 IRBPoison.CreateIntToPtr(SavedFlagPtrPtr, IntptrPtrTy));
1547 IRBPoison.CreateStore(
1548 Constant::getNullValue(IRBPoison.getInt8Ty()),
1549 IRBPoison.CreateIntToPtr(SavedFlagPtr, IRBPoison.getInt8PtrTy()));
1550 } else {
1551 // For larger frames call __asan_stack_free_*.
Kostya Serebryany530e2072013-12-23 14:15:08 +00001552 IRBPoison.CreateCall3(AsanStackFreeFunc[StackMallocIdx], LocalStackBase,
1553 ConstantInt::get(IntptrTy, LocalStackSize),
1554 OrigStackBase);
Kostya Serebryanybc86efb2013-09-17 12:14:50 +00001555 }
Kostya Serebryany530e2072013-12-23 14:15:08 +00001556
// NOTE(review): on this path only the redzones are unpoisoned, even when
// HavePoisonedAllocas is true -- confirm that allocas poisoned at
// llvm.lifetime.end need no whole-frame unpoisoning here.
1557 IRBuilder<> IRBElse(ElseTerm);
1558 poisonRedZones(L.ShadowBytes, IRBElse, ShadowBase, false);
Alexey Samsonov261177a2012-12-04 01:34:23 +00001559 } else if (HavePoisonedAllocas) {
1560 // If we poisoned some allocas in llvm.lifetime analysis,
1561 // unpoison whole stack frame now.
1562 assert(LocalStackBase == OrigStackBase);
1563 poisonAlloca(LocalStackBase, LocalStackSize, IRBRet, false);
Kostya Serebryany530e2072013-12-23 14:15:08 +00001564 } else {
1565 poisonRedZones(L.ShadowBytes, IRBRet, ShadowBase, false);
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001566 }
1567 }
1568
Kostya Serebryany09959942012-10-19 06:20:53 +00001569 // We are done. Remove the old unused alloca instructions.
1570 for (size_t i = 0, n = AllocaVec.size(); i < n; i++)
1571 AllocaVec[i]->eraseFromParent();
Kostya Serebryany6e6b03e2011-11-16 01:35:23 +00001572}
Alexey Samsonov261177a2012-12-04 01:34:23 +00001573
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001574void FunctionStackPoisoner::poisonAlloca(Value *V, uint64_t Size,
Jakub Staszak23ec6a92013-08-09 20:53:48 +00001575 IRBuilder<> &IRB, bool DoPoison) {
Alexey Samsonov261177a2012-12-04 01:34:23 +00001576 // For now just insert the call to ASan runtime.
1577 Value *AddrArg = IRB.CreatePointerCast(V, IntptrTy);
1578 Value *SizeArg = ConstantInt::get(IntptrTy, Size);
1579 IRB.CreateCall2(DoPoison ? AsanPoisonStackMemoryFunc
1580 : AsanUnpoisonStackMemoryFunc,
1581 AddrArg, SizeArg);
1582}
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001583
1584// Handling llvm.lifetime intrinsics for a given %alloca:
1585// (1) collect all llvm.lifetime.xxx(%size, %value) describing the alloca.
1586// (2) if %size is constant, poison memory for llvm.lifetime.end (to detect
1587// invalid accesses) and unpoison it for llvm.lifetime.start (the memory
1588// could be poisoned by previous llvm.lifetime.end instruction, as the
1589// variable may go in and out of scope several times, e.g. in loops).
1590// (3) if we poisoned at least one %alloca in a function,
1591// unpoison the whole stack frame at function exit.
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001592
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001593AllocaInst *FunctionStackPoisoner::findAllocaForValue(Value *V) {
1594 if (AllocaInst *AI = dyn_cast<AllocaInst>(V))
1595 // We're intested only in allocas we can handle.
1596 return isInterestingAlloca(*AI) ? AI : 0;
1597 // See if we've already calculated (or started to calculate) alloca for a
1598 // given value.
1599 AllocaForValueMapTy::iterator I = AllocaForValue.find(V);
1600 if (I != AllocaForValue.end())
1601 return I->second;
1602 // Store 0 while we're calculating alloca for value V to avoid
1603 // infinite recursion if the value references itself.
1604 AllocaForValue[V] = 0;
1605 AllocaInst *Res = 0;
1606 if (CastInst *CI = dyn_cast<CastInst>(V))
1607 Res = findAllocaForValue(CI->getOperand(0));
1608 else if (PHINode *PN = dyn_cast<PHINode>(V)) {
1609 for (unsigned i = 0, e = PN->getNumIncomingValues(); i != e; ++i) {
1610 Value *IncValue = PN->getIncomingValue(i);
1611 // Allow self-referencing phi-nodes.
1612 if (IncValue == PN) continue;
1613 AllocaInst *IncValueAI = findAllocaForValue(IncValue);
1614 // AI for incoming values should exist and should all be equal.
1615 if (IncValueAI == 0 || (Res != 0 && IncValueAI != Res))
1616 return 0;
1617 Res = IncValueAI;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001618 }
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001619 }
Alexey Samsonov29dd7f22012-12-27 08:50:58 +00001620 if (Res != 0)
1621 AllocaForValue[V] = Res;
Alexey Samsonov1e3f7ba2012-12-25 12:04:36 +00001622 return Res;
1623}