blob: 39d6e6026210129c6557858cd20f9e1b0214d361 [file] [log] [blame]
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +00001//===- FuzzerTracePC.cpp - PC tracing--------------------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9// Trace PCs.
Kostya Serebryanya00b2432016-09-14 02:13:06 +000010// This module implements __sanitizer_cov_trace_pc_guard[_init],
11// the callback required for -fsanitize-coverage=trace-pc-guard instrumentation.
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000012//
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000013//===----------------------------------------------------------------------===//
14
Kostya Serebryany1c73f1b2016-10-05 22:56:21 +000015#include "FuzzerCorpus.h"
Kostya Serebryany86586182016-09-21 21:17:23 +000016#include "FuzzerDefs.h"
Kostya Serebryanya5f94fb2016-10-14 20:20:33 +000017#include "FuzzerDictionary.h"
Kostya Serebryany95b1a432016-10-19 00:12:03 +000018#include "FuzzerExtFunctions.h"
Zachary Turner24a148b2016-11-30 19:06:14 +000019#include "FuzzerIO.h"
Kostya Serebryany6f5a8042016-09-21 01:50:50 +000020#include "FuzzerTracePC.h"
Kostya Serebryany86586182016-09-21 21:17:23 +000021#include "FuzzerValueBitMap.h"
Zachary Turner24a148b2016-11-30 19:06:14 +000022#include <map>
Mike Aizatsky9b415be2016-12-19 22:18:08 +000023#include <sanitizer/coverage_interface.h>
Zachary Turner24a148b2016-11-30 19:06:14 +000024#include <set>
25#include <sstream>
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000026
27namespace fuzzer {
Mike Aizatsky1aa501e2016-05-10 23:43:15 +000028
Kostya Serebryanya00b2432016-09-14 02:13:06 +000029TracePC TPC;
Mike Aizatsky1aa501e2016-05-10 23:43:15 +000030
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +000031void TracePC::HandleTrace(uint32_t *Guard, uintptr_t PC) {
32 uint32_t Idx = *Guard;
Kostya Serebryany8e781a82016-09-18 04:52:23 +000033 if (!Idx) return;
Kostya Serebryany2fabeca2016-10-26 18:52:04 +000034 PCs[Idx % kNumPCs] = PC;
35 Counters[Idx % kNumCounters]++;
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000036}
Kostya Serebryanya5277d52016-09-15 01:30:18 +000037
Kostya Serebryany275e2602016-10-25 23:52:25 +000038size_t TracePC::GetTotalPCCoverage() {
39 size_t Res = 0;
Kostya Serebryany06b87572016-10-26 00:42:52 +000040 for (size_t i = 1; i < GetNumPCs(); i++)
Kostya Serebryany275e2602016-10-25 23:52:25 +000041 if (PCs[i])
42 Res++;
43 return Res;
44}
45
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +000046void TracePC::HandleInit(uint32_t *Start, uint32_t *Stop) {
Kostya Serebryany3e36ec12016-09-17 05:04:47 +000047 if (Start == Stop || *Start) return;
48 assert(NumModules < sizeof(Modules) / sizeof(Modules[0]));
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +000049 for (uint32_t *P = Start; P < Stop; P++)
Kostya Serebryany8e781a82016-09-18 04:52:23 +000050 *P = ++NumGuards;
Kostya Serebryany3e36ec12016-09-17 05:04:47 +000051 Modules[NumModules].Start = Start;
52 Modules[NumModules].Stop = Stop;
53 NumModules++;
54}
55
56void TracePC::PrintModuleInfo() {
57 Printf("INFO: Loaded %zd modules (%zd guards): ", NumModules, NumGuards);
58 for (size_t i = 0; i < NumModules; i++)
59 Printf("[%p, %p), ", Modules[i].Start, Modules[i].Stop);
60 Printf("\n");
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000061}
Kostya Serebryanya5277d52016-09-15 01:30:18 +000062
Kostya Serebryany09845172016-09-15 22:16:15 +000063void TracePC::HandleCallerCallee(uintptr_t Caller, uintptr_t Callee) {
64 const uintptr_t kBits = 12;
65 const uintptr_t kMask = (1 << kBits) - 1;
Kostya Serebryany1c73f1b2016-10-05 22:56:21 +000066 uintptr_t Idx = (Caller & kMask) | ((Callee & kMask) << kBits);
67 HandleValueProfile(Idx);
Kostya Serebryany09845172016-09-15 22:16:15 +000068}
69
// Returns true if |File| (a source-file path as produced by the symbolizer)
// should be included in the coverage report.
// Paths containing "compiler-rt/lib/" (sanitizer internals), "/usr/lib/" or
// "/usr/include/" are excluded, as is the literal placeholder "<null>".
// The argument is only read, so it is taken by const reference; this also
// allows const strings and temporaries to be passed.
static bool IsInterestingCoverageFile(const std::string &File) {
  if (File.find("compiler-rt/lib/") != std::string::npos)
    return false; // sanitizer internal.
  if (File.find("/usr/lib/") != std::string::npos)
    return false;
  if (File.find("/usr/include/") != std::string::npos)
    return false;
  if (File == "<null>")
    return false;
  return true;
}
81
Kostya Serebryany11a22bc2016-12-30 01:13:07 +000082void TracePC::InitializePrintNewPCs() {
Kostya Serebryany4986e812017-01-03 18:51:28 +000083 if (!DoPrintNewPCs) return;
Kostya Serebryany11a22bc2016-12-30 01:13:07 +000084 assert(!PrintedPCs);
85 PrintedPCs = new std::set<uintptr_t>;
86 for (size_t i = 1; i < GetNumPCs(); i++)
87 if (PCs[i])
88 PrintedPCs->insert(PCs[i]);
89}
90
Kostya Serebryanya5b2e542016-10-26 00:20:51 +000091void TracePC::PrintNewPCs() {
Kostya Serebryany4986e812017-01-03 18:51:28 +000092 if (!DoPrintNewPCs) return;
Kostya Serebryany11a22bc2016-12-30 01:13:07 +000093 assert(PrintedPCs);
94 for (size_t i = 1; i < GetNumPCs(); i++)
95 if (PCs[i] && PrintedPCs->insert(PCs[i]).second)
96 PrintPC("\tNEW_PC: %p %F %L\n", "\tNEW_PC: %p\n", PCs[i]);
Kostya Serebryanya5b2e542016-10-26 00:20:51 +000097}
98
Kostya Serebryanyb706b482016-09-18 21:47:08 +000099void TracePC::PrintCoverage() {
Kostya Serebryany1394ce22016-12-10 01:19:35 +0000100 if (!EF->__sanitizer_symbolize_pc ||
101 !EF->__sanitizer_get_module_and_offset_for_pc) {
102 Printf("INFO: __sanitizer_symbolize_pc or "
103 "__sanitizer_get_module_and_offset_for_pc is not available,"
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000104 " not printing coverage\n");
105 return;
106 }
107 std::map<std::string, std::vector<uintptr_t>> CoveredPCsPerModule;
108 std::map<std::string, uintptr_t> ModuleOffsets;
Kostya Serebryany1cba0a92016-11-30 21:53:32 +0000109 std::set<std::string> CoveredDirs, CoveredFiles, CoveredFunctions,
110 CoveredLines;
Kostya Serebryanyb706b482016-09-18 21:47:08 +0000111 Printf("COVERAGE:\n");
Kostya Serebryany06b87572016-10-26 00:42:52 +0000112 for (size_t i = 1; i < GetNumPCs(); i++) {
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000113 if (!PCs[i]) continue;
114 std::string FileStr = DescribePC("%s", PCs[i]);
115 if (!IsInterestingCoverageFile(FileStr)) continue;
116 std::string FixedPCStr = DescribePC("%p", PCs[i]);
117 std::string FunctionStr = DescribePC("%F", PCs[i]);
118 std::string LineStr = DescribePC("%l", PCs[i]);
Kostya Serebryany1394ce22016-12-10 01:19:35 +0000119 char ModulePathRaw[4096] = ""; // What's PATH_MAX in portable C++?
120 void *OffsetRaw = nullptr;
121 if (!EF->__sanitizer_get_module_and_offset_for_pc(
122 reinterpret_cast<void *>(PCs[i]), ModulePathRaw,
123 sizeof(ModulePathRaw), &OffsetRaw))
124 continue;
125 std::string Module = ModulePathRaw;
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000126 uintptr_t FixedPC = std::stol(FixedPCStr, 0, 16);
Kostya Serebryany1394ce22016-12-10 01:19:35 +0000127 uintptr_t PcOffset = reinterpret_cast<uintptr_t>(OffsetRaw);
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000128 ModuleOffsets[Module] = FixedPC - PcOffset;
129 CoveredPCsPerModule[Module].push_back(PcOffset);
130 CoveredFunctions.insert(FunctionStr);
131 CoveredFiles.insert(FileStr);
Kostya Serebryany1cba0a92016-11-30 21:53:32 +0000132 CoveredDirs.insert(DirName(FileStr));
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000133 if (!CoveredLines.insert(FileStr + ":" + LineStr).second)
134 continue;
135 Printf("COVERED: %s %s:%s\n", FunctionStr.c_str(),
136 FileStr.c_str(), LineStr.c_str());
137 }
138
Kostya Serebryany1cba0a92016-11-30 21:53:32 +0000139 std::string CoveredDirsStr;
140 for (auto &Dir : CoveredDirs) {
141 if (!CoveredDirsStr.empty())
142 CoveredDirsStr += ",";
143 CoveredDirsStr += Dir;
144 }
145 Printf("COVERED_DIRS: %s\n", CoveredDirsStr.c_str());
146
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000147 for (auto &M : CoveredPCsPerModule) {
148 std::set<std::string> UncoveredFiles, UncoveredFunctions;
149 std::map<std::string, std::set<int> > UncoveredLines; // Func+File => lines
150 auto &ModuleName = M.first;
151 auto &CoveredOffsets = M.second;
152 uintptr_t ModuleOffset = ModuleOffsets[ModuleName];
153 std::sort(CoveredOffsets.begin(), CoveredOffsets.end());
154 Printf("MODULE_WITH_COVERAGE: %s\n", ModuleName.c_str());
155 // sancov does not yet fully support DSOs.
156 // std::string Cmd = "sancov -print-coverage-pcs " + ModuleName;
157 std::string Cmd = "objdump -d " + ModuleName +
158 " | grep 'call.*__sanitizer_cov_trace_pc_guard' | awk -F: '{print $1}'";
159 std::string SanCovOutput;
160 if (!ExecuteCommandAndReadOutput(Cmd, &SanCovOutput)) {
161 Printf("INFO: Command failed: %s\n", Cmd.c_str());
162 continue;
163 }
164 std::istringstream ISS(SanCovOutput);
165 std::string S;
166 while (std::getline(ISS, S, '\n')) {
167 uintptr_t PcOffset = std::stol(S, 0, 16);
168 if (!std::binary_search(CoveredOffsets.begin(), CoveredOffsets.end(),
169 PcOffset)) {
170 uintptr_t PC = ModuleOffset + PcOffset;
171 auto FileStr = DescribePC("%s", PC);
172 if (!IsInterestingCoverageFile(FileStr)) continue;
173 if (CoveredFiles.count(FileStr) == 0) {
174 UncoveredFiles.insert(FileStr);
175 continue;
176 }
177 auto FunctionStr = DescribePC("%F", PC);
178 if (CoveredFunctions.count(FunctionStr) == 0) {
179 UncoveredFunctions.insert(FunctionStr);
180 continue;
181 }
182 std::string LineStr = DescribePC("%l", PC);
183 uintptr_t Line = std::stoi(LineStr);
184 std::string FileLineStr = FileStr + ":" + LineStr;
185 if (CoveredLines.count(FileLineStr) == 0)
186 UncoveredLines[FunctionStr + " " + FileStr].insert(Line);
187 }
188 }
189 for (auto &FileLine: UncoveredLines)
190 for (int Line : FileLine.second)
191 Printf("UNCOVERED_LINE: %s:%d\n", FileLine.first.c_str(), Line);
192 for (auto &Func : UncoveredFunctions)
193 Printf("UNCOVERED_FUNC: %s\n", Func.c_str());
194 for (auto &File : UncoveredFiles)
195 Printf("UNCOVERED_FILE: %s\n", File.c_str());
Kostya Serebryanyb706b482016-09-18 21:47:08 +0000196 }
197}
198
Mike Aizatsky9b415be2016-12-19 22:18:08 +0000199void TracePC::DumpCoverage() {
200 __sanitizer_dump_coverage(PCs, GetNumPCs());
201}
202
// Value profile.
// We keep track of various values that affect control flow.
// These values are inserted into a bit-set-based hash map.
// Every new bit in the map is treated as new coverage.
//
// For memcmp/strcmp/etc. the interesting value is the length of the common
// prefix of the parameters.
// For cmp instructions the interesting value is derived from the XOR of the
// parameters (the number of set bits in the XOR, plus one).
// The interesting value is mixed with the low bits of the PC and is then
// added to the map.
212
Kostya Serebryany3a4e2dd2016-12-16 22:45:25 +0000213ATTRIBUTE_NO_SANITIZE_MEMORY
Kostya Serebryany379359c2016-10-05 01:09:40 +0000214void TracePC::AddValueForMemcmp(void *caller_pc, const void *s1, const void *s2,
215 size_t n) {
216 if (!n) return;
217 size_t Len = std::min(n, (size_t)32);
218 const uint8_t *A1 = reinterpret_cast<const uint8_t *>(s1);
219 const uint8_t *A2 = reinterpret_cast<const uint8_t *>(s2);
220 size_t I = 0;
221 for (; I < Len; I++)
222 if (A1[I] != A2[I])
223 break;
224 size_t PC = reinterpret_cast<size_t>(caller_pc);
225 size_t Idx = I;
226 // if (I < Len)
227 // Idx += __builtin_popcountl((A1[I] ^ A2[I])) - 1;
228 TPC.HandleValueProfile((PC & 4095) | (Idx << 12));
229}
230
Kostya Serebryany3a4e2dd2016-12-16 22:45:25 +0000231ATTRIBUTE_NO_SANITIZE_MEMORY
Kostya Serebryany379359c2016-10-05 01:09:40 +0000232void TracePC::AddValueForStrcmp(void *caller_pc, const char *s1, const char *s2,
233 size_t n) {
234 if (!n) return;
235 size_t Len = std::min(n, (size_t)32);
236 const uint8_t *A1 = reinterpret_cast<const uint8_t *>(s1);
237 const uint8_t *A2 = reinterpret_cast<const uint8_t *>(s2);
238 size_t I = 0;
239 for (; I < Len; I++)
240 if (A1[I] != A2[I] || A1[I] == 0)
241 break;
242 size_t PC = reinterpret_cast<size_t>(caller_pc);
243 size_t Idx = I;
244 // if (I < Len && A1[I])
245 // Idx += __builtin_popcountl((A1[I] ^ A2[I])) - 1;
246 TPC.HandleValueProfile((PC & 4095) | (Idx << 12));
247}
248
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000249template <class T>
Kostya Serebryany379359c2016-10-05 01:09:40 +0000250ATTRIBUTE_TARGET_POPCNT
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000251#ifdef __clang__ // g++ can't handle this __attribute__ here :(
252__attribute__((always_inline))
253#endif // __clang__
254void TracePC::HandleCmp(void *PC, T Arg1, T Arg2) {
255 uintptr_t PCuint = reinterpret_cast<uintptr_t>(PC);
Kostya Serebryanya5f94fb2016-10-14 20:20:33 +0000256 uint64_t ArgXor = Arg1 ^ Arg2;
257 uint64_t ArgDistance = __builtin_popcountl(ArgXor) + 1; // [1,65]
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000258 uintptr_t Idx = ((PCuint & 4095) + 1) * ArgDistance;
Kostya Serebryany94c427c2016-10-27 00:36:38 +0000259 if (sizeof(T) == 4)
260 TORC4.Insert(ArgXor, Arg1, Arg2);
261 else if (sizeof(T) == 8)
262 TORC8.Insert(ArgXor, Arg1, Arg2);
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000263 HandleValueProfile(Idx);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000264}
265
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +0000266} // namespace fuzzer
267
Dan Liew59144072016-06-06 20:27:09 +0000268extern "C" {
Kostya Serebryany32661f92016-08-18 20:52:52 +0000269__attribute__((visibility("default")))
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +0000270void __sanitizer_cov_trace_pc_guard(uint32_t *Guard) {
Kostya Serebryanya00b2432016-09-14 02:13:06 +0000271 uintptr_t PC = (uintptr_t)__builtin_return_address(0);
Kostya Serebryanya5277d52016-09-15 01:30:18 +0000272 fuzzer::TPC.HandleTrace(Guard, PC);
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +0000273}
Dan Liew59144072016-06-06 20:27:09 +0000274
Kostya Serebryany32661f92016-08-18 20:52:52 +0000275__attribute__((visibility("default")))
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +0000276void __sanitizer_cov_trace_pc_guard_init(uint32_t *Start, uint32_t *Stop) {
Kostya Serebryanya5277d52016-09-15 01:30:18 +0000277 fuzzer::TPC.HandleInit(Start, Stop);
Dan Liew59144072016-06-06 20:27:09 +0000278}
Kostya Serebryany09845172016-09-15 22:16:15 +0000279
280__attribute__((visibility("default")))
281void __sanitizer_cov_trace_pc_indir(uintptr_t Callee) {
282 uintptr_t PC = (uintptr_t)__builtin_return_address(0);
283 fuzzer::TPC.HandleCallerCallee(PC, Callee);
284}
Kostya Serebryany379359c2016-10-05 01:09:40 +0000285
Kostya Serebryany379359c2016-10-05 01:09:40 +0000286__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000287void __sanitizer_cov_trace_cmp8(uint64_t Arg1, uint64_t Arg2) {
288 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000289}
290__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000291void __sanitizer_cov_trace_cmp4(uint32_t Arg1, uint32_t Arg2) {
292 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000293}
294__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000295void __sanitizer_cov_trace_cmp2(uint16_t Arg1, uint16_t Arg2) {
296 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000297}
298__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000299void __sanitizer_cov_trace_cmp1(uint8_t Arg1, uint8_t Arg2) {
300 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000301}
302
303__attribute__((visibility("default")))
304void __sanitizer_cov_trace_switch(uint64_t Val, uint64_t *Cases) {
Kostya Serebryanyd19919a2016-10-11 01:14:41 +0000305 uint64_t N = Cases[0];
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000306 uint64_t ValSizeInBits = Cases[1];
Kostya Serebryanyd19919a2016-10-11 01:14:41 +0000307 uint64_t *Vals = Cases + 2;
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000308 // Skip the most common and the most boring case.
309 if (Vals[N - 1] < 256 && Val < 256)
310 return;
Kostya Serebryanyd19919a2016-10-11 01:14:41 +0000311 char *PC = (char*)__builtin_return_address(0);
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000312 size_t i;
313 uint64_t Token = 0;
314 for (i = 0; i < N; i++) {
315 Token = Val ^ Vals[i];
316 if (Val < Vals[i])
317 break;
318 }
319
320 if (ValSizeInBits == 16)
321 fuzzer::TPC.HandleCmp(PC + i, static_cast<uint16_t>(Token), (uint16_t)(0));
322 else if (ValSizeInBits == 32)
323 fuzzer::TPC.HandleCmp(PC + i, static_cast<uint32_t>(Token), (uint32_t)(0));
Kostya Serebryany00e638e2016-12-17 02:03:34 +0000324 else
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000325 fuzzer::TPC.HandleCmp(PC + i, Token, (uint64_t)(0));
Kostya Serebryany379359c2016-10-05 01:09:40 +0000326}
327
328__attribute__((visibility("default")))
329void __sanitizer_cov_trace_div4(uint32_t Val) {
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000330 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Val, (uint32_t)0);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000331}
332__attribute__((visibility("default")))
333void __sanitizer_cov_trace_div8(uint64_t Val) {
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000334 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Val, (uint64_t)0);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000335}
336__attribute__((visibility("default")))
337void __sanitizer_cov_trace_gep(uintptr_t Idx) {
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000338 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Idx, (uintptr_t)0);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000339}
340
341} // extern "C"