blob: 01c0b8c2ddb510439521a1ec18e4d0e10ac5313b [file] [log] [blame]
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +00001//===- FuzzerTracePC.cpp - PC tracing--------------------------------------===//
2//
3// The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9// Trace PCs.
Kostya Serebryanya00b2432016-09-14 02:13:06 +000010// This module implements __sanitizer_cov_trace_pc_guard[_init],
11// the callback required for -fsanitize-coverage=trace-pc-guard instrumentation.
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000012//
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000013//===----------------------------------------------------------------------===//
14
Kostya Serebryany1c73f1b2016-10-05 22:56:21 +000015#include "FuzzerCorpus.h"
Kostya Serebryany86586182016-09-21 21:17:23 +000016#include "FuzzerDefs.h"
Kostya Serebryanya5f94fb2016-10-14 20:20:33 +000017#include "FuzzerDictionary.h"
Kostya Serebryany95b1a432016-10-19 00:12:03 +000018#include "FuzzerExtFunctions.h"
Zachary Turner24a148b2016-11-30 19:06:14 +000019#include "FuzzerIO.h"
Kostya Serebryany6f5a8042016-09-21 01:50:50 +000020#include "FuzzerTracePC.h"
Kostya Serebryany86586182016-09-21 21:17:23 +000021#include "FuzzerValueBitMap.h"
Zachary Turner24a148b2016-11-30 19:06:14 +000022#include <map>
Mike Aizatsky9b415be2016-12-19 22:18:08 +000023#include <sanitizer/coverage_interface.h>
Zachary Turner24a148b2016-11-30 19:06:14 +000024#include <set>
25#include <sstream>
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000026
27namespace fuzzer {
Mike Aizatsky1aa501e2016-05-10 23:43:15 +000028
Kostya Serebryanya00b2432016-09-14 02:13:06 +000029TracePC TPC;
Mike Aizatsky1aa501e2016-05-10 23:43:15 +000030
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +000031void TracePC::HandleTrace(uint32_t *Guard, uintptr_t PC) {
32 uint32_t Idx = *Guard;
Kostya Serebryany8e781a82016-09-18 04:52:23 +000033 if (!Idx) return;
Kostya Serebryany2fabeca2016-10-26 18:52:04 +000034 PCs[Idx % kNumPCs] = PC;
35 Counters[Idx % kNumCounters]++;
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000036}
Kostya Serebryanya5277d52016-09-15 01:30:18 +000037
Kostya Serebryany275e2602016-10-25 23:52:25 +000038size_t TracePC::GetTotalPCCoverage() {
39 size_t Res = 0;
Kostya Serebryany06b87572016-10-26 00:42:52 +000040 for (size_t i = 1; i < GetNumPCs(); i++)
Kostya Serebryany275e2602016-10-25 23:52:25 +000041 if (PCs[i])
42 Res++;
43 return Res;
44}
45
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +000046void TracePC::HandleInit(uint32_t *Start, uint32_t *Stop) {
Kostya Serebryany3e36ec12016-09-17 05:04:47 +000047 if (Start == Stop || *Start) return;
48 assert(NumModules < sizeof(Modules) / sizeof(Modules[0]));
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +000049 for (uint32_t *P = Start; P < Stop; P++)
Kostya Serebryany8e781a82016-09-18 04:52:23 +000050 *P = ++NumGuards;
Kostya Serebryany3e36ec12016-09-17 05:04:47 +000051 Modules[NumModules].Start = Start;
52 Modules[NumModules].Stop = Stop;
53 NumModules++;
54}
55
56void TracePC::PrintModuleInfo() {
57 Printf("INFO: Loaded %zd modules (%zd guards): ", NumModules, NumGuards);
58 for (size_t i = 0; i < NumModules; i++)
59 Printf("[%p, %p), ", Modules[i].Start, Modules[i].Stop);
60 Printf("\n");
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +000061}
Kostya Serebryanya5277d52016-09-15 01:30:18 +000062
Kostya Serebryany09845172016-09-15 22:16:15 +000063void TracePC::HandleCallerCallee(uintptr_t Caller, uintptr_t Callee) {
64 const uintptr_t kBits = 12;
65 const uintptr_t kMask = (1 << kBits) - 1;
Kostya Serebryany1c73f1b2016-10-05 22:56:21 +000066 uintptr_t Idx = (Caller & kMask) | ((Callee & kMask) << kBits);
67 HandleValueProfile(Idx);
Kostya Serebryany09845172016-09-15 22:16:15 +000068}
69
// Returns true if File should appear in the coverage report.
// A file is filtered out when its path contains "compiler-rt/lib/"
// (sanitizer internals), "/usr/lib/" or "/usr/include/", or when it is
// exactly "<null>".
// File is only read, so it is taken by const reference; callers may pass
// temporaries and const strings.
static bool IsInterestingCoverageFile(const std::string &File) {
  if (File.find("compiler-rt/lib/") != std::string::npos)
    return false; // sanitizer internal.
  if (File.find("/usr/lib/") != std::string::npos)
    return false;
  if (File.find("/usr/include/") != std::string::npos)
    return false;
  if (File == "<null>")
    return false;
  return true;
}
81
Kostya Serebryany11a22bc2016-12-30 01:13:07 +000082void TracePC::InitializePrintNewPCs() {
83 assert(!PrintedPCs);
84 PrintedPCs = new std::set<uintptr_t>;
85 for (size_t i = 1; i < GetNumPCs(); i++)
86 if (PCs[i])
87 PrintedPCs->insert(PCs[i]);
88}
89
Kostya Serebryanya5b2e542016-10-26 00:20:51 +000090void TracePC::PrintNewPCs() {
Kostya Serebryany11a22bc2016-12-30 01:13:07 +000091 assert(PrintedPCs);
92 for (size_t i = 1; i < GetNumPCs(); i++)
93 if (PCs[i] && PrintedPCs->insert(PCs[i]).second)
94 PrintPC("\tNEW_PC: %p %F %L\n", "\tNEW_PC: %p\n", PCs[i]);
Kostya Serebryanya5b2e542016-10-26 00:20:51 +000095}
96
Kostya Serebryanyb706b482016-09-18 21:47:08 +000097void TracePC::PrintCoverage() {
Kostya Serebryany1394ce22016-12-10 01:19:35 +000098 if (!EF->__sanitizer_symbolize_pc ||
99 !EF->__sanitizer_get_module_and_offset_for_pc) {
100 Printf("INFO: __sanitizer_symbolize_pc or "
101 "__sanitizer_get_module_and_offset_for_pc is not available,"
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000102 " not printing coverage\n");
103 return;
104 }
105 std::map<std::string, std::vector<uintptr_t>> CoveredPCsPerModule;
106 std::map<std::string, uintptr_t> ModuleOffsets;
Kostya Serebryany1cba0a92016-11-30 21:53:32 +0000107 std::set<std::string> CoveredDirs, CoveredFiles, CoveredFunctions,
108 CoveredLines;
Kostya Serebryanyb706b482016-09-18 21:47:08 +0000109 Printf("COVERAGE:\n");
Kostya Serebryany06b87572016-10-26 00:42:52 +0000110 for (size_t i = 1; i < GetNumPCs(); i++) {
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000111 if (!PCs[i]) continue;
112 std::string FileStr = DescribePC("%s", PCs[i]);
113 if (!IsInterestingCoverageFile(FileStr)) continue;
114 std::string FixedPCStr = DescribePC("%p", PCs[i]);
115 std::string FunctionStr = DescribePC("%F", PCs[i]);
116 std::string LineStr = DescribePC("%l", PCs[i]);
Kostya Serebryany1394ce22016-12-10 01:19:35 +0000117 char ModulePathRaw[4096] = ""; // What's PATH_MAX in portable C++?
118 void *OffsetRaw = nullptr;
119 if (!EF->__sanitizer_get_module_and_offset_for_pc(
120 reinterpret_cast<void *>(PCs[i]), ModulePathRaw,
121 sizeof(ModulePathRaw), &OffsetRaw))
122 continue;
123 std::string Module = ModulePathRaw;
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000124 uintptr_t FixedPC = std::stol(FixedPCStr, 0, 16);
Kostya Serebryany1394ce22016-12-10 01:19:35 +0000125 uintptr_t PcOffset = reinterpret_cast<uintptr_t>(OffsetRaw);
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000126 ModuleOffsets[Module] = FixedPC - PcOffset;
127 CoveredPCsPerModule[Module].push_back(PcOffset);
128 CoveredFunctions.insert(FunctionStr);
129 CoveredFiles.insert(FileStr);
Kostya Serebryany1cba0a92016-11-30 21:53:32 +0000130 CoveredDirs.insert(DirName(FileStr));
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000131 if (!CoveredLines.insert(FileStr + ":" + LineStr).second)
132 continue;
133 Printf("COVERED: %s %s:%s\n", FunctionStr.c_str(),
134 FileStr.c_str(), LineStr.c_str());
135 }
136
Kostya Serebryany1cba0a92016-11-30 21:53:32 +0000137 std::string CoveredDirsStr;
138 for (auto &Dir : CoveredDirs) {
139 if (!CoveredDirsStr.empty())
140 CoveredDirsStr += ",";
141 CoveredDirsStr += Dir;
142 }
143 Printf("COVERED_DIRS: %s\n", CoveredDirsStr.c_str());
144
Kostya Serebryany95b1a432016-10-19 00:12:03 +0000145 for (auto &M : CoveredPCsPerModule) {
146 std::set<std::string> UncoveredFiles, UncoveredFunctions;
147 std::map<std::string, std::set<int> > UncoveredLines; // Func+File => lines
148 auto &ModuleName = M.first;
149 auto &CoveredOffsets = M.second;
150 uintptr_t ModuleOffset = ModuleOffsets[ModuleName];
151 std::sort(CoveredOffsets.begin(), CoveredOffsets.end());
152 Printf("MODULE_WITH_COVERAGE: %s\n", ModuleName.c_str());
153 // sancov does not yet fully support DSOs.
154 // std::string Cmd = "sancov -print-coverage-pcs " + ModuleName;
155 std::string Cmd = "objdump -d " + ModuleName +
156 " | grep 'call.*__sanitizer_cov_trace_pc_guard' | awk -F: '{print $1}'";
157 std::string SanCovOutput;
158 if (!ExecuteCommandAndReadOutput(Cmd, &SanCovOutput)) {
159 Printf("INFO: Command failed: %s\n", Cmd.c_str());
160 continue;
161 }
162 std::istringstream ISS(SanCovOutput);
163 std::string S;
164 while (std::getline(ISS, S, '\n')) {
165 uintptr_t PcOffset = std::stol(S, 0, 16);
166 if (!std::binary_search(CoveredOffsets.begin(), CoveredOffsets.end(),
167 PcOffset)) {
168 uintptr_t PC = ModuleOffset + PcOffset;
169 auto FileStr = DescribePC("%s", PC);
170 if (!IsInterestingCoverageFile(FileStr)) continue;
171 if (CoveredFiles.count(FileStr) == 0) {
172 UncoveredFiles.insert(FileStr);
173 continue;
174 }
175 auto FunctionStr = DescribePC("%F", PC);
176 if (CoveredFunctions.count(FunctionStr) == 0) {
177 UncoveredFunctions.insert(FunctionStr);
178 continue;
179 }
180 std::string LineStr = DescribePC("%l", PC);
181 uintptr_t Line = std::stoi(LineStr);
182 std::string FileLineStr = FileStr + ":" + LineStr;
183 if (CoveredLines.count(FileLineStr) == 0)
184 UncoveredLines[FunctionStr + " " + FileStr].insert(Line);
185 }
186 }
187 for (auto &FileLine: UncoveredLines)
188 for (int Line : FileLine.second)
189 Printf("UNCOVERED_LINE: %s:%d\n", FileLine.first.c_str(), Line);
190 for (auto &Func : UncoveredFunctions)
191 Printf("UNCOVERED_FUNC: %s\n", Func.c_str());
192 for (auto &File : UncoveredFiles)
193 Printf("UNCOVERED_FILE: %s\n", File.c_str());
Kostya Serebryanyb706b482016-09-18 21:47:08 +0000194 }
195}
196
Mike Aizatsky9b415be2016-12-19 22:18:08 +0000197void TracePC::DumpCoverage() {
198 __sanitizer_dump_coverage(PCs, GetNumPCs());
199}
200
Kostya Serebryany379359c2016-10-05 01:09:40 +0000201// Value profile.
202// We keep track of various values that affect control flow.
203// These values are inserted into a bit-set-based hash map.
204// Every new bit in the map is treated as a new coverage.
205//
206// For memcmp/strcmp/etc the interesting value is the length of the common
207// prefix of the parameters.
208// For cmp instructions the interesting value is a XOR of the parameters.
209// The interesting value is mixed up with the PC and is then added to the map.
210
Kostya Serebryany3a4e2dd2016-12-16 22:45:25 +0000211ATTRIBUTE_NO_SANITIZE_MEMORY
Kostya Serebryany379359c2016-10-05 01:09:40 +0000212void TracePC::AddValueForMemcmp(void *caller_pc, const void *s1, const void *s2,
213 size_t n) {
214 if (!n) return;
215 size_t Len = std::min(n, (size_t)32);
216 const uint8_t *A1 = reinterpret_cast<const uint8_t *>(s1);
217 const uint8_t *A2 = reinterpret_cast<const uint8_t *>(s2);
218 size_t I = 0;
219 for (; I < Len; I++)
220 if (A1[I] != A2[I])
221 break;
222 size_t PC = reinterpret_cast<size_t>(caller_pc);
223 size_t Idx = I;
224 // if (I < Len)
225 // Idx += __builtin_popcountl((A1[I] ^ A2[I])) - 1;
226 TPC.HandleValueProfile((PC & 4095) | (Idx << 12));
227}
228
Kostya Serebryany3a4e2dd2016-12-16 22:45:25 +0000229ATTRIBUTE_NO_SANITIZE_MEMORY
Kostya Serebryany379359c2016-10-05 01:09:40 +0000230void TracePC::AddValueForStrcmp(void *caller_pc, const char *s1, const char *s2,
231 size_t n) {
232 if (!n) return;
233 size_t Len = std::min(n, (size_t)32);
234 const uint8_t *A1 = reinterpret_cast<const uint8_t *>(s1);
235 const uint8_t *A2 = reinterpret_cast<const uint8_t *>(s2);
236 size_t I = 0;
237 for (; I < Len; I++)
238 if (A1[I] != A2[I] || A1[I] == 0)
239 break;
240 size_t PC = reinterpret_cast<size_t>(caller_pc);
241 size_t Idx = I;
242 // if (I < Len && A1[I])
243 // Idx += __builtin_popcountl((A1[I] ^ A2[I])) - 1;
244 TPC.HandleValueProfile((PC & 4095) | (Idx << 12));
245}
246
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000247template <class T>
Kostya Serebryany379359c2016-10-05 01:09:40 +0000248ATTRIBUTE_TARGET_POPCNT
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000249#ifdef __clang__ // g++ can't handle this __attribute__ here :(
250__attribute__((always_inline))
251#endif // __clang__
252void TracePC::HandleCmp(void *PC, T Arg1, T Arg2) {
253 uintptr_t PCuint = reinterpret_cast<uintptr_t>(PC);
Kostya Serebryanya5f94fb2016-10-14 20:20:33 +0000254 uint64_t ArgXor = Arg1 ^ Arg2;
255 uint64_t ArgDistance = __builtin_popcountl(ArgXor) + 1; // [1,65]
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000256 uintptr_t Idx = ((PCuint & 4095) + 1) * ArgDistance;
Kostya Serebryany94c427c2016-10-27 00:36:38 +0000257 if (sizeof(T) == 4)
258 TORC4.Insert(ArgXor, Arg1, Arg2);
259 else if (sizeof(T) == 8)
260 TORC8.Insert(ArgXor, Arg1, Arg2);
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000261 HandleValueProfile(Idx);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000262}
263
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +0000264} // namespace fuzzer
265
Dan Liew59144072016-06-06 20:27:09 +0000266extern "C" {
Kostya Serebryany32661f92016-08-18 20:52:52 +0000267__attribute__((visibility("default")))
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +0000268void __sanitizer_cov_trace_pc_guard(uint32_t *Guard) {
Kostya Serebryanya00b2432016-09-14 02:13:06 +0000269 uintptr_t PC = (uintptr_t)__builtin_return_address(0);
Kostya Serebryanya5277d52016-09-15 01:30:18 +0000270 fuzzer::TPC.HandleTrace(Guard, PC);
Kostya Serebryanyda63c1d2016-02-26 21:33:56 +0000271}
Dan Liew59144072016-06-06 20:27:09 +0000272
Kostya Serebryany32661f92016-08-18 20:52:52 +0000273__attribute__((visibility("default")))
Kostya Serebryanya9b0dd02016-09-29 17:43:24 +0000274void __sanitizer_cov_trace_pc_guard_init(uint32_t *Start, uint32_t *Stop) {
Kostya Serebryanya5277d52016-09-15 01:30:18 +0000275 fuzzer::TPC.HandleInit(Start, Stop);
Dan Liew59144072016-06-06 20:27:09 +0000276}
Kostya Serebryany09845172016-09-15 22:16:15 +0000277
278__attribute__((visibility("default")))
279void __sanitizer_cov_trace_pc_indir(uintptr_t Callee) {
280 uintptr_t PC = (uintptr_t)__builtin_return_address(0);
281 fuzzer::TPC.HandleCallerCallee(PC, Callee);
282}
Kostya Serebryany379359c2016-10-05 01:09:40 +0000283
Kostya Serebryany379359c2016-10-05 01:09:40 +0000284__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000285void __sanitizer_cov_trace_cmp8(uint64_t Arg1, uint64_t Arg2) {
286 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000287}
288__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000289void __sanitizer_cov_trace_cmp4(uint32_t Arg1, uint32_t Arg2) {
290 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000291}
292__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000293void __sanitizer_cov_trace_cmp2(uint16_t Arg1, uint16_t Arg2) {
294 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000295}
296__attribute__((visibility("default")))
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000297void __sanitizer_cov_trace_cmp1(uint8_t Arg1, uint8_t Arg2) {
298 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Arg1, Arg2);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000299}
300
301__attribute__((visibility("default")))
302void __sanitizer_cov_trace_switch(uint64_t Val, uint64_t *Cases) {
Kostya Serebryanyd19919a2016-10-11 01:14:41 +0000303 uint64_t N = Cases[0];
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000304 uint64_t ValSizeInBits = Cases[1];
Kostya Serebryanyd19919a2016-10-11 01:14:41 +0000305 uint64_t *Vals = Cases + 2;
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000306 // Skip the most common and the most boring case.
307 if (Vals[N - 1] < 256 && Val < 256)
308 return;
Kostya Serebryanyd19919a2016-10-11 01:14:41 +0000309 char *PC = (char*)__builtin_return_address(0);
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000310 size_t i;
311 uint64_t Token = 0;
312 for (i = 0; i < N; i++) {
313 Token = Val ^ Vals[i];
314 if (Val < Vals[i])
315 break;
316 }
317
318 if (ValSizeInBits == 16)
319 fuzzer::TPC.HandleCmp(PC + i, static_cast<uint16_t>(Token), (uint16_t)(0));
320 else if (ValSizeInBits == 32)
321 fuzzer::TPC.HandleCmp(PC + i, static_cast<uint32_t>(Token), (uint32_t)(0));
Kostya Serebryany00e638e2016-12-17 02:03:34 +0000322 else
Kostya Serebryanyd7238042016-12-29 02:50:35 +0000323 fuzzer::TPC.HandleCmp(PC + i, Token, (uint64_t)(0));
Kostya Serebryany379359c2016-10-05 01:09:40 +0000324}
325
326__attribute__((visibility("default")))
327void __sanitizer_cov_trace_div4(uint32_t Val) {
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000328 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Val, (uint32_t)0);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000329}
330__attribute__((visibility("default")))
331void __sanitizer_cov_trace_div8(uint64_t Val) {
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000332 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Val, (uint64_t)0);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000333}
334__attribute__((visibility("default")))
335void __sanitizer_cov_trace_gep(uintptr_t Idx) {
Kostya Serebryany17d176e12016-10-13 16:19:09 +0000336 fuzzer::TPC.HandleCmp(__builtin_return_address(0), Idx, (uintptr_t)0);
Kostya Serebryany379359c2016-10-05 01:09:40 +0000337}
338
339} // extern "C"