//===- FuzzerInternal.h - Internal header for the Fuzzer --------*- C++ -*-===//
//
//                     The LLVM Compiler Infrastructure
//
// This file is distributed under the University of Illinois Open Source
// License. See LICENSE.TXT for details.
//
//===----------------------------------------------------------------------===//
// Define the main class fuzzer::Fuzzer and most functions.
//===----------------------------------------------------------------------===//
Yaron Keren347663b2015-08-10 16:37:40 +000011
12#ifndef LLVM_FUZZER_INTERNAL_H
13#define LLVM_FUZZER_INTERNAL_H
14
#include <cassert>
#include <chrono>
#include <climits>
#include <cstddef>
#include <cstdint>
#include <cstdlib>
#include <limits>
#include <string>
#include <unordered_set>
#include <vector>

#include "FuzzerInterface.h"
25
Aaron Ballmanef116982015-01-29 16:58:29 +000026namespace fuzzer {
Aaron Ballmanef116982015-01-29 16:58:29 +000027using namespace std::chrono;
// Byte-sequence type used throughout the fuzzer for inputs ("units").
typedef std::vector<uint8_t> Unit;

// File and directory helpers (defined out of line).
std::string FileToString(const std::string &Path);
Unit FileToVector(const std::string &Path);
void ReadDirToVectorOfUnits(const char *Path, std::vector<Unit> *V,
                            long *Epoch);
void WriteToFile(const Unit &U, const std::string &Path);
void CopyFileToErr(const std::string &Path);
// Returns "Dir/FileName" or equivalent for the current OS.
std::string DirPlusFile(const std::string &DirPath,
                        const std::string &FileName);

// Output helpers. For the Print* functions 'PrintAfter' defaults to the empty
// string.
void Printf(const char *Fmt, ...);
void PrintHexArray(const Unit &U, const char *PrintAfter = "");
void PrintHexArray(const uint8_t *Data, size_t Size,
                   const char *PrintAfter = "");
void PrintASCII(const uint8_t *Data, size_t Size, const char *PrintAfter = "");
void PrintASCII(const Unit &U, const char *PrintAfter = "");

// Miscellaneous utilities (defined out of line).
std::string Hash(const Unit &U);
void SetTimer(int Seconds);
std::string Base64(const Unit &U);
int ExecuteCommand(const std::string &Command);

// Private copy of SHA1 implementation.
static const int kSHA1NumBytes = 20;
// Computes SHA1 hash of 'Len' bytes in 'Data', writes kSHA1NumBytes to 'Out'.
void ComputeSHA1(const uint8_t *Data, size_t Len, uint8_t *Out);

// Changes U to contain only ASCII (isprint+isspace) characters.
// Returns true iff U has been changed.
bool ToASCII(Unit &U);
bool IsASCII(const Unit &U);

int NumberOfCpuCores();
int GetPid();

// Dictionary.

// Parses one dictionary entry.
// If successful, writes the entry to U and returns true,
// otherwise returns false.
bool ParseOneDictionaryEntry(const std::string &Str, Unit *U);
// Parses the dictionary file, fills Units, returns true iff all lines
// were parsed successfully.
bool ParseDictionaryFile(const std::string &Text, std::vector<Unit> *Units);
73
Kostya Serebryany628bc3e2016-01-16 00:04:36 +000074class MutationDispatcher {
75 public:
76 MutationDispatcher(FuzzerRandomBase &Rand);
77 ~MutationDispatcher();
78 /// Indicate that we are about to start a new sequence of mutations.
79 void StartMutationSequence();
80 /// Print the current sequence of mutations.
81 void PrintMutationSequence();
82 /// Indicate that the current sequence of mutations was successfull.
83 void RecordSuccessfulMutationSequence();
84 /// Mutates data by shuffling bytes.
85 size_t Mutate_ShuffleBytes(uint8_t *Data, size_t Size, size_t MaxSize);
86 /// Mutates data by erasing a byte.
87 size_t Mutate_EraseByte(uint8_t *Data, size_t Size, size_t MaxSize);
88 /// Mutates data by inserting a byte.
89 size_t Mutate_InsertByte(uint8_t *Data, size_t Size, size_t MaxSize);
90 /// Mutates data by chanding one byte.
91 size_t Mutate_ChangeByte(uint8_t *Data, size_t Size, size_t MaxSize);
92 /// Mutates data by chanding one bit.
93 size_t Mutate_ChangeBit(uint8_t *Data, size_t Size, size_t MaxSize);
94
95 /// Mutates data by adding a word from the manual dictionary.
96 size_t Mutate_AddWordFromManualDictionary(uint8_t *Data, size_t Size,
97 size_t MaxSize);
98
99 /// Mutates data by adding a word from the temporary automatic dictionary.
100 size_t Mutate_AddWordFromTemporaryAutoDictionary(uint8_t *Data, size_t Size,
101 size_t MaxSize);
102
103 /// Mutates data by adding a word from the persistent automatic dictionary.
104 size_t Mutate_AddWordFromPersistentAutoDictionary(uint8_t *Data, size_t Size,
105 size_t MaxSize);
106
107 /// Tries to find an ASCII integer in Data, changes it to another ASCII int.
108 size_t Mutate_ChangeASCIIInteger(uint8_t *Data, size_t Size, size_t MaxSize);
109
110 /// CrossOver Data with some other element of the corpus.
111 size_t Mutate_CrossOver(uint8_t *Data, size_t Size, size_t MaxSize);
112
113 /// Applies one of the above mutations.
114 /// Returns the new size of data which could be up to MaxSize.
115 size_t Mutate(uint8_t *Data, size_t Size, size_t MaxSize);
116
117 /// Creates a cross-over of two pieces of Data, returns its size.
118 size_t CrossOver(const uint8_t *Data1, size_t Size1, const uint8_t *Data2,
119 size_t Size2, uint8_t *Out, size_t MaxOutSize);
120
121 void AddWordToManualDictionary(const Unit &Word);
122
123 void AddWordToAutoDictionary(const Unit &Word, size_t PositionHint);
124 void ClearAutoDictionary();
125 void PrintRecommendedDictionary();
126
127 void SetCorpus(const std::vector<Unit> *Corpus);
128
129 private:
130 FuzzerRandomBase &Rand;
131 struct Impl;
132 Impl *MDImpl;
133};
134
Aaron Ballmanef116982015-01-29 16:58:29 +0000135class Fuzzer {
136 public:
137 struct FuzzingOptions {
138 int Verbosity = 1;
139 int MaxLen = 0;
Kostya Serebryany490bbd62015-05-19 22:12:57 +0000140 int UnitTimeoutSec = 300;
Kostya Serebryanyb85db172015-10-02 20:47:55 +0000141 int MaxTotalTimeSec = 0;
Aaron Ballmanef116982015-01-29 16:58:29 +0000142 bool DoCrossOver = true;
Kostya Serebryany5b266a82015-02-04 19:10:20 +0000143 int MutateDepth = 5;
Aaron Ballmanef116982015-01-29 16:58:29 +0000144 bool ExitOnFirst = false;
Kostya Serebryanybe5e0ed2015-03-03 23:27:02 +0000145 bool UseCounters = false;
Kostya Serebryany2e9fca92015-10-22 23:55:39 +0000146 bool UseIndirCalls = true;
Kostya Serebryany5a99ecb2015-05-11 20:51:19 +0000147 bool UseTraces = false;
Kostya Serebryanyae5b9562016-01-15 06:24:05 +0000148 bool UseMemcmp = true;
Kostya Serebryany2c1b33b2015-01-29 23:01:07 +0000149 bool UseFullCoverageSet = false;
Kostya Serebryany1ac80552015-05-08 21:30:55 +0000150 bool Reload = true;
Kostya Serebryanyfed509e2015-10-17 04:38:26 +0000151 bool ShuffleAtStartUp = true;
Kostya Serebryany92e04762015-02-04 23:42:42 +0000152 int PreferSmallDuringInitialShuffle = -1;
Kostya Serebryany33f86692015-02-04 22:20:09 +0000153 size_t MaxNumberOfRuns = ULONG_MAX;
Kostya Serebryany2da7b842015-05-18 21:34:20 +0000154 int SyncTimeout = 600;
Kostya Serebryany70926ae2015-08-05 21:43:48 +0000155 int ReportSlowUnits = 10;
Kostya Serebryanybc7c0ad2015-08-11 01:44:42 +0000156 bool OnlyASCII = false;
Aaron Ballmanef116982015-01-29 16:58:29 +0000157 std::string OutputCorpus;
Kostya Serebryany2da7b842015-05-18 21:34:20 +0000158 std::string SyncCommand;
Kostya Serebryanybd5d1cd2015-10-09 03:57:59 +0000159 std::string ArtifactPrefix = "./";
Kostya Serebryany2d0ef142015-11-25 21:40:46 +0000160 std::string ExactArtifactPath;
Kostya Serebryanyb91c62b2015-10-16 22:41:47 +0000161 bool SaveArtifacts = true;
Kostya Serebryanydc3135d2015-11-12 01:02:01 +0000162 bool PrintNEW = true; // Print a status line when new units are found;
Mike Aizatskya9c23872015-11-12 04:38:40 +0000163 bool OutputCSV = false;
Mike Aizatsky8b11f872016-01-06 00:21:22 +0000164 bool PrintNewCovPcs = false;
Aaron Ballmanef116982015-01-29 16:58:29 +0000165 };
Kostya Serebryanyf3424592015-05-22 22:35:31 +0000166 Fuzzer(UserSuppliedFuzzer &USF, FuzzingOptions Options);
Aaron Ballmanef116982015-01-29 16:58:29 +0000167 void AddToCorpus(const Unit &U) { Corpus.push_back(U); }
Kostya Serebryanydc3135d2015-11-12 01:02:01 +0000168 size_t ChooseUnitIdxToMutate();
169 const Unit &ChooseUnitToMutate() { return Corpus[ChooseUnitIdxToMutate()]; };
Kostya Serebryany468ed782015-09-08 17:30:35 +0000170 void Loop();
Kostya Serebryanydc3135d2015-11-12 01:02:01 +0000171 void Drill();
Aaron Ballmanef116982015-01-29 16:58:29 +0000172 void ShuffleAndMinimize();
Kostya Serebryany22526252015-05-11 21:16:27 +0000173 void InitializeTraceState();
Kostya Serebryanyd50a3ee2016-01-13 23:02:30 +0000174 void AssignTaintLabels(uint8_t *Data, size_t Size);
Aaron Ballmanef116982015-01-29 16:58:29 +0000175 size_t CorpusSize() const { return Corpus.size(); }
Kostya Serebryany1ac80552015-05-08 21:30:55 +0000176 void ReadDir(const std::string &Path, long *Epoch) {
Kostya Serebryany9cc3b0d2015-10-24 01:16:40 +0000177 Printf("Loading corpus: %s\n", Path.c_str());
Kostya Serebryany1ac80552015-05-08 21:30:55 +0000178 ReadDirToVectorOfUnits(Path.c_str(), &Corpus, Epoch);
Aaron Ballmanef116982015-01-29 16:58:29 +0000179 }
Kostya Serebryany1ac80552015-05-08 21:30:55 +0000180 void RereadOutputCorpus();
Aaron Ballmanef116982015-01-29 16:58:29 +0000181 // Save the current corpus to OutputCorpus.
182 void SaveCorpus();
183
Kostya Serebryany92e04762015-02-04 23:42:42 +0000184 size_t secondsSinceProcessStartUp() {
185 return duration_cast<seconds>(system_clock::now() - ProcessStartTime)
186 .count();
187 }
188
189 size_t getTotalNumberOfRuns() { return TotalNumberOfRuns; }
190
Kostya Serebryany52a788e2015-03-31 20:13:20 +0000191 static void StaticAlarmCallback();
192
Ivan Krasin95e82d52015-10-01 23:23:06 +0000193 void ExecuteCallback(const Unit &U);
Aaron Ballmanef116982015-01-29 16:58:29 +0000194
Kostya Serebryany9cc3b0d2015-10-24 01:16:40 +0000195 // Merge Corpora[1:] into Corpora[0].
196 void Merge(const std::vector<std::string> &Corpora);
197
Aaron Ballmanef116982015-01-29 16:58:29 +0000198 private:
Kostya Serebryany52a788e2015-03-31 20:13:20 +0000199 void AlarmCallback();
Kostya Serebryany27ab2d72015-12-19 02:49:09 +0000200 void MutateAndTestOne();
Kostya Serebryany007c9b22015-10-22 22:50:47 +0000201 void ReportNewCoverage(const Unit &U);
202 bool RunOne(const Unit &U);
Kostya Serebryanybc7c0ad2015-08-11 01:44:42 +0000203 void RunOneAndUpdateCorpus(Unit &U);
Aaron Ballmanef116982015-01-29 16:58:29 +0000204 void WriteToOutputCorpus(const Unit &U);
Kostya Serebryany2b7d2e92015-07-23 18:37:22 +0000205 void WriteUnitToFileWithPrefix(const Unit &U, const char *Prefix);
Kostya Serebryany09d2a5f2015-10-22 22:56:45 +0000206 void PrintStats(const char *Where, const char *End = "\n");
Kostya Serebryanydc3135d2015-11-12 01:02:01 +0000207 void PrintStatusForNewUnit(const Unit &U);
Aaron Ballmanef116982015-01-29 16:58:29 +0000208
Kostya Serebryany2da7b842015-05-18 21:34:20 +0000209 void SyncCorpus();
210
Kostya Serebryany007c9b22015-10-22 22:50:47 +0000211 size_t RecordBlockCoverage();
Kostya Serebryany2e9fca92015-10-22 23:55:39 +0000212 size_t RecordCallerCalleeCoverage();
Kostya Serebryany007c9b22015-10-22 22:50:47 +0000213 void PrepareCoverageBeforeRun();
214 bool CheckCoverageAfterRun();
215
216
Kostya Serebryanybeb24c32015-05-07 21:02:11 +0000217 // Trace-based fuzzing: we run a unit with some kind of tracing
218 // enabled and record potentially useful mutations. Then
219 // We apply these mutations one by one to the unit and run it again.
220
221 // Start tracing; forget all previously proposed mutations.
222 void StartTraceRecording();
Kostya Serebryanyb65805a2016-01-09 03:08:58 +0000223 // Stop tracing.
224 void StopTraceRecording();
Kostya Serebryanybeb24c32015-05-07 21:02:11 +0000225
Aaron Ballmanef116982015-01-29 16:58:29 +0000226 void SetDeathCallback();
Kostya Serebryany52a788e2015-03-31 20:13:20 +0000227 static void StaticDeathCallback();
228 void DeathCallback();
Kostya Serebryany98abb2c2016-01-13 23:46:01 +0000229
230 uint8_t *CurrentUnitData;
231 size_t CurrentUnitSize;
Aaron Ballmanef116982015-01-29 16:58:29 +0000232
233 size_t TotalNumberOfRuns = 0;
Kostya Serebryany12c78372015-08-12 01:55:37 +0000234 size_t TotalNumberOfExecutedTraceBasedMutations = 0;
Aaron Ballmanef116982015-01-29 16:58:29 +0000235
236 std::vector<Unit> Corpus;
Kostya Serebryanycbb23342015-05-19 01:06:07 +0000237 std::unordered_set<std::string> UnitHashesAddedToCorpus;
Kostya Serebryanybe5e0ed2015-03-03 23:27:02 +0000238
239 // For UseCounters
240 std::vector<uint8_t> CounterBitmap;
241 size_t TotalBits() { // Slow. Call it only for printing stats.
242 size_t Res = 0;
243 for (auto x : CounterBitmap) Res += __builtin_popcount(x);
244 return Res;
245 }
246
Kostya Serebryanyf3424592015-05-22 22:35:31 +0000247 UserSuppliedFuzzer &USF;
Aaron Ballmanef116982015-01-29 16:58:29 +0000248 FuzzingOptions Options;
249 system_clock::time_point ProcessStartTime = system_clock::now();
Kostya Serebryany2da7b842015-05-18 21:34:20 +0000250 system_clock::time_point LastExternalSync = system_clock::now();
Kostya Serebryany52a788e2015-03-31 20:13:20 +0000251 system_clock::time_point UnitStartTime;
Kostya Serebryany16901a92015-03-30 23:04:35 +0000252 long TimeOfLongestUnitInSeconds = 0;
Kostya Serebryany1ac80552015-05-08 21:30:55 +0000253 long EpochOfLastReadOfOutputCorpus = 0;
Kostya Serebryany007c9b22015-10-22 22:50:47 +0000254 size_t LastRecordedBlockCoverage = 0;
Kostya Serebryany2e9fca92015-10-22 23:55:39 +0000255 size_t LastRecordedCallerCalleeCoverage = 0;
Mike Aizatsky8b11f872016-01-06 00:21:22 +0000256 size_t LastCoveragePcBufferLen = 0;
Aaron Ballmanef116982015-01-29 16:58:29 +0000257};
258
Kostya Serebryanyf3424592015-05-22 22:35:31 +0000259class SimpleUserSuppliedFuzzer: public UserSuppliedFuzzer {
260 public:
Kostya Serebryany404c69f2015-07-24 01:06:40 +0000261 SimpleUserSuppliedFuzzer(FuzzerRandomBase *Rand, UserCallback Callback)
262 : UserSuppliedFuzzer(Rand), Callback(Callback) {}
Kostya Serebryany20bb5e72015-10-02 23:34:06 +0000263
Kostya Serebryany20bb5e72015-10-02 23:34:06 +0000264 virtual int TargetFunction(const uint8_t *Data, size_t Size) override {
Kostya Serebryany94660b32015-10-23 18:37:58 +0000265 return Callback(Data, Size);
Kostya Serebryanyf3424592015-05-22 22:35:31 +0000266 }
267
268 private:
Kostya Serebryany20bb5e72015-10-02 23:34:06 +0000269 UserCallback Callback = nullptr;
Kostya Serebryanyf3424592015-05-22 22:35:31 +0000270};
271
Aaron Ballmanef116982015-01-29 16:58:29 +0000272}; // namespace fuzzer
Yaron Keren347663b2015-08-10 16:37:40 +0000273
274#endif // LLVM_FUZZER_INTERNAL_H