Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 1 | //===- FuzzerMutate.cpp - Mutate a test input -----------------------------===// |
| 2 | // |
| 3 | // The LLVM Compiler Infrastructure |
| 4 | // |
| 5 | // This file is distributed under the University of Illinois Open Source |
| 6 | // License. See LICENSE.TXT for details. |
| 7 | // |
| 8 | //===----------------------------------------------------------------------===// |
| 9 | // Mutate a test input. |
| 10 | //===----------------------------------------------------------------------===// |
| 11 | |
Kostya Serebryany | f342459 | 2015-05-22 22:35:31 +0000 | [diff] [blame] | 12 | #include <cstring> |
| 13 | |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 14 | #include "FuzzerInternal.h" |
| 15 | |
Kostya Serebryany | bf29ff2 | 2015-08-06 01:29:13 +0000 | [diff] [blame] | 16 | #include <algorithm> |
| 17 | |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 18 | namespace fuzzer { |
| 19 | |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 20 | struct Mutator { |
| 21 | size_t (MutationDispatcher::*Fn)(uint8_t *Data, size_t Size, size_t Max); |
| 22 | const char *Name; |
| 23 | }; |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 24 | |
| 25 | struct MutationDispatcher::Impl { |
| 26 | std::vector<Unit> Dictionary; |
| 27 | std::vector<Mutator> Mutators; |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 28 | std::vector<Mutator> CurrentMutatorSequence; |
Kostya Serebryany | 27ab2d7 | 2015-12-19 02:49:09 +0000 | [diff] [blame] | 29 | const std::vector<Unit> *Corpus = nullptr; |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 30 | |
| 31 | void Add(Mutator M) { Mutators.push_back(M); } |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 32 | Impl() { |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 33 | Add({&MutationDispatcher::Mutate_EraseByte, "EraseByte"}); |
| 34 | Add({&MutationDispatcher::Mutate_InsertByte, "InsertByte"}); |
| 35 | Add({&MutationDispatcher::Mutate_ChangeByte, "ChangeByte"}); |
| 36 | Add({&MutationDispatcher::Mutate_ChangeBit, "ChangeBit"}); |
| 37 | Add({&MutationDispatcher::Mutate_ShuffleBytes, "ShuffleBytes"}); |
| 38 | Add({&MutationDispatcher::Mutate_ChangeASCIIInteger, "ChangeASCIIInt"}); |
Kostya Serebryany | 27ab2d7 | 2015-12-19 02:49:09 +0000 | [diff] [blame] | 39 | Add({&MutationDispatcher::Mutate_CrossOver, "CrossOver"}); |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 40 | } |
| 41 | void AddWordToDictionary(const uint8_t *Word, size_t Size) { |
| 42 | if (Dictionary.empty()) { |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 43 | Add({&MutationDispatcher::Mutate_AddWordFromDictionary, "AddFromDict"}); |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 44 | } |
| 45 | Dictionary.push_back(Unit(Word, Word + Size)); |
| 46 | } |
Kostya Serebryany | 27ab2d7 | 2015-12-19 02:49:09 +0000 | [diff] [blame] | 47 | void SetCorpus(const std::vector<Unit> *Corpus) { this->Corpus = Corpus; } |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 48 | }; |
| 49 | |
Kostya Serebryany | 404c69f | 2015-07-24 01:06:40 +0000 | [diff] [blame] | 50 | static char FlipRandomBit(char X, FuzzerRandomBase &Rand) { |
| 51 | int Bit = Rand(8); |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 52 | char Mask = 1 << Bit; |
| 53 | char R; |
| 54 | if (X & (1 << Bit)) |
| 55 | R = X & ~Mask; |
| 56 | else |
| 57 | R = X | Mask; |
| 58 | assert(R != X); |
| 59 | return R; |
| 60 | } |
| 61 | |
Kostya Serebryany | 404c69f | 2015-07-24 01:06:40 +0000 | [diff] [blame] | 62 | static char RandCh(FuzzerRandomBase &Rand) { |
| 63 | if (Rand.RandBool()) return Rand(256); |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 64 | const char *Special = "!*'();:@&=+$,/?%#[]123ABCxyz-`~."; |
Kostya Serebryany | 404c69f | 2015-07-24 01:06:40 +0000 | [diff] [blame] | 65 | return Special[Rand(sizeof(Special) - 1)]; |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 66 | } |
| 67 | |
Kostya Serebryany | ec2dcb1 | 2015-09-03 21:24:19 +0000 | [diff] [blame] | 68 | size_t MutationDispatcher::Mutate_ShuffleBytes(uint8_t *Data, size_t Size, |
| 69 | size_t MaxSize) { |
Kostya Serebryany | bf29ff2 | 2015-08-06 01:29:13 +0000 | [diff] [blame] | 70 | assert(Size); |
Kostya Serebryany | 3b80487 | 2015-10-08 00:59:25 +0000 | [diff] [blame] | 71 | size_t ShuffleAmount = Rand(std::min(Size, (size_t)8)) + 1; // [1,8] and <= Size. |
Kostya Serebryany | bf29ff2 | 2015-08-06 01:29:13 +0000 | [diff] [blame] | 72 | size_t ShuffleStart = Rand(Size - ShuffleAmount); |
| 73 | assert(ShuffleStart + ShuffleAmount <= Size); |
| 74 | std::random_shuffle(Data + ShuffleStart, Data + ShuffleStart + ShuffleAmount, |
| 75 | Rand); |
| 76 | return Size; |
| 77 | } |
| 78 | |
Kostya Serebryany | ec2dcb1 | 2015-09-03 21:24:19 +0000 | [diff] [blame] | 79 | size_t MutationDispatcher::Mutate_EraseByte(uint8_t *Data, size_t Size, |
| 80 | size_t MaxSize) { |
Kostya Serebryany | 8ce7424 | 2015-08-01 01:42:51 +0000 | [diff] [blame] | 81 | assert(Size); |
Kostya Serebryany | b2e9897 | 2015-09-04 00:40:29 +0000 | [diff] [blame] | 82 | if (Size == 1) return 0; |
Kostya Serebryany | 8ce7424 | 2015-08-01 01:42:51 +0000 | [diff] [blame] | 83 | size_t Idx = Rand(Size); |
| 84 | // Erase Data[Idx]. |
| 85 | memmove(Data + Idx, Data + Idx + 1, Size - Idx - 1); |
| 86 | return Size - 1; |
| 87 | } |
| 88 | |
Kostya Serebryany | ec2dcb1 | 2015-09-03 21:24:19 +0000 | [diff] [blame] | 89 | size_t MutationDispatcher::Mutate_InsertByte(uint8_t *Data, size_t Size, |
| 90 | size_t MaxSize) { |
Kostya Serebryany | b2e9897 | 2015-09-04 00:40:29 +0000 | [diff] [blame] | 91 | if (Size == MaxSize) return 0; |
Kostya Serebryany | 86a5fba | 2015-08-01 02:23:06 +0000 | [diff] [blame] | 92 | size_t Idx = Rand(Size + 1); |
| 93 | // Insert new value at Data[Idx]. |
| 94 | memmove(Data + Idx + 1, Data + Idx, Size - Idx); |
| 95 | Data[Idx] = RandCh(Rand); |
| 96 | return Size + 1; |
| 97 | } |
| 98 | |
Kostya Serebryany | ec2dcb1 | 2015-09-03 21:24:19 +0000 | [diff] [blame] | 99 | size_t MutationDispatcher::Mutate_ChangeByte(uint8_t *Data, size_t Size, |
| 100 | size_t MaxSize) { |
Kostya Serebryany | 86a5fba | 2015-08-01 02:23:06 +0000 | [diff] [blame] | 101 | size_t Idx = Rand(Size); |
| 102 | Data[Idx] = RandCh(Rand); |
| 103 | return Size; |
| 104 | } |
| 105 | |
Kostya Serebryany | ec2dcb1 | 2015-09-03 21:24:19 +0000 | [diff] [blame] | 106 | size_t MutationDispatcher::Mutate_ChangeBit(uint8_t *Data, size_t Size, |
| 107 | size_t MaxSize) { |
Kostya Serebryany | 86a5fba | 2015-08-01 02:23:06 +0000 | [diff] [blame] | 108 | size_t Idx = Rand(Size); |
| 109 | Data[Idx] = FlipRandomBit(Data[Idx], Rand); |
| 110 | return Size; |
| 111 | } |
| 112 | |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 113 | size_t MutationDispatcher::Mutate_AddWordFromDictionary(uint8_t *Data, |
| 114 | size_t Size, |
| 115 | size_t MaxSize) { |
| 116 | auto &D = MDImpl->Dictionary; |
Kostya Serebryany | b2e9897 | 2015-09-04 00:40:29 +0000 | [diff] [blame] | 117 | assert(!D.empty()); |
| 118 | if (D.empty()) return 0; |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 119 | const Unit &Word = D[Rand(D.size())]; |
Kostya Serebryany | 80eb76a | 2016-01-06 02:13:04 +0000 | [diff] [blame^] | 120 | if (Rand.RandBool()) { // Insert Word. |
| 121 | if (Size + Word.size() > MaxSize) return 0; |
| 122 | size_t Idx = Rand(Size + 1); |
| 123 | memmove(Data + Idx + Word.size(), Data + Idx, Size - Idx); |
| 124 | memcpy(Data + Idx, Word.data(), Word.size()); |
| 125 | return Size + Word.size(); |
| 126 | } else { // Overwrite some bytes with Word. |
| 127 | if (Word.size() > Size) return 0; |
| 128 | size_t Idx = Rand(Size - Word.size()); |
| 129 | memcpy(Data + Idx, Word.data(), Word.size()); |
| 130 | return Size; |
| 131 | } |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 132 | } |
| 133 | |
Kostya Serebryany | 25425ad | 2015-09-08 17:19:31 +0000 | [diff] [blame] | 134 | size_t MutationDispatcher::Mutate_ChangeASCIIInteger(uint8_t *Data, size_t Size, |
| 135 | size_t MaxSize) { |
| 136 | size_t B = Rand(Size); |
| 137 | while (B < Size && !isdigit(Data[B])) B++; |
| 138 | if (B == Size) return 0; |
| 139 | size_t E = B; |
| 140 | while (E < Size && isdigit(Data[E])) E++; |
| 141 | assert(B < E); |
| 142 | // now we have digits in [B, E). |
| 143 | // strtol and friends don't accept non-zero-teminated data, parse it manually. |
| 144 | uint64_t Val = Data[B] - '0'; |
| 145 | for (size_t i = B + 1; i < E; i++) |
| 146 | Val = Val * 10 + Data[i] - '0'; |
| 147 | |
| 148 | // Mutate the integer value. |
| 149 | switch(Rand(5)) { |
| 150 | case 0: Val++; break; |
| 151 | case 1: Val--; break; |
| 152 | case 2: Val /= 2; break; |
| 153 | case 3: Val *= 2; break; |
| 154 | case 4: Val = Rand(Val * Val); break; |
| 155 | default: assert(0); |
| 156 | } |
| 157 | // Just replace the bytes with the new ones, don't bother moving bytes. |
| 158 | for (size_t i = B; i < E; i++) { |
| 159 | size_t Idx = E + B - i - 1; |
| 160 | assert(Idx >= B && Idx < E); |
| 161 | Data[Idx] = (Val % 10) + '0'; |
| 162 | Val /= 10; |
| 163 | } |
| 164 | return Size; |
| 165 | } |
| 166 | |
Kostya Serebryany | 27ab2d7 | 2015-12-19 02:49:09 +0000 | [diff] [blame] | 167 | size_t MutationDispatcher::Mutate_CrossOver(uint8_t *Data, size_t Size, |
| 168 | size_t MaxSize) { |
| 169 | auto Corpus = MDImpl->Corpus; |
| 170 | if (!Corpus || Corpus->size() < 2 || Size == 0) return 0; |
| 171 | size_t Idx = Rand(Corpus->size()); |
| 172 | const Unit &Other = (*Corpus)[Idx]; |
| 173 | if (Other.empty()) return 0; |
| 174 | Unit U(MaxSize); |
| 175 | size_t NewSize = |
| 176 | CrossOver(Data, Size, Other.data(), Other.size(), U.data(), U.size()); |
| 177 | assert(NewSize > 0 && "CrossOver returned empty unit"); |
| 178 | assert(NewSize <= MaxSize && "CrossOver returned overisized unit"); |
| 179 | memcpy(Data, U.data(), NewSize); |
| 180 | return NewSize; |
| 181 | } |
| 182 | |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 183 | void MutationDispatcher::StartMutationSequence() { |
| 184 | MDImpl->CurrentMutatorSequence.clear(); |
| 185 | } |
| 186 | |
| 187 | void MutationDispatcher::PrintMutationSequence() { |
| 188 | Printf("MS: %zd ", MDImpl->CurrentMutatorSequence.size()); |
| 189 | for (auto M : MDImpl->CurrentMutatorSequence) |
| 190 | Printf("%s-", M.Name); |
| 191 | } |
| 192 | |
Kostya Serebryany | f342459 | 2015-05-22 22:35:31 +0000 | [diff] [blame] | 193 | // Mutates Data in place, returns new size. |
Kostya Serebryany | ec2dcb1 | 2015-09-03 21:24:19 +0000 | [diff] [blame] | 194 | size_t MutationDispatcher::Mutate(uint8_t *Data, size_t Size, size_t MaxSize) { |
Kostya Serebryany | f342459 | 2015-05-22 22:35:31 +0000 | [diff] [blame] | 195 | assert(MaxSize > 0); |
| 196 | assert(Size <= MaxSize); |
| 197 | if (Size == 0) { |
| 198 | for (size_t i = 0; i < MaxSize; i++) |
Kostya Serebryany | 404c69f | 2015-07-24 01:06:40 +0000 | [diff] [blame] | 199 | Data[i] = RandCh(Rand); |
Kostya Serebryany | f342459 | 2015-05-22 22:35:31 +0000 | [diff] [blame] | 200 | return MaxSize; |
Kostya Serebryany | 5b266a8 | 2015-02-04 19:10:20 +0000 | [diff] [blame] | 201 | } |
Kostya Serebryany | f342459 | 2015-05-22 22:35:31 +0000 | [diff] [blame] | 202 | assert(Size > 0); |
Kostya Serebryany | b2e9897 | 2015-09-04 00:40:29 +0000 | [diff] [blame] | 203 | // Some mutations may fail (e.g. can't insert more bytes if Size == MaxSize), |
| 204 | // in which case they will return 0. |
| 205 | // Try several times before returning un-mutated data. |
| 206 | for (int Iter = 0; Iter < 10; Iter++) { |
| 207 | size_t MutatorIdx = Rand(MDImpl->Mutators.size()); |
Kostya Serebryany | 14c5028 | 2015-12-19 01:09:49 +0000 | [diff] [blame] | 208 | auto M = MDImpl->Mutators[MutatorIdx]; |
| 209 | size_t NewSize = (this->*(M.Fn))(Data, Size, MaxSize); |
| 210 | if (NewSize) { |
| 211 | MDImpl->CurrentMutatorSequence.push_back(M); |
| 212 | return NewSize; |
| 213 | } |
Kostya Serebryany | b2e9897 | 2015-09-04 00:40:29 +0000 | [diff] [blame] | 214 | } |
Kostya Serebryany | f342459 | 2015-05-22 22:35:31 +0000 | [diff] [blame] | 215 | return Size; |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 216 | } |
| 217 | |
Kostya Serebryany | 27ab2d7 | 2015-12-19 02:49:09 +0000 | [diff] [blame] | 218 | void MutationDispatcher::SetCorpus(const std::vector<Unit> *Corpus) { |
| 219 | MDImpl->SetCorpus(Corpus); |
| 220 | } |
| 221 | |
Kostya Serebryany | 7d21166 | 2015-09-04 00:12:11 +0000 | [diff] [blame] | 222 | void MutationDispatcher::AddWordToDictionary(const uint8_t *Word, size_t Size) { |
| 223 | MDImpl->AddWordToDictionary(Word, Size); |
| 224 | } |
| 225 | |
| 226 | MutationDispatcher::MutationDispatcher(FuzzerRandomBase &Rand) : Rand(Rand) { |
| 227 | MDImpl = new Impl; |
| 228 | } |
| 229 | |
| 230 | MutationDispatcher::~MutationDispatcher() { delete MDImpl; } |
| 231 | |
Aaron Ballman | ef11698 | 2015-01-29 16:58:29 +0000 | [diff] [blame] | 232 | } // namespace fuzzer |