Vitaly Buka | 00b6107 | 2016-10-19 23:22:51 | [diff] [blame] | 1 | // Copyright 2016 Google Inc. All rights reserved. |
| 2 | // |
| 3 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | // you may not use this file except in compliance with the License. |
| 5 | // You may obtain a copy of the License at |
| 6 | // |
| 7 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | // |
| 9 | // Unless required by applicable law or agreed to in writing, software |
| 10 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 | // See the License for the specific language governing permissions and |
| 13 | // limitations under the License. |
| 14 | |
Vitaly Buka | f90698f | 2017-03-01 23:46:58 | [diff] [blame] | 15 | #include "src/mutator.h" |
Vitaly Buka | 00b6107 | 2016-10-19 23:22:51 | [diff] [blame] | 16 | |
#include <algorithm>
#include <limits>
#include <map>
#include <random>
#include <string>
#include <utility>
#include <vector>
Vitaly Buka | 00b6107 | 2016-10-19 23:22:51 | [diff] [blame] | 22 | |
Vitaly Buka | 9dd2f8e | 2017-01-13 08:48:31 | [diff] [blame] | 23 | #include "src/field_instance.h" |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 24 | #include "src/utf8_fix.h" |
Vitaly Buka | 9dd2f8e | 2017-01-13 08:48:31 | [diff] [blame] | 25 | #include "src/weighted_reservoir_sampler.h" |
Vitaly Buka | 00b6107 | 2016-10-19 23:22:51 | [diff] [blame] | 26 | |
Vitaly Buka | f86815c | 2017-02-27 22:19:19 | [diff] [blame] | 27 | namespace protobuf_mutator { |
| 28 | |
Vitaly Buka | 6c6dbbe | 2017-02-22 21:58:24 | [diff] [blame] | 29 | using protobuf::Descriptor; |
Vitaly Buka | 6c6dbbe | 2017-02-22 21:58:24 | [diff] [blame] | 30 | using protobuf::FieldDescriptor; |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 31 | using protobuf::FileDescriptor; |
Vitaly Buka | 6c6dbbe | 2017-02-22 21:58:24 | [diff] [blame] | 32 | using protobuf::Message; |
| 33 | using protobuf::OneofDescriptor; |
| 34 | using protobuf::Reflection; |
Vitaly Buka | 4782c14 | 2017-03-04 08:12:32 | [diff] [blame] | 35 | using protobuf::util::MessageDifferencer; |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 36 | using std::placeholders::_1; |
Vitaly Buka | 0e17fd7 | 2016-11-18 18:02:46 | [diff] [blame] | 37 | |
| 38 | namespace { |
| 39 | |
// Depth limit handed to InitializeAndTrim() by Mutator::Mutate().
constexpr int kMaxInitializeDepth = 200;

// Weight given to every candidate that MutationSampler offers to its
// reservoir sampler.
constexpr uint64_t kDefaultMutateWeight = 1000000;
Vitaly Buka | 0e17fd7 | 2016-11-18 18:02:46 | [diff] [blame] | 42 | |
// Kinds of change that can be selected for a single field.
enum class Mutation {
  None,    // No mutation was selected.
  Add,     // Adds a new field with its default value.
  Mutate,  // Mutates the contents of the field.
  Delete,  // Deletes the field.
  Copy,    // Copies a value from another field into this field.

  // TODO(vitalybuka):
  // Clone,  // Adds new field with value copied from another field.
};
| 53 | |
Vitaly Buka | b592ff0 | 2017-03-03 22:35:52 | [diff] [blame] | 54 | // Return random integer from [0, count) |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 55 | size_t GetRandomIndex(RandomEngine* random, size_t count) { |
Vitaly Buka | b592ff0 | 2017-03-03 22:35:52 | [diff] [blame] | 56 | assert(count > 0); |
| 57 | if (count == 1) return 0; |
| 58 | return std::uniform_int_distribution<size_t>(0, count - 1)(*random); |
| 59 | } |
| 60 | |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 61 | // Flips random bit in the buffer. |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 62 | void FlipBit(size_t size, uint8_t* bytes, RandomEngine* random) { |
Vitaly Buka | b592ff0 | 2017-03-03 22:35:52 | [diff] [blame] | 63 | size_t bit = GetRandomIndex(random, size * 8); |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 64 | bytes[bit / 8] ^= (1u << (bit % 8)); |
| 65 | } |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 66 | |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 67 | // Flips random bit in the value. |
| 68 | template <class T> |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 69 | T FlipBit(T value, RandomEngine* random) { |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 70 | FlipBit(sizeof(value), reinterpret_cast<uint8_t*>(&value), random); |
| 71 | return value; |
| 72 | } |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 73 | |
Vitaly Buka | beb9080 | 2017-02-28 23:28:10 | [diff] [blame] | 74 | // Return true with probability about 1-of-n. |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 75 | bool GetRandomBool(RandomEngine* random, size_t n = 2) { |
Vitaly Buka | beb9080 | 2017-02-28 23:28:10 | [diff] [blame] | 76 | return GetRandomIndex(random, n) == 0; |
| 77 | } |
| 78 | |
Vitaly Buka | 28ca0ee | 2017-03-05 05:35:42 | [diff] [blame] | 79 | bool IsProto3SimpleField(const FieldDescriptor& field) { |
| 80 | assert(field.file()->syntax() == FileDescriptor::SYNTAX_PROTO3 || |
| 81 | field.file()->syntax() == FileDescriptor::SYNTAX_PROTO2); |
| 82 | return field.file()->syntax() == FileDescriptor::SYNTAX_PROTO3 && |
| 83 | field.cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE && |
| 84 | !field.containing_oneof() && !field.is_repeated(); |
| 85 | } |
| 86 | |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 87 | struct CreateDefaultField : public FieldFunction<CreateDefaultField> { |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 88 | template <class T> |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 89 | void ForType(const FieldInstance& field) const { |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 90 | T value; |
| 91 | field.GetDefault(&value); |
| 92 | field.Create(value); |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 93 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 94 | }; |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 95 | |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 96 | struct DeleteField : public FieldFunction<DeleteField> { |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 97 | template <class T> |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 98 | void ForType(const FieldInstance& field) const { |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 99 | field.Delete(); |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 100 | } |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 101 | }; |
| 102 | |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 103 | struct CopyField : public FieldFunction<CopyField> { |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 104 | template <class T> |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 105 | void ForType(const ConstFieldInstance& source, |
| 106 | const FieldInstance& field) const { |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 107 | T value; |
| 108 | source.Load(&value); |
| 109 | field.Store(value); |
| 110 | } |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 111 | }; |
| 112 | |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 113 | struct AppendField : public FieldFunction<AppendField> { |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 114 | template <class T> |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 115 | void ForType(const ConstFieldInstance& source, |
| 116 | const FieldInstance& field) const { |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 117 | T value; |
| 118 | source.Load(&value); |
| 119 | field.Create(value); |
| 120 | } |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 121 | }; |
| 122 | |
Vitaly Buka | 2792ed7 | 2019-01-23 19:04:24 | [diff] [blame] | 123 | class CanCopyAndDifferentField |
| 124 | : public FieldFunction<CanCopyAndDifferentField, bool> { |
Vitaly Buka | 4782c14 | 2017-03-04 08:12:32 | [diff] [blame] | 125 | public: |
| 126 | template <class T> |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 127 | bool ForType(const ConstFieldInstance& src, const ConstFieldInstance& dst, |
| 128 | int size_increase_hint) const { |
Vitaly Buka | 2792ed7 | 2019-01-23 19:04:24 | [diff] [blame] | 129 | T s; |
| 130 | src.Load(&s); |
| 131 | if (!dst.CanStore(s)) return false; |
| 132 | T d; |
| 133 | dst.Load(&d); |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 134 | return SizeDiff(s, d) <= size_increase_hint && !IsEqual(s, d); |
Vitaly Buka | 4782c14 | 2017-03-04 08:12:32 | [diff] [blame] | 135 | } |
| 136 | |
| 137 | private: |
| 138 | bool IsEqual(const ConstFieldInstance::Enum& a, |
| 139 | const ConstFieldInstance::Enum& b) const { |
| 140 | assert(a.count == b.count); |
| 141 | return a.index == b.index; |
| 142 | } |
| 143 | |
| 144 | bool IsEqual(const std::unique_ptr<protobuf::Message>& a, |
| 145 | const std::unique_ptr<protobuf::Message>& b) const { |
| 146 | return MessageDifferencer::Equals(*a, *b); |
| 147 | } |
| 148 | |
| 149 | template <class T> |
| 150 | bool IsEqual(const T& a, const T& b) const { |
| 151 | return a == b; |
| 152 | } |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 153 | |
| 154 | int64_t SizeDiff(const std::unique_ptr<protobuf::Message>& src, |
| 155 | const std::unique_ptr<protobuf::Message>& dst) const { |
| 156 | return src->ByteSizeLong() - dst->ByteSizeLong(); |
| 157 | } |
| 158 | |
| 159 | int64_t SizeDiff(const std::string& src, const std::string& dst) const { |
| 160 | return src.size() - dst.size(); |
| 161 | } |
| 162 | |
| 163 | template <class T> |
| 164 | int64_t SizeDiff(const T&, const T&) const { |
| 165 | return 0; |
| 166 | } |
Vitaly Buka | 4782c14 | 2017-03-04 08:12:32 | [diff] [blame] | 167 | }; |
| 168 | |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 169 | // Selects random field and mutation from the given proto message. |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 170 | class MutationSampler { |
Vitaly Buka | c9d2248 | 2016-11-21 21:29:17 | [diff] [blame] | 171 | public: |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 172 | MutationSampler(bool keep_initialized, bool can_grow, RandomEngine* random, |
| 173 | Message* message) |
| 174 | : keep_initialized_(keep_initialized), |
| 175 | can_grow_(can_grow), |
| 176 | random_(random), |
| 177 | sampler_(random) { |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 178 | Sample(message); |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 179 | assert(mutation() != Mutation::None || !can_grow || |
Vitaly Buka | f3383a9 | 2017-03-20 00:04:18 | [diff] [blame] | 180 | message->GetDescriptor()->field_count() == 0); |
Vitaly Buka | c9d2248 | 2016-11-21 21:29:17 | [diff] [blame] | 181 | } |
| 182 | |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 183 | // Returns selected field. |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 184 | const FieldInstance& field() const { return sampler_.selected().field; } |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 185 | |
| 186 | // Returns selected mutation. |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 187 | Mutation mutation() const { return sampler_.selected().mutation; } |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 188 | |
| 189 | private: |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 190 | void Sample(Message* message) { |
| 191 | const Descriptor* descriptor = message->GetDescriptor(); |
| 192 | const Reflection* reflection = message->GetReflection(); |
| 193 | |
| 194 | int field_count = descriptor->field_count(); |
| 195 | for (int i = 0; i < field_count; ++i) { |
| 196 | const FieldDescriptor* field = descriptor->field(i); |
| 197 | if (const OneofDescriptor* oneof = field->containing_oneof()) { |
| 198 | // Handle entire oneof group on the first field. |
| 199 | if (field->index_in_oneof() == 0) { |
Vitaly Buka | 2f660a5 | 2017-03-04 03:46:14 | [diff] [blame] | 200 | assert(oneof->field_count()); |
| 201 | const FieldDescriptor* current_field = |
| 202 | reflection->GetOneofFieldDescriptor(*message, oneof); |
| 203 | for (;;) { |
| 204 | const FieldDescriptor* add_field = |
| 205 | oneof->field(GetRandomIndex(random_, oneof->field_count())); |
| 206 | if (add_field != current_field) { |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 207 | Try({message, add_field}, Mutation::Add); |
Vitaly Buka | 2f660a5 | 2017-03-04 03:46:14 | [diff] [blame] | 208 | break; |
| 209 | } |
| 210 | if (oneof->field_count() < 2) break; |
| 211 | } |
| 212 | if (current_field) { |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 213 | if (current_field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) |
| 214 | Try({message, current_field}, Mutation::Mutate); |
| 215 | Try({message, current_field}, Mutation::Delete); |
| 216 | Try({message, current_field}, Mutation::Copy); |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 217 | } |
| 218 | } |
| 219 | } else { |
| 220 | if (field->is_repeated()) { |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 221 | int field_size = reflection->FieldSize(*message, field); |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 222 | Try({message, field, GetRandomIndex(random_, field_size + 1)}, |
| 223 | Mutation::Add); |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 224 | |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 225 | if (field_size) { |
| 226 | size_t random_index = GetRandomIndex(random_, field_size); |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 227 | if (field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) |
| 228 | Try({message, field, random_index}, Mutation::Mutate); |
| 229 | Try({message, field, random_index}, Mutation::Delete); |
| 230 | Try({message, field, random_index}, Mutation::Copy); |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 231 | } |
| 232 | } else { |
Vitaly Buka | 28ca0ee | 2017-03-05 05:35:42 | [diff] [blame] | 233 | if (reflection->HasField(*message, field) || |
| 234 | IsProto3SimpleField(*field)) { |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 235 | if (field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) |
| 236 | Try({message, field}, Mutation::Mutate); |
Vitaly Buka | 28ca0ee | 2017-03-05 05:35:42 | [diff] [blame] | 237 | if (!IsProto3SimpleField(*field) && |
| 238 | (!field->is_required() || !keep_initialized_)) { |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 239 | Try({message, field}, Mutation::Delete); |
Vitaly Buka | 28ca0ee | 2017-03-05 05:35:42 | [diff] [blame] | 240 | } |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 241 | Try({message, field}, Mutation::Copy); |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 242 | } else { |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 243 | Try({message, field}, Mutation::Add); |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 244 | } |
| 245 | } |
| 246 | } |
| 247 | |
| 248 | if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) { |
| 249 | if (field->is_repeated()) { |
| 250 | const int field_size = reflection->FieldSize(*message, field); |
| 251 | for (int j = 0; j < field_size; ++j) |
| 252 | Sample(reflection->MutableRepeatedMessage(message, field, j)); |
| 253 | } else if (reflection->HasField(*message, field)) { |
| 254 | Sample(reflection->MutableMessage(message, field)); |
| 255 | } |
| 256 | } |
| 257 | } |
| 258 | } |
| 259 | |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 260 | void Try(const FieldInstance& field, Mutation mutation) { |
| 261 | assert(mutation != Mutation::None); |
| 262 | if (!can_grow_ && mutation != Mutation::Delete) return; |
| 263 | sampler_.Try(kDefaultMutateWeight, {field, mutation}); |
| 264 | } |
| 265 | |
Vitaly Buka | 781853c | 2016-11-22 07:09:35 | [diff] [blame] | 266 | bool keep_initialized_ = false; |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 267 | bool can_grow_ = false; |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 268 | |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 269 | RandomEngine* random_; |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 270 | |
| 271 | struct Result { |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 272 | Result() = default; |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 273 | Result(const FieldInstance& f, Mutation m) : field(f), mutation(m) {} |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 274 | |
Vitaly Buka | bec5222 | 2016-12-09 22:29:32 | [diff] [blame] | 275 | FieldInstance field; |
| 276 | Mutation mutation = Mutation::None; |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 277 | }; |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 278 | WeightedReservoirSampler<Result, RandomEngine> sampler_; |
Vitaly Buka | c9d2248 | 2016-11-21 21:29:17 | [diff] [blame] | 279 | }; |
| 280 | |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 281 | // Selects random field of compatible type to use for clone mutations. |
| 282 | class DataSourceSampler { |
| 283 | public: |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 284 | DataSourceSampler(const ConstFieldInstance& match, RandomEngine* random, |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 285 | int size_increase_hint, const Message& message) |
| 286 | : match_(match), |
| 287 | random_(random), |
| 288 | size_increase_hint_(size_increase_hint), |
| 289 | sampler_(random) { |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 290 | Sample(message); |
| 291 | } |
| 292 | |
| 293 | // Returns selected field. |
Vitaly Buka | 8871286 | 2017-02-27 06:21:30 | [diff] [blame] | 294 | const ConstFieldInstance& field() const { |
Vitaly Buka | 72019dc | 2016-12-15 03:17:24 | [diff] [blame] | 295 | assert(!IsEmpty()); |
| 296 | return sampler_.selected(); |
| 297 | } |
| 298 | |
| 299 | bool IsEmpty() const { return sampler_.IsEmpty(); } |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 300 | |
| 301 | private: |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 302 | void Sample(const Message& message) { |
| 303 | const Descriptor* descriptor = message.GetDescriptor(); |
| 304 | const Reflection* reflection = message.GetReflection(); |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 305 | |
| 306 | int field_count = descriptor->field_count(); |
| 307 | for (int i = 0; i < field_count; ++i) { |
| 308 | const FieldDescriptor* field = descriptor->field(i); |
| 309 | if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) { |
| 310 | if (field->is_repeated()) { |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 311 | const int field_size = reflection->FieldSize(message, field); |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 312 | for (int j = 0; j < field_size; ++j) { |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 313 | Sample(reflection->GetRepeatedMessage(message, field, j)); |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 314 | } |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 315 | } else if (reflection->HasField(message, field)) { |
| 316 | Sample(reflection->GetMessage(message, field)); |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 317 | } |
| 318 | } |
| 319 | |
| 320 | if (field->cpp_type() != match_.cpp_type()) continue; |
| 321 | if (match_.cpp_type() == FieldDescriptor::CPPTYPE_ENUM) { |
| 322 | if (field->enum_type() != match_.enum_type()) continue; |
| 323 | } else if (match_.cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) { |
| 324 | if (field->message_type() != match_.message_type()) continue; |
| 325 | } |
| 326 | |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 327 | if (field->is_repeated()) { |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 328 | if (int field_size = reflection->FieldSize(message, field)) { |
| 329 | ConstFieldInstance source(&message, field, |
Vitaly Buka | 4782c14 | 2017-03-04 08:12:32 | [diff] [blame] | 330 | GetRandomIndex(random_, field_size)); |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 331 | if (CanCopyAndDifferentField()(source, match_, size_increase_hint_)) |
Vitaly Buka | 4782c14 | 2017-03-04 08:12:32 | [diff] [blame] | 332 | sampler_.Try(field_size, source); |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 333 | } |
| 334 | } else { |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 335 | if (reflection->HasField(message, field)) { |
| 336 | ConstFieldInstance source(&message, field); |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 337 | if (CanCopyAndDifferentField()(source, match_, size_increase_hint_)) |
Vitaly Buka | 2792ed7 | 2019-01-23 19:04:24 | [diff] [blame] | 338 | sampler_.Try(1, source); |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 339 | } |
| 340 | } |
| 341 | } |
| 342 | } |
| 343 | |
Vitaly Buka | 8871286 | 2017-02-27 06:21:30 | [diff] [blame] | 344 | ConstFieldInstance match_; |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 345 | RandomEngine* random_; |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 346 | int size_increase_hint_; |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 347 | |
Vitaly Buka | f62fe47 | 2017-03-02 07:05:15 | [diff] [blame] | 348 | WeightedReservoirSampler<ConstFieldInstance, RandomEngine> sampler_; |
Vitaly Buka | a3e59c7 | 2016-12-07 00:53:56 | [diff] [blame] | 349 | }; |
| 350 | |
Vitaly Buka | 0e17fd7 | 2016-11-18 18:02:46 | [diff] [blame] | 351 | } // namespace |
| 352 | |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 353 | class FieldMutator { |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 354 | public: |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 355 | FieldMutator(int size_increase_hint, bool enforce_changes, |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 356 | bool enforce_utf8_strings, const protobuf::Message& source, |
| 357 | Mutator* mutator) |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 358 | : size_increase_hint_(size_increase_hint), |
| 359 | enforce_changes_(enforce_changes), |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 360 | enforce_utf8_strings_(enforce_utf8_strings), |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 361 | source_(source), |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 362 | mutator_(mutator) {} |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 363 | |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 364 | void Mutate(int32_t* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 365 | RepeatMutate(value, std::bind(&Mutator::MutateInt32, mutator_, _1)); |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 366 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 367 | |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 368 | void Mutate(int64_t* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 369 | RepeatMutate(value, std::bind(&Mutator::MutateInt64, mutator_, _1)); |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 370 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 371 | |
| 372 | void Mutate(uint32_t* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 373 | RepeatMutate(value, std::bind(&Mutator::MutateUInt32, mutator_, _1)); |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 374 | } |
| 375 | |
| 376 | void Mutate(uint64_t* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 377 | RepeatMutate(value, std::bind(&Mutator::MutateUInt64, mutator_, _1)); |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 378 | } |
| 379 | |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 380 | void Mutate(float* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 381 | RepeatMutate(value, std::bind(&Mutator::MutateFloat, mutator_, _1)); |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 382 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 383 | |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 384 | void Mutate(double* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 385 | RepeatMutate(value, std::bind(&Mutator::MutateDouble, mutator_, _1)); |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 386 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 387 | |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 388 | void Mutate(bool* value) const { |
Vitaly Buka | d7f943f | 2019-01-31 22:05:33 | [diff] [blame] | 389 | RepeatMutate(value, std::bind(&Mutator::MutateBool, mutator_, _1)); |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 390 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 391 | |
| 392 | void Mutate(FieldInstance::Enum* value) const { |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 393 | RepeatMutate(&value->index, |
Vitaly Buka | d7f943f | 2019-01-31 22:05:33 | [diff] [blame] | 394 | std::bind(&Mutator::MutateEnum, mutator_, _1, value->count)); |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 395 | assert(value->index < value->count); |
| 396 | } |
| 397 | |
| 398 | void Mutate(std::string* value) const { |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 399 | if (enforce_utf8_strings_) { |
| 400 | RepeatMutate(value, std::bind(&Mutator::MutateUtf8String, mutator_, _1, |
| 401 | size_increase_hint_)); |
| 402 | } else { |
| 403 | RepeatMutate(value, std::bind(&Mutator::MutateString, mutator_, _1, |
| 404 | size_increase_hint_)); |
| 405 | } |
Vitaly Buka | 91ad7b0 | 2016-12-12 23:41:41 | [diff] [blame] | 406 | } |
| 407 | |
Vitaly Buka | b2c4fb5 | 2017-03-16 18:50:40 | [diff] [blame] | 408 | void Mutate(std::unique_ptr<Message>* message) const { |
| 409 | assert(!enforce_changes_); |
| 410 | assert(*message); |
Vitaly Buka | d7f943f | 2019-01-31 22:05:33 | [diff] [blame] | 411 | if (GetRandomBool(mutator_->random(), mutator_->random_to_default_ratio_)) |
| 412 | return; |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 413 | mutator_->MutateImpl(source_, message->get(), size_increase_hint_); |
Vitaly Buka | b2c4fb5 | 2017-03-16 18:50:40 | [diff] [blame] | 414 | } |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 415 | |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 416 | private: |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 417 | template <class T, class F> |
Vitaly Buka | d7f943f | 2019-01-31 22:05:33 | [diff] [blame] | 418 | void RepeatMutate(T* value, F mutate) const { |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 419 | if (!enforce_changes_ && |
Vitaly Buka | d7f943f | 2019-01-31 22:05:33 | [diff] [blame] | 420 | GetRandomBool(mutator_->random(), mutator_->random_to_default_ratio_)) { |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 421 | return; |
Vitaly Buka | b2c4fb5 | 2017-03-16 18:50:40 | [diff] [blame] | 422 | } |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 423 | T tmp = *value; |
| 424 | for (int i = 0; i < 10; ++i) { |
| 425 | *value = mutate(*value); |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 426 | if (!enforce_changes_ || *value != tmp) return; |
Vitaly Buka | 796b112 | 2017-03-03 22:42:02 | [diff] [blame] | 427 | } |
| 428 | } |
| 429 | |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 430 | int size_increase_hint_; |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 431 | size_t enforce_changes_; |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 432 | bool enforce_utf8_strings_; |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 433 | const protobuf::Message& source_; |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 434 | Mutator* mutator_; |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 435 | }; |
| 436 | |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 437 | namespace { |
| 438 | |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 439 | struct MutateField : public FieldFunction<MutateField> { |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 440 | template <class T> |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 441 | void ForType(const FieldInstance& field, int size_increase_hint, |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 442 | const protobuf::Message& source, Mutator* mutator) const { |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 443 | T value; |
| 444 | field.Load(&value); |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 445 | FieldMutator(size_increase_hint, true, field.EnforceUtf8(), source, mutator) |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 446 | .Mutate(&value); |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 447 | field.Store(value); |
| 448 | } |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 449 | }; |
| 450 | |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 451 | struct CreateField : public FieldFunction<CreateField> { |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 452 | public: |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 453 | template <class T> |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 454 | void ForType(const FieldInstance& field, int size_increase_hint, |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 455 | const protobuf::Message& source, Mutator* mutator) const { |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 456 | T value; |
| 457 | field.GetDefault(&value); |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 458 | FieldMutator field_mutator(size_increase_hint, |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 459 | false /* defaults could be useful */, |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 460 | field.EnforceUtf8(), source, mutator); |
Vitaly Buka | 0e9439f | 2017-03-16 00:51:57 | [diff] [blame] | 461 | field_mutator.Mutate(&value); |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 462 | field.Create(value); |
| 463 | } |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 464 | }; |
| 465 | |
| 466 | } // namespace |
| 467 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 468 | void Mutator::Seed(uint32_t value) { random_.seed(value); } |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 469 | |
Vitaly Buka | baa1329 | 2020-01-26 03:39:28 | [diff] [blame] | 470 | void Mutator::Mutate(Message* message, size_t max_size_hint) { |
| 471 | MutateImpl(*message, message, |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 472 | static_cast<int>(max_size_hint) - |
| 473 | static_cast<int>(message->ByteSizeLong())); |
Vitaly Buka | 0e17fd7 | 2016-11-18 18:02:46 | [diff] [blame] | 474 | |
Vitaly Buka | e4eae60 | 2017-09-29 00:28:12 | [diff] [blame] | 475 | InitializeAndTrim(message, kMaxInitializeDepth); |
Vitaly Buka | 9eaf063 | 2020-01-16 01:30:20 | [diff] [blame] | 476 | assert(IsInitialized(*message)); |
Vitaly Buka | 67387f7 | 2019-09-01 02:34:10 | [diff] [blame] | 477 | |
Peter Foley | fe76ed6 | 2019-10-01 00:03:37 | [diff] [blame] | 478 | if (!post_processors_.empty()) { |
| 479 | ApplyPostProcessing(message); |
| 480 | } |
| 481 | } |
| 482 | |
| 483 | void Mutator::RegisterPostProcessor(const protobuf::Descriptor* desc, |
| 484 | PostProcess callback) { |
| 485 | post_processors_.emplace(desc, callback); |
| 486 | } |
| 487 | |
| 488 | void Mutator::ApplyPostProcessing(Message* message) { |
| 489 | const Descriptor* descriptor = message->GetDescriptor(); |
| 490 | |
Vitaly Buka | ad520b3 | 2020-01-08 22:39:55 | [diff] [blame] | 491 | auto range = post_processors_.equal_range(descriptor); |
| 492 | for (auto it = range.first; it != range.second; ++it) |
Peter Foley | fe76ed6 | 2019-10-01 00:03:37 | [diff] [blame] | 493 | it->second(message, random_()); |
Peter Foley | fe76ed6 | 2019-10-01 00:03:37 | [diff] [blame] | 494 | |
| 495 | // Now recursively apply custom mutators. |
| 496 | const Reflection* reflection = message->GetReflection(); |
| 497 | for (int i = 0; i < descriptor->field_count(); i++) { |
| 498 | const FieldDescriptor* field = descriptor->field(i); |
| 499 | if (field->cpp_type() != FieldDescriptor::CPPTYPE_MESSAGE) { |
| 500 | continue; |
| 501 | } |
| 502 | if (field->is_repeated()) { |
| 503 | const int field_size = reflection->FieldSize(*message, field); |
| 504 | for (int j = 0; j < field_size; ++j) { |
| 505 | Message* nested_message = |
| 506 | reflection->MutableRepeatedMessage(message, field, j); |
| 507 | ApplyPostProcessing(nested_message); |
| 508 | } |
| 509 | } else if (reflection->HasField(*message, field)) { |
| 510 | Message* nested_message = reflection->MutableMessage(message, field); |
| 511 | ApplyPostProcessing(nested_message); |
| 512 | } |
| 513 | } |
Vitaly Buka | 00b6107 | 2016-10-19 23:22:51 | [diff] [blame] | 514 | } |
| 515 | |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 516 | void Mutator::MutateImpl(const Message& source, Message* message, |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 517 | int size_increase_hint) { |
| 518 | if (size_increase_hint > 0) size_increase_hint /= 2; |
Vitaly Buka | 3183b0d | 2019-09-06 22:11:10 | [diff] [blame] | 519 | for (;;) { |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 520 | MutationSampler mutation(keep_initialized_, size_increase_hint > 16, |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 521 | &random_, message); |
Vitaly Buka | 3183b0d | 2019-09-06 22:11:10 | [diff] [blame] | 522 | switch (mutation.mutation()) { |
| 523 | case Mutation::None: |
| 524 | return; |
| 525 | case Mutation::Add: |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 526 | CreateField()(mutation.field(), size_increase_hint, source, this); |
Vitaly Buka | 3183b0d | 2019-09-06 22:11:10 | [diff] [blame] | 527 | return; |
| 528 | case Mutation::Mutate: |
Vitaly Buka | 4908d25 | 2020-01-25 03:10:34 | [diff] [blame] | 529 | MutateField()(mutation.field(), size_increase_hint, source, this); |
Vitaly Buka | 3183b0d | 2019-09-06 22:11:10 | [diff] [blame] | 530 | return; |
| 531 | case Mutation::Delete: |
| 532 | DeleteField()(mutation.field()); |
| 533 | return; |
| 534 | case Mutation::Copy: { |
Vitaly Buka | 5cd166e | 2020-01-26 06:33:05 | [diff] [blame^] | 535 | DataSourceSampler source_sampler(mutation.field(), &random_, |
| 536 | size_increase_hint, source); |
Vitaly Buka | 0f63f91 | 2020-01-24 23:02:45 | [diff] [blame] | 537 | if (source_sampler.IsEmpty()) break; |
| 538 | CopyField()(source_sampler.field(), mutation.field()); |
Vitaly Buka | 3183b0d | 2019-09-06 22:11:10 | [diff] [blame] | 539 | return; |
| 540 | } |
| 541 | default: |
| 542 | assert(false && "unexpected mutation"); |
| 543 | return; |
| 544 | } |
| 545 | } |
| 546 | } |
| 547 | |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 548 | void Mutator::CrossOver(const protobuf::Message& message1, |
| 549 | protobuf::Message* message2) { |
Vitaly Buka | 142e08b | 2017-03-06 00:26:15 | [diff] [blame] | 550 | // CrossOver can produce result which still equals to inputs. So we backup |
| 551 | // message2 to later comparison. message1 is already constant. |
| 552 | std::unique_ptr<protobuf::Message> message2_copy(message2->New()); |
| 553 | message2_copy->CopyFrom(*message2); |
| 554 | |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 555 | CrossOverImpl(message1, message2); |
| 556 | |
Vitaly Buka | e4eae60 | 2017-09-29 00:28:12 | [diff] [blame] | 557 | InitializeAndTrim(message2, kMaxInitializeDepth); |
Vitaly Buka | 9eaf063 | 2020-01-16 01:30:20 | [diff] [blame] | 558 | assert(IsInitialized(*message2)); |
Vitaly Buka | 142e08b | 2017-03-06 00:26:15 | [diff] [blame] | 559 | |
Vitaly Buka | dd89da9 | 2019-10-08 17:08:02 | [diff] [blame] | 560 | if (!post_processors_.empty()) { |
| 561 | ApplyPostProcessing(message2); |
| 562 | } |
Vitaly Buka | 67387f7 | 2019-09-01 02:34:10 | [diff] [blame] | 563 | |
Vitaly Buka | 2d609df | 2017-03-07 07:29:47 | [diff] [blame] | 564 | // Can't call mutate from crossover because of a bug in libFuzzer. |
Vitaly Buka | 2d609df | 2017-03-07 07:29:47 | [diff] [blame] | 565 | // if (MessageDifferencer::Equals(*message2_copy, *message2) || |
| 566 | // MessageDifferencer::Equals(message1, *message2)) { |
| 567 | // Mutate(message2, 0); |
| 568 | // } |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 569 | } |
| 570 | |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 571 | void Mutator::CrossOverImpl(const protobuf::Message& message1, |
| 572 | protobuf::Message* message2) { |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 573 | const Descriptor* descriptor = message2->GetDescriptor(); |
| 574 | const Reflection* reflection = message2->GetReflection(); |
| 575 | assert(message1.GetDescriptor() == descriptor); |
| 576 | assert(message1.GetReflection() == reflection); |
| 577 | |
| 578 | for (int i = 0; i < descriptor->field_count(); ++i) { |
| 579 | const FieldDescriptor* field = descriptor->field(i); |
| 580 | |
| 581 | if (field->is_repeated()) { |
| 582 | const int field_size1 = reflection->FieldSize(message1, field); |
| 583 | int field_size2 = reflection->FieldSize(*message2, field); |
| 584 | for (int j = 0; j < field_size1; ++j) { |
| 585 | ConstFieldInstance source(&message1, field, j); |
| 586 | FieldInstance destination(message2, field, field_size2++); |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 587 | AppendField()(source, destination); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 588 | } |
| 589 | |
| 590 | assert(field_size2 == reflection->FieldSize(*message2, field)); |
| 591 | |
| 592 | // Shuffle |
| 593 | for (int j = 0; j < field_size2; ++j) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 594 | if (int k = GetRandomIndex(&random_, field_size2 - j)) { |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 595 | reflection->SwapElements(message2, field, j, j + k); |
| 596 | } |
| 597 | } |
| 598 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 599 | int keep = GetRandomIndex(&random_, field_size2 + 1); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 600 | |
| 601 | if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) { |
| 602 | int remove = field_size2 - keep; |
| 603 | // Cross some message to keep with messages to remove. |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 604 | int cross = GetRandomIndex(&random_, std::min(keep, remove) + 1); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 605 | for (int j = 0; j < cross; ++j) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 606 | int k = GetRandomIndex(&random_, keep); |
| 607 | int r = keep + GetRandomIndex(&random_, remove); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 608 | assert(k != r); |
| 609 | CrossOverImpl(reflection->GetRepeatedMessage(*message2, field, r), |
| 610 | reflection->MutableRepeatedMessage(message2, field, k)); |
| 611 | } |
| 612 | } |
| 613 | |
| 614 | for (int j = keep; j < field_size2; ++j) |
| 615 | reflection->RemoveLast(message2, field); |
| 616 | assert(keep == reflection->FieldSize(*message2, field)); |
| 617 | |
| 618 | } else if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) { |
| 619 | if (!reflection->HasField(message1, field)) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 620 | if (GetRandomBool(&random_)) |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 621 | DeleteField()(FieldInstance(message2, field)); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 622 | } else if (!reflection->HasField(*message2, field)) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 623 | if (GetRandomBool(&random_)) { |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 624 | ConstFieldInstance source(&message1, field); |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 625 | CopyField()(source, FieldInstance(message2, field)); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 626 | } |
| 627 | } else { |
| 628 | CrossOverImpl(reflection->GetMessage(message1, field), |
| 629 | reflection->MutableMessage(message2, field)); |
| 630 | } |
| 631 | } else { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 632 | if (GetRandomBool(&random_)) { |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 633 | if (reflection->HasField(message1, field)) { |
| 634 | ConstFieldInstance source(&message1, field); |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 635 | CopyField()(source, FieldInstance(message2, field)); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 636 | } else { |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 637 | DeleteField()(FieldInstance(message2, field)); |
Vitaly Buka | adfc27c | 2017-02-27 06:36:36 | [diff] [blame] | 638 | } |
| 639 | } |
| 640 | } |
| 641 | } |
| 642 | } |
| 643 | |
Vitaly Buka | e4eae60 | 2017-09-29 00:28:12 | [diff] [blame] | 644 | void Mutator::InitializeAndTrim(Message* message, int max_depth) { |
Vitaly Buka | 13245af | 2016-11-18 21:20:12 | [diff] [blame] | 645 | const Descriptor* descriptor = message->GetDescriptor(); |
| 646 | const Reflection* reflection = message->GetReflection(); |
Vitaly Buka | 13245af | 2016-11-18 21:20:12 | [diff] [blame] | 647 | for (int i = 0; i < descriptor->field_count(); ++i) { |
| 648 | const FieldDescriptor* field = descriptor->field(i); |
Vitaly Buka | 4200a1e | 2019-07-29 22:19:59 | [diff] [blame] | 649 | if (keep_initialized_ && |
| 650 | (field->is_required() || descriptor->options().map_entry()) && |
| 651 | !reflection->HasField(*message, field)) { |
Vitaly Buka | d4ab1e7 | 2017-03-04 07:51:19 | [diff] [blame] | 652 | CreateDefaultField()(FieldInstance(message, field)); |
Vitaly Buka | 4200a1e | 2019-07-29 22:19:59 | [diff] [blame] | 653 | } |
Vitaly Buka | 13245af | 2016-11-18 21:20:12 | [diff] [blame] | 654 | |
Vitaly Buka | e4eae60 | 2017-09-29 00:28:12 | [diff] [blame] | 655 | if (field->cpp_type() == FieldDescriptor::CPPTYPE_MESSAGE) { |
| 656 | if (max_depth <= 0 && !field->is_required()) { |
| 657 | // Clear deep optional fields to avoid stack overflow. |
| 658 | reflection->ClearField(message, field); |
| 659 | if (field->is_repeated()) |
| 660 | assert(!reflection->FieldSize(*message, field)); |
| 661 | else |
| 662 | assert(!reflection->HasField(*message, field)); |
| 663 | continue; |
| 664 | } |
| 665 | |
Vitaly Buka | 2cfe02b | 2016-11-19 00:34:09 | [diff] [blame] | 666 | if (field->is_repeated()) { |
| 667 | const int field_size = reflection->FieldSize(*message, field); |
| 668 | for (int j = 0; j < field_size; ++j) { |
| 669 | Message* nested_message = |
| 670 | reflection->MutableRepeatedMessage(message, field, j); |
Vitaly Buka | e4eae60 | 2017-09-29 00:28:12 | [diff] [blame] | 671 | InitializeAndTrim(nested_message, max_depth - 1); |
Vitaly Buka | 2cfe02b | 2016-11-19 00:34:09 | [diff] [blame] | 672 | } |
| 673 | } else if (reflection->HasField(*message, field)) { |
| 674 | Message* nested_message = reflection->MutableMessage(message, field); |
Vitaly Buka | e4eae60 | 2017-09-29 00:28:12 | [diff] [blame] | 675 | InitializeAndTrim(nested_message, max_depth - 1); |
Vitaly Buka | 13245af | 2016-11-18 21:20:12 | [diff] [blame] | 676 | } |
| 677 | } |
| 678 | } |
| 679 | } |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 680 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 681 | int32_t Mutator::MutateInt32(int32_t value) { return FlipBit(value, &random_); } |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 682 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 683 | int64_t Mutator::MutateInt64(int64_t value) { return FlipBit(value, &random_); } |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 684 | |
| 685 | uint32_t Mutator::MutateUInt32(uint32_t value) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 686 | return FlipBit(value, &random_); |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 687 | } |
| 688 | |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 689 | uint64_t Mutator::MutateUInt64(uint64_t value) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 690 | return FlipBit(value, &random_); |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 691 | } |
| 692 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 693 | float Mutator::MutateFloat(float value) { return FlipBit(value, &random_); } |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 694 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 695 | double Mutator::MutateDouble(double value) { return FlipBit(value, &random_); } |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 696 | |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 697 | bool Mutator::MutateBool(bool value) { return !value; } |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 698 | |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 699 | size_t Mutator::MutateEnum(size_t index, size_t item_count) { |
Vitaly Buka | ee1c76a | 2017-03-15 17:48:53 | [diff] [blame] | 700 | if (item_count <= 1) return 0; |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 701 | return (index + 1 + GetRandomIndex(&random_, item_count - 1)) % item_count; |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 702 | } |
| 703 | |
Vitaly Buka | e79e018 | 2017-03-02 00:02:14 | [diff] [blame] | 704 | std::string Mutator::MutateString(const std::string& value, |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 705 | int size_increase_hint) { |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 706 | std::string result = value; |
Vitaly Buka | 5d01320 | 2017-02-25 00:50:11 | [diff] [blame] | 707 | |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 708 | while (!result.empty() && GetRandomBool(&random_)) { |
| 709 | result.erase(GetRandomIndex(&random_, result.size()), 1); |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 710 | } |
| 711 | |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 712 | while (size_increase_hint > 0 && |
| 713 | result.size() < static_cast<size_t>(size_increase_hint) && |
| 714 | GetRandomBool(&random_)) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 715 | size_t index = GetRandomIndex(&random_, result.size() + 1); |
| 716 | result.insert(result.begin() + index, GetRandomIndex(&random_, 1 << 8)); |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 717 | } |
| 718 | |
Vitaly Buka | c020de1 | 2017-03-04 03:36:23 | [diff] [blame] | 719 | if (result != value) return result; |
| 720 | |
| 721 | if (result.empty()) { |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 722 | result.push_back(GetRandomIndex(&random_, 1 << 8)); |
Vitaly Buka | c020de1 | 2017-03-04 03:36:23 | [diff] [blame] | 723 | return result; |
| 724 | } |
| 725 | |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 726 | if (!result.empty()) |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 727 | FlipBit(result.size(), reinterpret_cast<uint8_t*>(&result[0]), &random_); |
Vitaly Buka | 4af611d | 2016-12-04 02:57:32 | [diff] [blame] | 728 | return result; |
| 729 | } |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 730 | |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 731 | std::string Mutator::MutateUtf8String(const std::string& value, |
Vitaly Buka | 1c91e72 | 2020-01-26 05:56:22 | [diff] [blame] | 732 | int size_increase_hint) { |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 733 | std::string str = MutateString(value, size_increase_hint); |
Vitaly Buka | 379f5ab | 2019-08-31 23:11:59 | [diff] [blame] | 734 | FixUtf8String(&str, &random_); |
Vitaly Buka | af8136f | 2017-06-09 23:40:12 | [diff] [blame] | 735 | return str; |
| 736 | } |
| 737 | |
Vitaly Buka | 9eaf063 | 2020-01-16 01:30:20 | [diff] [blame] | 738 | bool Mutator::IsInitialized(const Message& message) const { |
| 739 | if (!keep_initialized_ || message.IsInitialized()) return true; |
| 740 | std::cerr << "Uninitialized: " << message.DebugString() << "\n"; |
| 741 | return false; |
| 742 | } |
| 743 | |
Vitaly Buka | 432b545 | 2016-12-09 22:42:09 | [diff] [blame] | 744 | } // namespace protobuf_mutator |