blob: 09f3c4946ec16e232a4940c716dc58b7ee76eacc [file] [log] [blame]
Wyatt Heplerb7609542020-01-24 10:29:54 -08001// Copyright 2020 The Pigweed Authors
2//
3// Licensed under the Apache License, Version 2.0 (the "License"); you may not
4// use this file except in compliance with the License. You may obtain a copy of
5// the License at
6//
7// https://www.apache.org/licenses/LICENSE-2.0
8//
9// Unless required by applicable law or agreed to in writing, software
10// distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
11// WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
12// License for the specific language governing permissions and limitations under
13// the License.
14
Wyatt Heplerb7609542020-01-24 10:29:54 -080015#include "pw_kvs/key_value_store.h"
16
Wyatt Heplerbab0e202020-02-04 07:40:08 -080017#include <algorithm>
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -080018#include <cinttypes>
Wyatt Heplerb7609542020-01-24 10:29:54 -080019#include <cstring>
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -080020#include <type_traits>
Wyatt Heplerb7609542020-01-24 10:29:54 -080021
Keir Mierle8c352dc2020-02-02 13:58:19 -080022#define PW_LOG_USE_ULTRA_SHORT_NAMES 1
Wyatt Heplerbdd8e5a2020-02-20 19:27:26 -080023#include "pw_kvs/internal/entry.h"
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -080024#include "pw_kvs_private/macros.h"
Keir Mierle8c352dc2020-02-02 13:58:19 -080025#include "pw_log/log.h"
Wyatt Heplerb7609542020-01-24 10:29:54 -080026
Wyatt Hepler2ad60672020-01-21 08:00:16 -080027namespace pw::kvs {
Wyatt Heplera00d1ef2020-02-14 14:31:26 -080028namespace {
Wyatt Heplerb7609542020-01-24 10:29:54 -080029
Wyatt Hepleracaacf92020-01-24 10:58:30 -080030using std::byte;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -080031using std::string_view;
Wyatt Hepleracaacf92020-01-24 10:58:30 -080032
Wyatt Heplera00d1ef2020-02-14 14:31:26 -080033constexpr bool InvalidKey(std::string_view key) {
Wyatt Heplerbdd8e5a2020-02-20 19:27:26 -080034 return key.empty() || (key.size() > internal::Entry::kMaxKeyLength);
Wyatt Heplera00d1ef2020-02-14 14:31:26 -080035}
36
37} // namespace
38
Wyatt Heplerad0a7932020-02-06 08:20:38 -080039KeyValueStore::KeyValueStore(FlashPartition* partition,
Wyatt Hepler38ce30f2020-02-19 11:48:31 -080040 Vector<KeyDescriptor>& key_descriptor_list,
41 Vector<SectorDescriptor>& sector_descriptor_list,
Wyatt Hepler88adfe82020-02-20 19:33:27 -080042 const EntryFormat& format,
Wyatt Heplerad0a7932020-02-06 08:20:38 -080043 const Options& options)
44 : partition_(*partition),
45 entry_header_format_(format),
Wyatt Hepler38ce30f2020-02-19 11:48:31 -080046 key_descriptors_(key_descriptor_list),
Wyatt Heplerd2298282020-02-20 17:12:45 -080047 sectors_(sector_descriptor_list),
48 options_(options) {
49 Reset();
50}
Wyatt Heplerad0a7932020-02-06 08:20:38 -080051
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -080052Status KeyValueStore::Init() {
Wyatt Heplerd2298282020-02-20 17:12:45 -080053 Reset();
54
David Rogers2e9e0c82020-02-13 15:06:06 -080055 INF("Initializing key value store");
Wyatt Hepler38ce30f2020-02-19 11:48:31 -080056 if (partition_.sector_count() > sectors_.max_size()) {
David Rogers2e9e0c82020-02-13 15:06:06 -080057 ERR("KVS init failed: kMaxUsableSectors (=%zu) must be at least as "
58 "large as the number of sectors in the flash partition (=%zu)",
Wyatt Hepler38ce30f2020-02-19 11:48:31 -080059 sectors_.max_size(),
David Rogers2e9e0c82020-02-13 15:06:06 -080060 partition_.sector_count());
Wyatt Heplerad0a7932020-02-06 08:20:38 -080061 return Status::FAILED_PRECONDITION;
62 }
63
Keir Mierle8c352dc2020-02-02 13:58:19 -080064 const size_t sector_size_bytes = partition_.sector_size_bytes();
Keir Mierle8c352dc2020-02-02 13:58:19 -080065
David Rogersf0a35442020-02-04 12:16:38 -080066 if (working_buffer_.size() < sector_size_bytes) {
Wyatt Heplerce7b8df2020-02-21 10:38:39 -080067 ERR("KVS init failed: working_buffer_ (%zu B) is smaller than sector size "
68 "(%zu B)",
David Rogersf0a35442020-02-04 12:16:38 -080069 working_buffer_.size(),
70 sector_size_bytes);
71 return Status::INVALID_ARGUMENT;
72 }
73
Keir Mierle8c352dc2020-02-02 13:58:19 -080074 DBG("First pass: Read all entries from all sectors");
Wyatt Hepler2c7eca02020-02-18 16:01:42 -080075 Address sector_address = 0;
Keir Mierle8c352dc2020-02-02 13:58:19 -080076
Wyatt Heplerd2298282020-02-20 17:12:45 -080077 sectors_.assign(partition_.sector_count(),
78 SectorDescriptor(sector_size_bytes));
79
Alexei Frolovd4adf912020-02-21 13:29:15 -080080 size_t total_corrupt_bytes = 0;
81 int corrupt_entries = 0;
82
Wyatt Hepler2c7eca02020-02-18 16:01:42 -080083 for (SectorDescriptor& sector : sectors_) {
Keir Mierle8c352dc2020-02-02 13:58:19 -080084 Address entry_address = sector_address;
85
Alexei Frolovd4adf912020-02-21 13:29:15 -080086 size_t sector_corrupt_bytes = 0;
87
Wyatt Hepler2c7eca02020-02-18 16:01:42 -080088 for (int num_entries_in_sector = 0; true; num_entries_in_sector++) {
89 DBG("Load entry: sector=%" PRIx32 ", entry#=%d, address=%" PRIx32,
90 sector_address,
Keir Mierle8c352dc2020-02-02 13:58:19 -080091 num_entries_in_sector,
Wyatt Hepler2c7eca02020-02-18 16:01:42 -080092 entry_address);
Keir Mierle8c352dc2020-02-02 13:58:19 -080093
Wyatt Hepler2c7eca02020-02-18 16:01:42 -080094 if (!AddressInSector(sector, entry_address)) {
Keir Mierle8c352dc2020-02-02 13:58:19 -080095 DBG("Fell off end of sector; moving to the next sector");
96 break;
97 }
98
99 Address next_entry_address;
100 Status status = LoadEntry(entry_address, &next_entry_address);
101 if (status == Status::NOT_FOUND) {
102 DBG("Hit un-written data in sector; moving to the next sector");
103 break;
104 }
105 if (status == Status::DATA_LOSS) {
Alexei Frolovd4adf912020-02-21 13:29:15 -0800106 // The entry could not be read, indicating data corruption within the
107 // sector. Try to scan the remainder of the sector for other entries.
108 ERR("KVS init: data loss detected in sector %u at address %zu",
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800109 SectorIndex(&sector),
110 size_t(entry_address));
Alexei Frolovd4adf912020-02-21 13:29:15 -0800111
112 corrupt_entries++;
113
114 status = ScanForEntry(sector,
115 entry_address + Entry::kMinAlignmentBytes,
116 &next_entry_address);
117 if (status == Status::NOT_FOUND) {
118 // No further entries in this sector. Mark the remaining bytes in the
119 // sector as corrupt (since we can't reliably know the size of the
120 // corrupt entry).
121 sector_corrupt_bytes +=
122 sector_size_bytes - (entry_address - sector_address);
123 break;
124 }
125
126 if (!status.ok()) {
127 ERR("Unexpected error in KVS initialization: %s", status.str());
128 return Status::UNKNOWN;
129 }
130
131 sector_corrupt_bytes += next_entry_address - entry_address;
132 } else if (!status.ok()) {
133 ERR("Unexpected error in KVS initialization: %s", status.str());
134 return Status::UNKNOWN;
Keir Mierle8c352dc2020-02-02 13:58:19 -0800135 }
Keir Mierle8c352dc2020-02-02 13:58:19 -0800136
137 // Entry loaded successfully; so get ready to load the next one.
138 entry_address = next_entry_address;
139
140 // Update of the number of writable bytes in this sector.
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800141 sector.set_writable_bytes(sector_size_bytes -
142 (entry_address - sector_address));
Keir Mierle8c352dc2020-02-02 13:58:19 -0800143 }
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800144
Alexei Frolovd4adf912020-02-21 13:29:15 -0800145 if (sector_corrupt_bytes > 0) {
146 // If the sector contains corrupt data, prevent any further entries from
147 // being written to it by indicating that it has no space. This should
148 // also make it a decent GC candidate. Valid keys in the sector are still
149 // readable as normal.
150 sector.set_writable_bytes(0);
151
152 WRN("Sector %u contains %zuB of corrupt data",
153 SectorIndex(&sector),
154 sector_corrupt_bytes);
155 }
156
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800157 sector_address += sector_size_bytes;
Alexei Frolovd4adf912020-02-21 13:29:15 -0800158 total_corrupt_bytes += sector_corrupt_bytes;
Keir Mierle8c352dc2020-02-02 13:58:19 -0800159 }
160
161 DBG("Second pass: Count valid bytes in each sector");
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800162 const KeyDescriptor* newest_key = nullptr;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800163
Keir Mierle8c352dc2020-02-02 13:58:19 -0800164 // For every valid key, increment the valid bytes for that sector.
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800165 for (KeyDescriptor& key_descriptor : key_descriptors_) {
Wyatt Heplere541e072020-02-14 09:10:53 -0800166 Entry entry;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800167 TRY(Entry::Read(partition_, key_descriptor.address(), &entry));
168 SectorFromKey(key_descriptor)->AddValidBytes(entry.size());
169
170 if (key_descriptor.IsNewerThan(last_transaction_id_)) {
171 last_transaction_id_ = key_descriptor.transaction_id();
172 newest_key = &key_descriptor;
173 }
Keir Mierle8c352dc2020-02-02 13:58:19 -0800174 }
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800175
176 if (newest_key == nullptr) {
177 last_new_sector_ = sectors_.begin();
178 } else {
179 last_new_sector_ = SectorFromKey(newest_key);
180 }
181
Wyatt Hepler729f28c2020-02-05 09:46:00 -0800182 initialized_ = true;
David Rogers2e9e0c82020-02-13 15:06:06 -0800183
Armando Montanez5464d5f2020-02-20 10:12:20 -0800184 INF("KeyValueStore init complete: active keys %zu, deleted keys %zu, sectors "
David Rogers2e9e0c82020-02-13 15:06:06 -0800185 "%zu, logical sector size %zu bytes",
186 size(),
187 (key_descriptors_.size() - size()),
188 sectors_.size(),
189 partition_.sector_size_bytes());
190
Alexei Frolovd4adf912020-02-21 13:29:15 -0800191 if (total_corrupt_bytes > 0) {
192 WRN("Found %zu corrupt bytes and %d corrupt entries during init process; "
193 "some keys may be missing",
194 total_corrupt_bytes,
195 corrupt_entries);
196 return Status::DATA_LOSS;
197 }
198
Keir Mierle8c352dc2020-02-02 13:58:19 -0800199 return Status::OK;
200}
201
202Status KeyValueStore::LoadEntry(Address entry_address,
203 Address* next_entry_address) {
Wyatt Heplere541e072020-02-14 09:10:53 -0800204 Entry entry;
205 TRY(Entry::Read(partition_, entry_address, &entry));
Keir Mierle8c352dc2020-02-02 13:58:19 -0800206
207 // TODO: Handle multiple magics for formats that have changed.
Wyatt Heplere541e072020-02-14 09:10:53 -0800208 if (entry.magic() != entry_header_format_.magic) {
Keir Mierle8c352dc2020-02-02 13:58:19 -0800209 // TODO: It may be cleaner to have some logging helpers for these cases.
Wyatt Heplere541e072020-02-14 09:10:53 -0800210 ERR("Found corrupt magic: %zx; expecting %zx; at address %zx",
211 size_t(entry.magic()),
Keir Mierle8c352dc2020-02-02 13:58:19 -0800212 size_t(entry_header_format_.magic),
213 size_t(entry_address));
214 return Status::DATA_LOSS;
215 }
216
217 // Read the key from flash & validate the entry (which reads the value).
Wyatt Heplera00d1ef2020-02-14 14:31:26 -0800218 Entry::KeyBuffer key_buffer;
Wyatt Heplere541e072020-02-14 09:10:53 -0800219 TRY_ASSIGN(size_t key_length, entry.ReadKey(key_buffer));
220 const string_view key(key_buffer.data(), key_length);
Wyatt Heplerbab0e202020-02-04 07:40:08 -0800221
Wyatt Heplere541e072020-02-14 09:10:53 -0800222 TRY(entry.VerifyChecksumInFlash(entry_header_format_.checksum));
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800223 TRY(AppendNewOrOverwriteStaleExistingDescriptor(entry.descriptor(key)));
Keir Mierle8c352dc2020-02-02 13:58:19 -0800224
Wyatt Heplere541e072020-02-14 09:10:53 -0800225 *next_entry_address = entry.next_address();
Keir Mierle8c352dc2020-02-02 13:58:19 -0800226 return Status::OK;
227}
228
Alexei Frolovd4adf912020-02-21 13:29:15 -0800229// Scans flash memory within a sector to find a KVS entry magic.
230// TODO(frolv): This needs to be unit tested!
231Status KeyValueStore::ScanForEntry(const SectorDescriptor& sector,
232 Address start_address,
233 Address* next_entry_address) {
234 DBG("Scanning sector %u for entries starting from address %zx",
235 SectorIndex(&sector),
236 size_t(start_address));
237
238 // Entries must start at addresses which are aligned on a multiple of
239 // Entry::kMinAlignmentBytes. However, that multiple can vary between entries.
240 // When scanning, we don't have an entry to tell us what the current alignment
241 // is, so the minimum alignment is used to be exhaustive.
242 for (Address address = AlignUp(start_address, Entry::kMinAlignmentBytes);
243 AddressInSector(sector, address);
244 address += Entry::kMinAlignmentBytes) {
245 // TODO: Handle multiple magics for formats that have changed.
246 uint32_t magic;
247 TRY(partition_.Read(address, as_writable_bytes(span(&magic, 1))));
248 if (magic == entry_header_format_.magic) {
249 DBG("Found entry magic at address %zx", size_t(address));
250 *next_entry_address = address;
251 return Status::OK;
252 }
253 }
254
255 return Status::NOT_FOUND;
256}
257
Keir Mierle8c352dc2020-02-02 13:58:19 -0800258// TODO: This method is the trigger of the O(valid_entries * all_entries) time
259// complexity for reading. At some cost to memory, this could be optimized by
260// using a hash table instead of scanning, but in practice this should be fine
261// for a small number of keys
262Status KeyValueStore::AppendNewOrOverwriteStaleExistingDescriptor(
263 const KeyDescriptor& key_descriptor) {
264 // With the new key descriptor, either add it to the descriptor table or
265 // overwrite an existing entry with an older version of the key.
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800266 KeyDescriptor* existing_descriptor = FindDescriptor(key_descriptor.hash());
Keir Mierle8c352dc2020-02-02 13:58:19 -0800267
Wyatt Hepler5406a672020-02-18 15:42:38 -0800268 // Write a new entry.
269 if (existing_descriptor == nullptr) {
270 if (key_descriptors_.full()) {
271 return Status::RESOURCE_EXHAUSTED;
272 }
273 key_descriptors_.push_back(key_descriptor);
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800274 } else if (key_descriptor.IsNewerThan(
275 existing_descriptor->transaction_id())) {
Wyatt Hepler5406a672020-02-18 15:42:38 -0800276 // Existing entry is old; replace the existing entry with the new one.
277 *existing_descriptor = key_descriptor;
278 } else {
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800279 // Otherwise, check if the entries have a duplicate transaction ID, which is
280 // not valid.
281 if (existing_descriptor->transaction_id() ==
282 key_descriptor.transaction_id()) {
283 ERR("Data loss: Duplicated old(=%zu) and new(=%zu) transaction ID",
284 size_t(existing_descriptor->transaction_id()),
285 size_t(key_descriptor.transaction_id()));
Wyatt Hepler5406a672020-02-18 15:42:38 -0800286 return Status::DATA_LOSS;
287 }
288 DBG("Found stale entry when appending; ignoring");
Keir Mierle8c352dc2020-02-02 13:58:19 -0800289 }
Keir Mierle8c352dc2020-02-02 13:58:19 -0800290 return Status::OK;
291}
292
Keir Mierle8c352dc2020-02-02 13:58:19 -0800293KeyValueStore::KeyDescriptor* KeyValueStore::FindDescriptor(uint32_t hash) {
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800294 for (KeyDescriptor& key_descriptor : key_descriptors_) {
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800295 if (key_descriptor.hash() == hash) {
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800296 return &key_descriptor;
Keir Mierle8c352dc2020-02-02 13:58:19 -0800297 }
298 }
299 return nullptr;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800300}
301
302StatusWithSize KeyValueStore::Get(string_view key,
Wyatt Hepler5f6efc02020-02-18 16:54:31 -0800303 span<byte> value_buffer,
304 size_t offset_bytes) const {
Wyatt Hepler50f70772020-02-13 11:25:10 -0800305 TRY_WITH_SIZE(CheckOperation(key));
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800306
David Rogers2761aeb2020-01-31 17:09:00 -0800307 const KeyDescriptor* key_descriptor;
Wyatt Hepler2d401692020-02-13 16:01:23 -0800308 TRY_WITH_SIZE(FindExistingKeyDescriptor(key, &key_descriptor));
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800309
Wyatt Heplere541e072020-02-14 09:10:53 -0800310 Entry entry;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800311 TRY_WITH_SIZE(Entry::Read(partition_, key_descriptor->address(), &entry));
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800312
Wyatt Hepler5f6efc02020-02-18 16:54:31 -0800313 StatusWithSize result = entry.ReadValue(value_buffer, offset_bytes);
314 if (result.ok() && options_.verify_on_read && offset_bytes == 0u) {
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800315 Status verify_result = entry.VerifyChecksum(
316 entry_header_format_.checksum, key, value_buffer.first(result.size()));
David Rogerscf680ab2020-02-12 23:28:32 -0800317 if (!verify_result.ok()) {
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800318 std::memset(value_buffer.data(), 0, result.size());
Wyatt Hepler50f70772020-02-13 11:25:10 -0800319 return StatusWithSize(verify_result);
David Rogerscf680ab2020-02-12 23:28:32 -0800320 }
321
322 return StatusWithSize(verify_result, result.size());
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800323 }
324 return result;
325}
326
327Status KeyValueStore::Put(string_view key, span<const byte> value) {
Keir Mierle8c352dc2020-02-02 13:58:19 -0800328 DBG("Writing key/value; key length=%zu, value length=%zu",
329 key.size(),
330 value.size());
Wyatt Hepler729f28c2020-02-05 09:46:00 -0800331
332 TRY(CheckOperation(key));
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800333
Wyatt Hepler5406a672020-02-18 15:42:38 -0800334 if (Entry::size(partition_, key, value) > partition_.sector_size_bytes()) {
335 DBG("%zu B value with %zu B key cannot fit in one sector",
336 value.size(),
337 key.size());
338 return Status::INVALID_ARGUMENT;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800339 }
340
David Rogers2761aeb2020-01-31 17:09:00 -0800341 KeyDescriptor* key_descriptor;
Wyatt Hepler2d401692020-02-13 16:01:23 -0800342 Status status = FindKeyDescriptor(key, &key_descriptor);
343
344 if (status.ok()) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800345 DBG("Overwriting entry for key %#08" PRIx32 " in sector %u",
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800346 key_descriptor->hash(),
347 SectorIndex(SectorFromKey(key_descriptor)));
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800348 return WriteEntryForExistingKey(
349 key_descriptor, KeyDescriptor::kValid, key, value);
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800350 }
David Rogers2761aeb2020-01-31 17:09:00 -0800351
Wyatt Hepler2d401692020-02-13 16:01:23 -0800352 if (status == Status::NOT_FOUND) {
353 return WriteEntryForNewKey(key, value);
354 }
355
356 return status;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800357}
358
359Status KeyValueStore::Delete(string_view key) {
Wyatt Hepler729f28c2020-02-05 09:46:00 -0800360 TRY(CheckOperation(key));
361
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800362 KeyDescriptor* key_descriptor;
Wyatt Hepler2d401692020-02-13 16:01:23 -0800363 TRY(FindExistingKeyDescriptor(key, &key_descriptor));
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800364
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800365 DBG("Writing tombstone for key %#08" PRIx32 " in sector %u",
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800366 key_descriptor->hash(),
367 SectorIndex(SectorFromKey(key_descriptor)));
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800368 return WriteEntryForExistingKey(
369 key_descriptor, KeyDescriptor::kDeleted, key, {});
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800370}
371
372KeyValueStore::iterator& KeyValueStore::iterator::operator++() {
373 // Skip to the next entry that is valid (not deleted).
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800374 while (++index_ < item_.kvs_.key_descriptors_.size() &&
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800375 descriptor().deleted()) {
376 }
377 return *this;
378}
379
380const KeyValueStore::Item& KeyValueStore::iterator::operator*() {
381 std::memset(item_.key_buffer_.data(), 0, item_.key_buffer_.size());
382
Wyatt Heplere541e072020-02-14 09:10:53 -0800383 Entry entry;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800384 if (Entry::Read(item_.kvs_.partition_, descriptor().address(), &entry).ok()) {
Wyatt Heplere541e072020-02-14 09:10:53 -0800385 entry.ReadKey(item_.key_buffer_);
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800386 }
387
388 return item_;
389}
390
391KeyValueStore::iterator KeyValueStore::begin() const {
392 size_t i = 0;
393 // Skip over any deleted entries at the start of the descriptor list.
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800394 while (i < key_descriptors_.size() && key_descriptors_[i].deleted()) {
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800395 i += 1;
396 }
397 return iterator(*this, i);
398}
399
400// TODO(hepler): The valid entry count could be tracked in the KVS to avoid the
401// need for this for-loop.
402size_t KeyValueStore::size() const {
403 size_t valid_entries = 0;
404
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800405 for (const KeyDescriptor& key_descriptor : key_descriptors_) {
406 if (!key_descriptor.deleted()) {
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800407 valid_entries += 1;
408 }
409 }
410
411 return valid_entries;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800412}
413
Wyatt Heplered163b02020-02-03 17:49:32 -0800414StatusWithSize KeyValueStore::ValueSize(std::string_view key) const {
Wyatt Hepler50f70772020-02-13 11:25:10 -0800415 TRY_WITH_SIZE(CheckOperation(key));
Wyatt Heplered163b02020-02-03 17:49:32 -0800416
417 const KeyDescriptor* key_descriptor;
Wyatt Hepler2d401692020-02-13 16:01:23 -0800418 TRY_WITH_SIZE(FindExistingKeyDescriptor(key, &key_descriptor));
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800419
Wyatt Heplere541e072020-02-14 09:10:53 -0800420 Entry entry;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800421 TRY_WITH_SIZE(Entry::Read(partition_, key_descriptor->address(), &entry));
Wyatt Heplered163b02020-02-03 17:49:32 -0800422
Wyatt Heplere541e072020-02-14 09:10:53 -0800423 return StatusWithSize(entry.value_size());
Wyatt Heplered163b02020-02-03 17:49:32 -0800424}
425
Wyatt Hepler6e3a83b2020-02-04 07:36:45 -0800426Status KeyValueStore::FixedSizeGet(std::string_view key,
427 byte* value,
428 size_t size_bytes) const {
429 // Ensure that the size of the stored value matches the size of the type.
430 // Otherwise, report error. This check avoids potential memory corruption.
431 StatusWithSize result = ValueSize(key);
432 if (!result.ok()) {
433 return result.status();
Keir Mierle8c352dc2020-02-02 13:58:19 -0800434 }
Wyatt Hepler6e3a83b2020-02-04 07:36:45 -0800435 if (result.size() != size_bytes) {
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800436 DBG("Requested %zu B read, but value is %zu B", size_bytes, result.size());
Wyatt Hepler6e3a83b2020-02-04 07:36:45 -0800437 return Status::INVALID_ARGUMENT;
Wyatt Heplerbab0e202020-02-04 07:40:08 -0800438 }
Wyatt Hepler6e3a83b2020-02-04 07:36:45 -0800439 return Get(key, span(value, size_bytes)).status();
Keir Mierle8c352dc2020-02-02 13:58:19 -0800440}
441
Wyatt Hepler729f28c2020-02-05 09:46:00 -0800442Status KeyValueStore::CheckOperation(string_view key) const {
Wyatt Hepleracaacf92020-01-24 10:58:30 -0800443 if (InvalidKey(key)) {
Wyatt Heplerb7609542020-01-24 10:29:54 -0800444 return Status::INVALID_ARGUMENT;
445 }
Wyatt Heplerd2298282020-02-20 17:12:45 -0800446 if (!initialized()) {
Wyatt Heplerb7609542020-01-24 10:29:54 -0800447 return Status::FAILED_PRECONDITION;
448 }
Wyatt Heplerb7609542020-01-24 10:29:54 -0800449 return Status::OK;
450}
451
Wyatt Hepler2d401692020-02-13 16:01:23 -0800452// Searches for a KeyDescriptor that matches this key and sets *result to point
453// to it if one is found.
454//
455// OK: there is a matching descriptor and *result is set
456// NOT_FOUND: there is no descriptor that matches this key, but this key
457// has a unique hash (and could potentially be added to the KVS)
458// ALREADY_EXISTS: there is no descriptor that matches this key, but the
459// key's hash collides with the hash for an existing descriptor
460//
David Rogers2761aeb2020-01-31 17:09:00 -0800461Status KeyValueStore::FindKeyDescriptor(string_view key,
462 const KeyDescriptor** result) const {
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800463 const uint32_t hash = internal::Hash(key);
Wyatt Heplera00d1ef2020-02-14 14:31:26 -0800464 Entry::KeyBuffer key_buffer;
Wyatt Heplerb7609542020-01-24 10:29:54 -0800465
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800466 for (auto& descriptor : key_descriptors_) {
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800467 if (descriptor.hash() == hash) {
Wyatt Heplere541e072020-02-14 09:10:53 -0800468 TRY(Entry::ReadKey(
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800469 partition_, descriptor.address(), key.size(), key_buffer.data()));
Wyatt Heplerb7609542020-01-24 10:29:54 -0800470
Wyatt Heplere541e072020-02-14 09:10:53 -0800471 if (key == string_view(key_buffer.data(), key.size())) {
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800472 DBG("Found match for key hash 0x%08" PRIx32, hash);
David Rogers2761aeb2020-01-31 17:09:00 -0800473 *result = &descriptor;
Wyatt Heplerb7609542020-01-24 10:29:54 -0800474 return Status::OK;
Wyatt Hepler2d401692020-02-13 16:01:23 -0800475 } else {
476 WRN("Found key hash collision for 0x%08" PRIx32, hash);
477 return Status::ALREADY_EXISTS;
Wyatt Heplerb7609542020-01-24 10:29:54 -0800478 }
Wyatt Heplerb7609542020-01-24 10:29:54 -0800479 }
480 }
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800481 return Status::NOT_FOUND;
482}
483
Wyatt Hepler2d401692020-02-13 16:01:23 -0800484// Searches for a KeyDescriptor that matches this key and sets *result to point
485// to it if one is found.
486//
487// OK: there is a matching descriptor and *result is set
488// NOT_FOUND: there is no descriptor that matches this key
489//
490Status KeyValueStore::FindExistingKeyDescriptor(
491 string_view key, const KeyDescriptor** result) const {
492 Status status = FindKeyDescriptor(key, result);
493
494 // If the key's hash collides with an existing key or if the key is deleted,
495 // treat it as if it is not in the KVS.
496 if (status == Status::ALREADY_EXISTS ||
497 (status.ok() && (*result)->deleted())) {
498 return Status::NOT_FOUND;
499 }
500 return status;
501}
502
David Rogers2761aeb2020-01-31 17:09:00 -0800503Status KeyValueStore::WriteEntryForExistingKey(KeyDescriptor* key_descriptor,
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800504 KeyDescriptor::State new_state,
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800505 string_view key,
506 span<const byte> value) {
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800507 // Find the original entry and sector to update the sector's valid_bytes.
Wyatt Hepler30a52152020-02-12 11:26:05 -0800508 Entry original_entry;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800509 TRY(Entry::Read(partition_, key_descriptor->address(), &original_entry));
510 SectorDescriptor* old_sector = SectorFromKey(key_descriptor);
Wyatt Hepler6c24c062020-02-05 15:30:49 -0800511
David Rogers2761aeb2020-01-31 17:09:00 -0800512 SectorDescriptor* sector;
Wyatt Hepler5406a672020-02-18 15:42:38 -0800513 TRY(FindOrRecoverSectorWithSpace(&sector,
514 Entry::size(partition_, key, value)));
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800515 DBG("Writing existing entry; found sector %u (%#" PRIx32 ")",
516 SectorIndex(sector),
517 SectorBaseAddress(sector));
David Rogers3464d0a2020-02-07 11:45:46 -0800518
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800519 if (old_sector != SectorFromKey(key_descriptor)) {
David Rogers3464d0a2020-02-07 11:45:46 -0800520 DBG("Sector for old entry (size %zu) was garbage collected. Old entry "
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800521 "relocated to sector %u",
David Rogers3464d0a2020-02-07 11:45:46 -0800522 original_entry.size(),
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800523 SectorIndex(SectorFromKey(key_descriptor)));
David Rogers3464d0a2020-02-07 11:45:46 -0800524
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800525 old_sector = SectorFromKey(key_descriptor);
David Rogers3464d0a2020-02-07 11:45:46 -0800526 }
527
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800528 TRY(AppendEntry(sector, key_descriptor, key, value, new_state));
529
David Rogers3464d0a2020-02-07 11:45:46 -0800530 old_sector->RemoveValidBytes(original_entry.size());
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800531 return Status::OK;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800532}
533
534Status KeyValueStore::WriteEntryForNewKey(string_view key,
535 span<const byte> value) {
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800536 if (key_descriptors_.full()) {
Keir Mierle8c352dc2020-02-02 13:58:19 -0800537 WRN("KVS full: trying to store a new entry, but can't. Have %zu entries",
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800538 key_descriptors_.size());
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800539 return Status::RESOURCE_EXHAUSTED;
540 }
541
David Rogers2761aeb2020-01-31 17:09:00 -0800542 SectorDescriptor* sector;
Wyatt Hepler5406a672020-02-18 15:42:38 -0800543 TRY(FindOrRecoverSectorWithSpace(&sector,
544 Entry::size(partition_, key, value)));
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800545 DBG("Writing new entry; found sector: %u", SectorIndex(sector));
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800546
547 // Create the KeyDescriptor that will be added to the list. The transaction ID
548 // and address will be set by AppendEntry.
549 KeyDescriptor key_descriptor(key);
Wyatt Hepler0af6ad92020-02-13 15:54:46 -0800550 TRY(AppendEntry(sector, &key_descriptor, key, value, KeyDescriptor::kValid));
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800551
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800552 // Only add the entry when we are certain the write succeeded.
553 key_descriptors_.push_back(key_descriptor);
Wyatt Heplerb7609542020-01-24 10:29:54 -0800554 return Status::OK;
555}
556
David Rogers2761aeb2020-01-31 17:09:00 -0800557Status KeyValueStore::RelocateEntry(KeyDescriptor& key_descriptor) {
David Rogersf0a35442020-02-04 12:16:38 -0800558 struct TempEntry {
Wyatt Heplere541e072020-02-14 09:10:53 -0800559 Entry::KeyBuffer key;
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800560 std::array<byte, sizeof(working_buffer_) - sizeof(key)> value;
David Rogersf0a35442020-02-04 12:16:38 -0800561 };
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800562 auto [key_buffer, value_buffer] =
563 *std::launder(reinterpret_cast<TempEntry*>(working_buffer_.data()));
David Rogersf0a35442020-02-04 12:16:38 -0800564
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800565 DBG("Relocating entry at %zx for key %" PRIx32,
566 size_t(key_descriptor.address()),
567 key_descriptor.hash());
David Rogersdf025cd2020-02-06 17:05:34 -0800568
Wyatt Heplere541e072020-02-14 09:10:53 -0800569 // Read the entry to be relocated. Store the entry in a local variable and
David Rogersf0a35442020-02-04 12:16:38 -0800570 // store the key and value in the TempEntry stored in the static allocated
571 // working_buffer_.
Wyatt Heplere541e072020-02-14 09:10:53 -0800572 Entry entry;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800573 TRY(Entry::Read(partition_, key_descriptor.address(), &entry));
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800574
575 TRY_ASSIGN(size_t key_length, entry.ReadKey(key_buffer));
576 string_view key = string_view(key_buffer.data(), key_length);
577
578 StatusWithSize result = entry.ReadValue(value_buffer);
579 if (!result.ok()) {
David Rogersf0a35442020-02-04 12:16:38 -0800580 return Status::INTERNAL;
581 }
582
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800583 const span value = span(value_buffer.data(), result.size());
584 TRY(entry.VerifyChecksum(entry_header_format_.checksum, key, value));
David Rogersf0a35442020-02-04 12:16:38 -0800585
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800586 SectorDescriptor* old_sector = SectorFromKey(key_descriptor);
David Rogersf0a35442020-02-04 12:16:38 -0800587
588 // Find a new sector for the entry and write it to the new location.
David Rogers8ce55cd2020-02-04 19:41:48 -0800589 SectorDescriptor* new_sector;
Wyatt Heplere541e072020-02-14 09:10:53 -0800590 TRY(FindSectorWithSpace(&new_sector, entry.size(), old_sector, true));
Wyatt Heplerce7b8df2020-02-21 10:38:39 -0800591 TRY(AppendEntry(
592 new_sector, &key_descriptor, key, value, key_descriptor.state()));
David Rogersdf025cd2020-02-06 17:05:34 -0800593
Wyatt Heplerd2298282020-02-20 17:12:45 -0800594 // Do the valid bytes accounting for the sector the entry was relocated from.
Wyatt Heplere541e072020-02-14 09:10:53 -0800595 old_sector->RemoveValidBytes(entry.size());
David Rogersdf025cd2020-02-06 17:05:34 -0800596
597 return Status::OK;
David Rogersa12786b2020-01-31 16:02:33 -0800598}
599
David Rogers8db5a722020-02-03 18:28:34 -0800600// Find either an existing sector with enough space that is not the sector to
601// skip, or an empty sector. Maintains the invariant that there is always at
602// least 1 empty sector unless set to bypass the rule.
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800603Status KeyValueStore::FindSectorWithSpace(
604 SectorDescriptor** found_sector,
605 size_t size,
606 const SectorDescriptor* sector_to_skip,
607 bool bypass_empty_sector_rule) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800608 SectorDescriptor* first_empty_sector = nullptr;
609 bool at_least_two_empty_sectors = bypass_empty_sector_rule;
610
611 DBG("Find sector with %zu bytes available, starting with sector %u",
612 size,
613 SectorIndex(last_new_sector_));
614 if (sector_to_skip != nullptr) {
615 DBG(" Skip sector %u", SectorIndex(sector_to_skip));
616 }
617 if (bypass_empty_sector_rule) {
618 DBG(" Bypassing empty sector rule");
619 }
620
David Rogers8ce55cd2020-02-04 19:41:48 -0800621 // The last_new_sector_ is the sector that was last selected as the "new empty
622 // sector" to write to. This last new sector is used as the starting point for
623 // the next "find a new empty sector to write to" operation. By using the last
624 // new sector as the start point we will cycle which empty sector is selected
625 // next, spreading the wear across all the empty sectors and get a wear
626 // leveling benefit, rather than putting more wear on the lower number
627 // sectors.
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800628 SectorDescriptor* sector = last_new_sector_;
David Rogers67f4b6c2020-02-06 16:17:09 -0800629
David Rogers8ce55cd2020-02-04 19:41:48 -0800630 // Look for a partial sector to use with enough space. Immediately use the
631 // first one of those that is found. While scanning for a partial sector, keep
632 // track of the first empty sector and if a second sector was seen.
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800633 for (size_t j = 0; j < sectors_.size(); j++) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800634 sector += 1;
635 if (sector == sectors_.end()) {
636 sector = sectors_.begin();
637 }
Keir Mierle8c352dc2020-02-02 13:58:19 -0800638
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800639 if (sector_to_skip == sector) {
David Rogers8db5a722020-02-03 18:28:34 -0800640 continue;
641 }
642
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800643 const size_t sector_size_bytes = partition_.sector_size_bytes();
644 if (!sector->Empty(sector_size_bytes) && sector->HasSpace(size)) {
645 *found_sector = sector;
David Rogers8ce55cd2020-02-04 19:41:48 -0800646 return Status::OK;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800647 }
648
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800649 if (sector->Empty(sector_size_bytes)) {
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800650 if (first_empty_sector == nullptr) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800651 first_empty_sector = sector;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800652 } else {
653 at_least_two_empty_sectors = true;
Wyatt Hepler2ad60672020-01-21 08:00:16 -0800654 }
Wyatt Heplerb7609542020-01-24 10:29:54 -0800655 }
656 }
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800657
David Rogers8ce55cd2020-02-04 19:41:48 -0800658 // If the scan for a partial sector does not find a suitable sector, use the
659 // first empty sector that was found. Normally it is required to keep 1 empty
660 // sector after the sector found here, but that rule can be bypassed in
661 // special circumstances (such as during garbage collection).
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800662 if (at_least_two_empty_sectors) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800663 DBG(" Found a usable empty sector; returning the first found (%u)",
David Rogers8ce55cd2020-02-04 19:41:48 -0800664 SectorIndex(first_empty_sector));
665 last_new_sector_ = first_empty_sector;
666 *found_sector = first_empty_sector;
667 return Status::OK;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800668 }
David Rogers8ce55cd2020-02-04 19:41:48 -0800669
670 // No sector was found.
David Rogers67f4b6c2020-02-06 16:17:09 -0800671 DBG(" Unable to find a usable sector");
David Rogers8ce55cd2020-02-04 19:41:48 -0800672 *found_sector = nullptr;
673 return Status::RESOURCE_EXHAUSTED;
Wyatt Heplerb7609542020-01-24 10:29:54 -0800674}
675
David Rogers2761aeb2020-01-31 17:09:00 -0800676Status KeyValueStore::FindOrRecoverSectorWithSpace(SectorDescriptor** sector,
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800677 size_t size) {
David Rogers8ce55cd2020-02-04 19:41:48 -0800678 Status result = FindSectorWithSpace(sector, size);
Wyatt Hepler2d401692020-02-13 16:01:23 -0800679 if (result == Status::RESOURCE_EXHAUSTED && options_.partial_gc_on_write) {
David Rogers1541d612020-02-06 23:47:02 -0800680 // Garbage collect and then try again to find the best sector.
681 TRY(GarbageCollectOneSector());
682 return FindSectorWithSpace(sector, size);
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800683 }
David Rogers8ce55cd2020-02-04 19:41:48 -0800684 return result;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800685}
686
David Rogers2761aeb2020-01-31 17:09:00 -0800687KeyValueStore::SectorDescriptor* KeyValueStore::FindSectorToGarbageCollect() {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800688 const size_t sector_size_bytes = partition_.sector_size_bytes();
David Rogers2761aeb2020-01-31 17:09:00 -0800689 SectorDescriptor* sector_candidate = nullptr;
David Rogersa12786b2020-01-31 16:02:33 -0800690 size_t candidate_bytes = 0;
691
692 // Step 1: Try to find a sectors with stale keys and no valid keys (no
693 // relocation needed). If any such sectors are found, use the sector with the
694 // most reclaimable bytes.
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800695 for (auto& sector : sectors_) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800696 if ((sector.valid_bytes() == 0) &&
697 (sector.RecoverableBytes(sector_size_bytes) > candidate_bytes)) {
David Rogersa12786b2020-01-31 16:02:33 -0800698 sector_candidate = &sector;
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800699 candidate_bytes = sector.RecoverableBytes(sector_size_bytes);
David Rogersa12786b2020-01-31 16:02:33 -0800700 }
701 }
702
703 // Step 2: If step 1 yields no sectors, just find the sector with the most
704 // reclaimable bytes.
705 if (sector_candidate == nullptr) {
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800706 for (auto& sector : sectors_) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800707 if (sector.RecoverableBytes(sector_size_bytes) > candidate_bytes) {
David Rogersa12786b2020-01-31 16:02:33 -0800708 sector_candidate = &sector;
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800709 candidate_bytes = sector.RecoverableBytes(sector_size_bytes);
David Rogersa12786b2020-01-31 16:02:33 -0800710 }
711 }
712 }
713
David Rogers5981f312020-02-13 13:33:56 -0800714 if (sector_candidate != nullptr) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800715 DBG("Found sector %u to Garbage Collect, %zu recoverable bytes",
David Rogers5981f312020-02-13 13:33:56 -0800716 SectorIndex(sector_candidate),
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800717 sector_candidate->RecoverableBytes(sector_size_bytes));
David Rogers5981f312020-02-13 13:33:56 -0800718 } else {
719 DBG("Unable to find sector to garbage collect!");
720 }
David Rogersa12786b2020-01-31 16:02:33 -0800721 return sector_candidate;
722}
723
David Rogers1541d612020-02-06 23:47:02 -0800724Status KeyValueStore::GarbageCollectOneSector() {
David Rogers67f4b6c2020-02-06 16:17:09 -0800725 DBG("Garbage Collect a single sector");
726
David Rogersa12786b2020-01-31 16:02:33 -0800727 // Step 1: Find the sector to garbage collect
David Rogers2761aeb2020-01-31 17:09:00 -0800728 SectorDescriptor* sector_to_gc = FindSectorToGarbageCollect();
David Rogers3464d0a2020-02-07 11:45:46 -0800729 LogSectors();
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800730
David Rogersa12786b2020-01-31 16:02:33 -0800731 if (sector_to_gc == nullptr) {
732 return Status::RESOURCE_EXHAUSTED;
733 }
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800734
David Rogersa12786b2020-01-31 16:02:33 -0800735 // Step 2: Move any valid entries in the GC sector to other sectors
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800736 if (sector_to_gc->valid_bytes() != 0) {
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800737 for (auto& descriptor : key_descriptors_) {
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800738 if (AddressInSector(*sector_to_gc, descriptor.address())) {
David Rogers67f4b6c2020-02-06 16:17:09 -0800739 DBG(" Relocate entry");
David Rogers2761aeb2020-01-31 17:09:00 -0800740 TRY(RelocateEntry(descriptor));
David Rogersa12786b2020-01-31 16:02:33 -0800741 }
Wyatt Heplerb7609542020-01-24 10:29:54 -0800742 }
743 }
Wyatt Heplerb7609542020-01-24 10:29:54 -0800744
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800745 if (sector_to_gc->valid_bytes() != 0) {
David Rogers67f4b6c2020-02-06 16:17:09 -0800746 ERR(" Failed to relocate valid entries from sector being garbage "
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800747 "collected, %zu valid bytes remain",
748 sector_to_gc->valid_bytes());
Wyatt Heplerb7609542020-01-24 10:29:54 -0800749 return Status::INTERNAL;
750 }
751
David Rogersa12786b2020-01-31 16:02:33 -0800752 // Step 3: Reinitialize the sector
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800753 sector_to_gc->set_writable_bytes(0);
David Rogersa12786b2020-01-31 16:02:33 -0800754 TRY(partition_.Erase(SectorBaseAddress(sector_to_gc), 1));
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800755 sector_to_gc->set_writable_bytes(partition_.sector_size_bytes());
Wyatt Heplerb7609542020-01-24 10:29:54 -0800756
David Rogers67f4b6c2020-02-06 16:17:09 -0800757 DBG(" Garbage Collect complete");
David Rogers50185ad2020-02-07 00:02:46 -0800758 LogSectors();
David Rogersa12786b2020-01-31 16:02:33 -0800759 return Status::OK;
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800760}
761
David Rogers2761aeb2020-01-31 17:09:00 -0800762Status KeyValueStore::AppendEntry(SectorDescriptor* sector,
763 KeyDescriptor* key_descriptor,
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800764 string_view key,
Wyatt Hepler5a33d8c2020-02-06 09:32:58 -0800765 span<const byte> value,
766 KeyDescriptor::State new_state) {
Wyatt Heplere541e072020-02-14 09:10:53 -0800767 const Address address = NextWritableAddress(sector);
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800768 Entry entry = CreateEntry(address, key, value, new_state);
Wyatt Heplere541e072020-02-14 09:10:53 -0800769
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800770 DBG("Appending %zu B entry with transaction ID %" PRIu32 " to address %#zx",
Wyatt Heplere541e072020-02-14 09:10:53 -0800771 entry.size(),
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800772 entry.transaction_id(),
773 size_t(address));
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800774
David Rogers6592d292020-02-14 14:19:26 -0800775 StatusWithSize result = entry.Write(key, value);
776 // Remove any bytes that were written, even if the write was not successful.
Keir Mierle0a52aed2020-02-21 09:24:36 -0800777 // This is important to retain the writable space invariant on the sectors.
David Rogers6592d292020-02-14 14:19:26 -0800778 sector->RemoveWritableBytes(result.size());
779
780 if (!result.ok()) {
Keir Mierle0a52aed2020-02-21 09:24:36 -0800781 // TODO: Once fake flash errors are supported in tests, test this branch.
782 ERR("Failed to write %zu bytes at %" PRIx32 ". %zu actually written",
David Rogers6592d292020-02-14 14:19:26 -0800783 entry.size(),
Keir Mierle0a52aed2020-02-21 09:24:36 -0800784 address,
David Rogers6592d292020-02-14 14:19:26 -0800785 result.size());
786 return result.status();
787 }
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800788
789 if (options_.verify_on_write) {
Wyatt Heplere541e072020-02-14 09:10:53 -0800790 TRY(entry.VerifyChecksumInFlash(entry_header_format_.checksum));
Wyatt Heplerb7609542020-01-24 10:29:54 -0800791 }
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800792
Keir Mierle9e38b402020-02-21 13:06:21 -0800793 // Entry was written successfully; update the key descriptor and the sector
794 // descriptor to reflect the new entry.
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800795 entry.UpdateDescriptor(key_descriptor);
David Rogers6592d292020-02-14 14:19:26 -0800796 sector->AddValidBytes(result.size());
Wyatt Hepler4da1fcb2020-01-30 17:32:18 -0800797 return Status::OK;
Wyatt Heplerb7609542020-01-24 10:29:54 -0800798}
799
Wyatt Heplerbdd8e5a2020-02-20 19:27:26 -0800800KeyValueStore::Entry KeyValueStore::CreateEntry(Address address,
801 std::string_view key,
802 span<const byte> value,
803 KeyDescriptor::State state) {
Keir Mierle9e38b402020-02-21 13:06:21 -0800804 // Always bump the transaction ID when creating a new entry.
805 //
806 // Burning transaction IDs prevents inconsistencies between flash and memory
807 // that which could happen if a write succeeds, but for some reason the read
808 // and verify step fails. Here's how this would happen:
809 //
810 // 1. The entry is written but for some reason the flash reports failure OR
811 // The write succeeds, but the read / verify operation fails.
812 // 2. The transaction ID is NOT incremented, because of the failure
813 // 3. (later) A new entry is written, re-using the transaction ID (oops)
814 //
815 // By always burning transaction IDs, the above problem can't happen.
816 last_transaction_id_ += 1;
817
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800818 if (state == KeyDescriptor::kDeleted) {
819 return Entry::Tombstone(partition_,
820 address,
Wyatt Hepler88adfe82020-02-20 19:33:27 -0800821 entry_header_format_,
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800822 key,
823 partition_.alignment_bytes(),
Keir Mierle9e38b402020-02-21 13:06:21 -0800824 last_transaction_id_);
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800825 }
826 return Entry::Valid(partition_,
827 address,
Wyatt Hepler88adfe82020-02-20 19:33:27 -0800828 entry_header_format_,
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800829 key,
830 value,
831 partition_.alignment_bytes(),
Keir Mierle9e38b402020-02-21 13:06:21 -0800832 last_transaction_id_);
Wyatt Heplerd2298282020-02-20 17:12:45 -0800833}
834
835void KeyValueStore::Reset() {
836 initialized_ = false;
837 key_descriptors_.clear();
838 last_new_sector_ = nullptr;
839 last_transaction_id_ = 0;
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800840}
841
Keir Mierle8c352dc2020-02-02 13:58:19 -0800842void KeyValueStore::LogDebugInfo() {
Keir Mierle8c352dc2020-02-02 13:58:19 -0800843 const size_t sector_size_bytes = partition_.sector_size_bytes();
844 DBG("====================== KEY VALUE STORE DUMP =========================");
845 DBG(" ");
846 DBG("Flash partition:");
Wyatt Heplerad0a7932020-02-06 08:20:38 -0800847 DBG(" Sector count = %zu", partition_.sector_count());
Wyatt Hepler38ce30f2020-02-19 11:48:31 -0800848 DBG(" Sector max count = %zu", sectors_.max_size());
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800849 DBG(" Sectors in use = %zu", sectors_.size());
Keir Mierle8c352dc2020-02-02 13:58:19 -0800850 DBG(" Sector size = %zu", sector_size_bytes);
851 DBG(" Total size = %zu", partition_.size_bytes());
852 DBG(" Alignment = %zu", partition_.alignment_bytes());
853 DBG(" ");
854 DBG("Key descriptors:");
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800855 DBG(" Entry count = %zu", key_descriptors_.size());
Wyatt Hepler38ce30f2020-02-19 11:48:31 -0800856 DBG(" Max entry count = %zu", key_descriptors_.max_size());
Keir Mierle8c352dc2020-02-02 13:58:19 -0800857 DBG(" ");
858 DBG(" # hash version address address (hex)");
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800859 for (size_t i = 0; i < key_descriptors_.size(); ++i) {
860 const KeyDescriptor& kd = key_descriptors_[i];
Keir Mierle8c352dc2020-02-02 13:58:19 -0800861 DBG(" |%3zu: | %8zx |%8zu | %8zu | %8zx",
862 i,
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800863 size_t(kd.hash()),
864 size_t(kd.transaction_id()),
865 size_t(kd.address()),
866 size_t(kd.address()));
Keir Mierle8c352dc2020-02-02 13:58:19 -0800867 }
868 DBG(" ");
869
870 DBG("Sector descriptors:");
871 DBG(" # tail free valid has_space");
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800872 for (size_t sector_id = 0; sector_id < sectors_.size(); ++sector_id) {
873 const SectorDescriptor& sd = sectors_[sector_id];
Keir Mierle8c352dc2020-02-02 13:58:19 -0800874 DBG(" |%3zu: | %8zu |%8zu | %s",
875 sector_id,
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800876 size_t(sd.writable_bytes()),
877 sd.valid_bytes(),
878 sd.writable_bytes() ? "YES" : "");
Keir Mierle8c352dc2020-02-02 13:58:19 -0800879 }
880 DBG(" ");
881
882 // TODO: This should stop logging after some threshold.
883 // size_t dumped_bytes = 0;
884 DBG("Sector raw data:");
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800885 for (size_t sector_id = 0; sector_id < sectors_.size(); ++sector_id) {
Keir Mierle8c352dc2020-02-02 13:58:19 -0800886 // Read sector data. Yes, this will blow the stack on embedded.
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800887 std::array<byte, 500> raw_sector_data; // TODO!!!
Keir Mierle8c352dc2020-02-02 13:58:19 -0800888 StatusWithSize sws =
889 partition_.Read(sector_id * sector_size_bytes, raw_sector_data);
890 DBG("Read: %zu bytes", sws.size());
891
892 DBG(" base addr offs 0 1 2 3 4 5 6 7");
893 for (size_t i = 0; i < sector_size_bytes; i += 8) {
894 DBG(" %3zu %8zx %5zu | %02x %02x %02x %02x %02x %02x %02x %02x",
895 sector_id,
896 (sector_id * sector_size_bytes) + i,
897 i,
898 static_cast<unsigned int>(raw_sector_data[i + 0]),
899 static_cast<unsigned int>(raw_sector_data[i + 1]),
900 static_cast<unsigned int>(raw_sector_data[i + 2]),
901 static_cast<unsigned int>(raw_sector_data[i + 3]),
902 static_cast<unsigned int>(raw_sector_data[i + 4]),
903 static_cast<unsigned int>(raw_sector_data[i + 5]),
904 static_cast<unsigned int>(raw_sector_data[i + 6]),
905 static_cast<unsigned int>(raw_sector_data[i + 7]));
906
907 // TODO: Fix exit condition.
908 if (i > 128) {
909 break;
910 }
911 }
912 DBG(" ");
913 }
914
915 DBG("////////////////////// KEY VALUE STORE DUMP END /////////////////////");
916}
917
David Rogerscf680ab2020-02-12 23:28:32 -0800918void KeyValueStore::LogSectors() const {
919 DBG("Sector descriptors: count %zu", sectors_.size());
Wyatt Hepler1c329ca2020-02-07 18:07:23 -0800920 for (auto& sector : sectors_) {
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800921 DBG(" - Sector %u: valid %zu, recoverable %zu, free %zu",
David Rogers50185ad2020-02-07 00:02:46 -0800922 SectorIndex(&sector),
Wyatt Hepler2c7eca02020-02-18 16:01:42 -0800923 sector.valid_bytes(),
924 sector.RecoverableBytes(partition_.sector_size_bytes()),
925 sector.writable_bytes());
David Rogers50185ad2020-02-07 00:02:46 -0800926 }
927}
928
David Rogerscf680ab2020-02-12 23:28:32 -0800929void KeyValueStore::LogKeyDescriptor() const {
930 DBG("Key descriptors: count %zu", key_descriptors_.size());
931 for (auto& key : key_descriptors_) {
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800932 DBG(" - Key: %s, hash %#zx, transaction ID %zu, address %#zx",
David Rogerscf680ab2020-02-12 23:28:32 -0800933 key.deleted() ? "Deleted" : "Valid",
Wyatt Hepler1fc11042020-02-19 17:17:51 -0800934 static_cast<size_t>(key.hash()),
935 static_cast<size_t>(key.transaction_id()),
936 static_cast<size_t>(key.address()));
David Rogerscf680ab2020-02-12 23:28:32 -0800937 }
938}
939
Wyatt Hepler2ad60672020-01-21 08:00:16 -0800940} // namespace pw::kvs