// Copyright 2020 The Pigweed Authors
//
// Licensed under the Apache License, Version 2.0 (the "License"); you may not
// use this file except in compliance with the License. You may obtain a copy of
// the License at
//
//     https://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS, WITHOUT
// WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the
// License for the specific language governing permissions and limitations under
// the License.

#include "pw_kvs/key_value_store.h"

#include <algorithm>
#include <cinttypes>
#include <cstring>
#include <type_traits>

#include "pw_kvs/format.h"

#define PW_LOG_USE_ULTRA_SHORT_NAMES 1
#include "pw_kvs/internal/entry.h"
#include "pw_kvs_private/macros.h"
#include "pw_log/log.h"

namespace pw::kvs {
namespace {

using std::byte;
using std::string_view;

constexpr bool InvalidKey(std::string_view key) {
  return key.empty() || (key.size() > internal::Entry::kMaxKeyLength);
}

}  // namespace

KeyValueStore::KeyValueStore(FlashPartition* partition,
                             Vector<KeyDescriptor>& key_descriptor_list,
                             Vector<SectorDescriptor>& sector_descriptor_list,
                             span<const EntryFormat> formats,
                             const Options& options)
    : partition_(*partition),
      formats_(formats),
      key_descriptors_(key_descriptor_list),
      sectors_(sector_descriptor_list),
      options_(options) {
  Reset();
}

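// Initializes the KVS in two passes over flash: the first pass reads every
// entry in every sector to rebuild the key descriptor table (scanning past
// corrupt data where needed), and the second pass tallies the valid bytes in
// each sector and restores the last transaction ID.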
Status KeyValueStore::Init() {
  Reset();

  INF("Initializing key value store");
  if (partition_.sector_count() > sectors_.max_size()) {
    ERR("KVS init failed: kMaxUsableSectors (=%zu) must be at least as "
        "large as the number of sectors in the flash partition (=%zu)",
        sectors_.max_size(),
        partition_.sector_count());
    return Status::FAILED_PRECONDITION;
  }

  const size_t sector_size_bytes = partition_.sector_size_bytes();

  if (working_buffer_.size() < sector_size_bytes) {
    ERR("KVS init failed: working_buffer_ (%zu B) is smaller than sector size "
        "(%zu B)",
        working_buffer_.size(),
        sector_size_bytes);
    return Status::INVALID_ARGUMENT;
  }

  DBG("First pass: Read all entries from all sectors");
  Address sector_address = 0;

  sectors_.assign(partition_.sector_count(),
                  SectorDescriptor(sector_size_bytes));

  size_t total_corrupt_bytes = 0;
  int corrupt_entries = 0;
  bool empty_sector_found = false;

  for (SectorDescriptor& sector : sectors_) {
    Address entry_address = sector_address;

    size_t sector_corrupt_bytes = 0;

    for (int num_entries_in_sector = 0; true; num_entries_in_sector++) {
      DBG("Load entry: sector=%" PRIx32 ", entry#=%d, address=%" PRIx32,
          sector_address,
          num_entries_in_sector,
          entry_address);

      if (!AddressInSector(sector, entry_address)) {
        DBG("Fell off end of sector; moving to the next sector");
        break;
      }

      Address next_entry_address;
      Status status = LoadEntry(entry_address, &next_entry_address);
      if (status == Status::NOT_FOUND) {
        DBG("Hit un-written data in sector; moving to the next sector");
        break;
      }
      if (status == Status::DATA_LOSS) {
        // The entry could not be read, indicating data corruption within the
        // sector. Try to scan the remainder of the sector for other entries.
        WRN("KVS init: data loss detected in sector %u at address %zu",
            SectorIndex(&sector),
            size_t(entry_address));

        corrupt_entries++;

        status = ScanForEntry(sector,
                              entry_address + Entry::kMinAlignmentBytes,
                              &next_entry_address);
        if (status == Status::NOT_FOUND) {
          // No further entries in this sector. Mark the remaining bytes in the
          // sector as corrupt (since we can't reliably know the size of the
          // corrupt entry).
          sector_corrupt_bytes +=
              sector_size_bytes - (entry_address - sector_address);
          break;
        }

        if (!status.ok()) {
          ERR("Unexpected error in KVS initialization: %s", status.str());
          return Status::UNKNOWN;
        }

        sector_corrupt_bytes += next_entry_address - entry_address;
      } else if (!status.ok()) {
        ERR("Unexpected error in KVS initialization: %s", status.str());
        return Status::UNKNOWN;
      }

      // Entry loaded successfully, so get ready to load the next one.
      entry_address = next_entry_address;

      // Update the number of writable bytes in this sector.
      sector.set_writable_bytes(sector_size_bytes -
                                (entry_address - sector_address));
    }

    if (sector_corrupt_bytes > 0) {
      // If the sector contains corrupt data, prevent any further entries from
      // being written to it by indicating that it has no space. This should
      // also make it a decent GC candidate. Valid keys in the sector are still
      // readable as normal.
      sector.set_writable_bytes(0);

      WRN("Sector %u contains %zuB of corrupt data",
          SectorIndex(&sector),
          sector_corrupt_bytes);
    }

    if (sector.Empty(sector_size_bytes)) {
      empty_sector_found = true;
    }
    sector_address += sector_size_bytes;
    total_corrupt_bytes += sector_corrupt_bytes;
  }

  DBG("Second pass: Count valid bytes in each sector");
  const KeyDescriptor* newest_key = nullptr;

  // For every valid key, increment the valid bytes for that sector.
  for (KeyDescriptor& key_descriptor : key_descriptors_) {
    for (auto& address : key_descriptor.addresses()) {
      Entry entry;
      TRY(Entry::Read(partition_, address, formats_, &entry));
      SectorFromAddress(address)->AddValidBytes(entry.size());
    }
    if (key_descriptor.IsNewerThan(last_transaction_id_)) {
      last_transaction_id_ = key_descriptor.transaction_id();
      newest_key = &key_descriptor;
    }
  }

  if (newest_key == nullptr) {
    last_new_sector_ = sectors_.begin();
  } else {
    last_new_sector_ = SectorFromAddress(newest_key->addresses().back());
  }

  if (!empty_sector_found) {
    // TODO: Record/report the error condition and recovery result.
    Status gc_result = GarbageCollectPartial();

    if (!gc_result.ok()) {
      ERR("KVS init failed: Unable to maintain required free sector");
      return Status::INTERNAL;
    }
  }

  initialized_ = true;

  INF("KeyValueStore init complete: active keys %zu, deleted keys %zu, sectors "
      "%zu, logical sector size %zu bytes",
      size(),
      (key_descriptors_.size() - size()),
      sectors_.size(),
      partition_.sector_size_bytes());

  if (total_corrupt_bytes > 0) {
    WRN("Found %zu corrupt bytes and %d corrupt entries during init process; "
        "some keys may be missing",
        total_corrupt_bytes,
        corrupt_entries);
    return Status::DATA_LOSS;
  }

  return Status::OK;
}

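// Summarizes sector usage. One empty sector is reserved for garbage
// collection, so the first empty sector seen is not counted as writable space.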
KeyValueStore::StorageStats KeyValueStore::GetStorageStats() const {
  StorageStats stats{0, 0, 0};
  const size_t sector_size = partition_.sector_size_bytes();
  bool found_empty_sector = false;

  for (const SectorDescriptor& sector : sectors_) {
    stats.in_use_bytes += sector.valid_bytes();
    stats.reclaimable_bytes += sector.RecoverableBytes(sector_size);

    if (!found_empty_sector && sector.Empty(sector_size)) {
      // The KVS tries to always keep an empty sector for GC, so don't count
      // the first empty sector seen as writable space. However, a free sector
      // cannot always be assumed to exist; if a GC operation fails, all sectors
      // may be partially written, in which case the space reported might be
      // inaccurate.
      found_empty_sector = true;
      continue;
    }

    stats.writable_bytes += sector.writable_bytes();
  }

  return stats;
}

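// Reads and validates the entry at entry_address, then records it in the key
// descriptor table. On success, *next_entry_address is set to the address
// following the entry.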
Status KeyValueStore::LoadEntry(Address entry_address,
                                Address* next_entry_address) {
  Entry entry;
  TRY(Entry::Read(partition_, entry_address, formats_, &entry));

  // Read the key from flash & validate the entry (which reads the value).
  Entry::KeyBuffer key_buffer;
  TRY_ASSIGN(size_t key_length, entry.ReadKey(key_buffer));
  const string_view key(key_buffer.data(), key_length);

  TRY(entry.VerifyChecksumInFlash());

  // A valid entry was found, so update the next entry address before doing any
  // of the checks that happen in AppendNewOrOverwriteStaleExistingDescriptor().
  *next_entry_address = entry.next_address();
  TRY(AppendNewOrOverwriteStaleExistingDescriptor(entry.descriptor(key)));

  return Status::OK;
}

// Scans flash memory within a sector to find a KVS entry magic.
Status KeyValueStore::ScanForEntry(const SectorDescriptor& sector,
                                   Address start_address,
                                   Address* next_entry_address) {
  DBG("Scanning sector %u for entries starting from address %zx",
      SectorIndex(&sector),
      size_t(start_address));

  // Entries must start at addresses which are aligned on a multiple of
  // Entry::kMinAlignmentBytes. However, that multiple can vary between entries.
  // When scanning, we don't have an entry to tell us what the current alignment
  // is, so the minimum alignment is used to be exhaustive.
  for (Address address = AlignUp(start_address, Entry::kMinAlignmentBytes);
       AddressInSector(sector, address);
       address += Entry::kMinAlignmentBytes) {
    uint32_t magic;
    TRY(partition_.Read(address, as_writable_bytes(span(&magic, 1))));
    if (formats_.KnownMagic(magic)) {
      DBG("Found entry magic at address %zx", size_t(address));
      *next_entry_address = address;
      return Status::OK;
    }
  }

  return Status::NOT_FOUND;
}

// TODO: This method is the trigger of the O(valid_entries * all_entries) time
// complexity for reading. At some cost to memory, this could be optimized by
// using a hash table instead of scanning, but in practice this should be fine
// for a small number of keys.
Status KeyValueStore::AppendNewOrOverwriteStaleExistingDescriptor(
    const KeyDescriptor& key_descriptor) {
  // With the new key descriptor, either add it to the descriptor table or
  // overwrite an existing entry with an older version of the key.
  KeyDescriptor* existing_descriptor = FindDescriptor(key_descriptor.hash());

  // Write a new entry.
  if (existing_descriptor == nullptr) {
    if (key_descriptors_.full()) {
      return Status::RESOURCE_EXHAUSTED;
    }
    key_descriptors_.push_back(key_descriptor);
  } else if (key_descriptor.IsNewerThan(
                 existing_descriptor->transaction_id())) {
    // Existing entry is old; replace the existing entry with the new one.
    *existing_descriptor = key_descriptor;
  } else if (existing_descriptor->transaction_id() ==
             key_descriptor.transaction_id()) {
    // If the entries have a duplicate transaction ID, add the new (redundant)
    // entry to the existing descriptor.
    if (existing_descriptor->hash() != key_descriptor.hash()) {
      ERR("Duplicate entry for key %#010" PRIx32 " with transaction ID %" PRIu32
          " has non-matching hash",
          key_descriptor.hash(),
          key_descriptor.transaction_id());
      return Status::DATA_LOSS;
    }

    // Verify that this entry is not in the same sector as an existing copy of
    // this same key.
    for (auto address : existing_descriptor->addresses()) {
      if (SectorFromAddress(address) ==
          SectorFromAddress(key_descriptor.address())) {
        DBG("Multiple redundant entries in same sector %u",
            SectorIndex(SectorFromAddress(address)));
        return Status::DATA_LOSS;
      }
    }
    existing_descriptor->addresses().push_back(key_descriptor.address());
  } else {
    DBG("Found stale entry when appending; ignoring");
  }
  return Status::OK;
}

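// Returns the descriptor with the given key hash, or nullptr if none exists.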
KeyValueStore::KeyDescriptor* KeyValueStore::FindDescriptor(uint32_t hash) {
  for (KeyDescriptor& key_descriptor : key_descriptors_) {
    if (key_descriptor.hash() == hash) {
      return &key_descriptor;
    }
  }
  return nullptr;
}

StatusWithSize KeyValueStore::Get(string_view key,
                                  span<byte> value_buffer,
                                  size_t offset_bytes) const {
  TRY_WITH_SIZE(CheckOperation(key));

  const KeyDescriptor* key_descriptor;
  TRY_WITH_SIZE(FindExistingKeyDescriptor(key, &key_descriptor));

  return Get(key, *key_descriptor, value_buffer, offset_bytes);
}

Status KeyValueStore::PutBytes(string_view key, span<const byte> value) {
  DBG("Writing key/value; key length=%zu, value length=%zu",
      key.size(),
      value.size());

  TRY(CheckOperation(key));

  if (Entry::size(partition_, key, value) > partition_.sector_size_bytes()) {
    DBG("%zu B value with %zu B key cannot fit in one sector",
        value.size(),
        key.size());
    return Status::INVALID_ARGUMENT;
  }

  KeyDescriptor* key_descriptor;
  Status status = FindKeyDescriptor(key, &key_descriptor);

  if (status.ok()) {
    // TODO: figure out how logging should handle multiple addresses.
    DBG("Overwriting entry for key %#010" PRIx32 " in %u sectors including %u",
        key_descriptor->hash(),
        unsigned(key_descriptor->addresses().size()),
        SectorIndex(SectorFromAddress(key_descriptor->address())));
    return WriteEntryForExistingKey(
        key_descriptor, KeyDescriptor::kValid, key, value);
  }

  if (status == Status::NOT_FOUND) {
    return WriteEntryForNewKey(key, value);
  }

  return status;
}

Status KeyValueStore::Delete(string_view key) {
  TRY(CheckOperation(key));

  KeyDescriptor* key_descriptor;
  TRY(FindExistingKeyDescriptor(key, &key_descriptor));

  // TODO: figure out how logging should handle multiple addresses.
  DBG("Writing tombstone for key %#010" PRIx32 " in %u sectors including %u",
      key_descriptor->hash(),
      unsigned(key_descriptor->addresses().size()),
      SectorIndex(SectorFromAddress(key_descriptor->address())));
  return WriteEntryForExistingKey(
      key_descriptor, KeyDescriptor::kDeleted, key, {});
}

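// Clears the key buffer, then reads this item's key from flash.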
void KeyValueStore::Item::ReadKey() {
  key_buffer_.fill('\0');

  Entry entry;
  if (Entry::Read(
          kvs_.partition_, descriptor_->address(), kvs_.formats_, &entry)
          .ok()) {
    entry.ReadKey(key_buffer_);
  }
}

KeyValueStore::iterator& KeyValueStore::iterator::operator++() {
  // Skip to the next entry that is valid (not deleted).
  while (++item_.descriptor_ != item_.kvs_.key_descriptors_.end() &&
         item_.descriptor_->deleted()) {
  }
  return *this;
}

KeyValueStore::iterator KeyValueStore::begin() const {
  const KeyDescriptor* descriptor = key_descriptors_.begin();
  // Skip over any deleted entries at the start of the descriptor list.
  while (descriptor != key_descriptors_.end() && descriptor->deleted()) {
    ++descriptor;
  }
  return iterator(*this, descriptor);
}

// TODO(hepler): The valid entry count could be tracked in the KVS to avoid the
// need for this for-loop.
size_t KeyValueStore::size() const {
  size_t valid_entries = 0;

  for (const KeyDescriptor& key_descriptor : key_descriptors_) {
    if (!key_descriptor.deleted()) {
      valid_entries += 1;
    }
  }

  return valid_entries;
}

StatusWithSize KeyValueStore::ValueSize(std::string_view key) const {
  TRY_WITH_SIZE(CheckOperation(key));

  const KeyDescriptor* key_descriptor;
  TRY_WITH_SIZE(FindExistingKeyDescriptor(key, &key_descriptor));

  return ValueSize(*key_descriptor);
}

StatusWithSize KeyValueStore::Get(string_view key,
                                  const KeyDescriptor& descriptor,
                                  span<std::byte> value_buffer,
                                  size_t offset_bytes) const {
  Entry entry;
  // TODO: add support for using one of the redundant entries if reading the
  // first copy fails.
  TRY_WITH_SIZE(
      Entry::Read(partition_, descriptor.address(), formats_, &entry));

  StatusWithSize result = entry.ReadValue(value_buffer, offset_bytes);
  if (result.ok() && options_.verify_on_read && offset_bytes == 0u) {
    Status verify_result =
        entry.VerifyChecksum(key, value_buffer.first(result.size()));
    if (!verify_result.ok()) {
      std::memset(value_buffer.data(), 0, result.size());
      return StatusWithSize(verify_result, 0);
    }

    return StatusWithSize(verify_result, result.size());
  }
  return result;
}

Status KeyValueStore::FixedSizeGet(std::string_view key,
                                   void* value,
                                   size_t size_bytes) const {
  TRY(CheckOperation(key));

  const KeyDescriptor* descriptor;
  TRY(FindExistingKeyDescriptor(key, &descriptor));

  return FixedSizeGet(key, *descriptor, value, size_bytes);
}

Status KeyValueStore::FixedSizeGet(std::string_view key,
                                   const KeyDescriptor& descriptor,
                                   void* value,
                                   size_t size_bytes) const {
  // Ensure that the size of the stored value matches the size of the type.
  // Otherwise, report error. This check avoids potential memory corruption.
  TRY_ASSIGN(const size_t actual_size, ValueSize(descriptor));

  if (actual_size != size_bytes) {
    DBG("Requested %zu B read, but value is %zu B", size_bytes, actual_size);
    return Status::INVALID_ARGUMENT;
  }

  StatusWithSize result =
      Get(key, descriptor, span(static_cast<byte*>(value), size_bytes), 0);

  return result.status();
}

StatusWithSize KeyValueStore::ValueSize(const KeyDescriptor& descriptor) const {
  Entry entry;
  TRY_WITH_SIZE(
      Entry::Read(partition_, descriptor.address(), formats_, &entry));

  return StatusWithSize(entry.value_size());
}

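// Rejects operations with an invalid key (empty or too long) or on a KVS that
// has not been initialized.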
Status KeyValueStore::CheckOperation(string_view key) const {
  if (InvalidKey(key)) {
    return Status::INVALID_ARGUMENT;
  }
  if (!initialized()) {
    return Status::FAILED_PRECONDITION;
  }
  return Status::OK;
}

// Searches for a KeyDescriptor that matches this key and sets *result to point
// to it if one is found.
//
//             OK: there is a matching descriptor and *result is set
//      NOT_FOUND: there is no descriptor that matches this key, but this key
//                 has a unique hash (and could potentially be added to the KVS)
// ALREADY_EXISTS: there is no descriptor that matches this key, but the
//                 key's hash collides with the hash for an existing descriptor
//
Status KeyValueStore::FindKeyDescriptor(string_view key,
                                        const KeyDescriptor** result) const {
  const uint32_t hash = internal::Hash(key);
  Entry::KeyBuffer key_buffer;

  for (auto& descriptor : key_descriptors_) {
    if (descriptor.hash() == hash) {
      TRY(Entry::ReadKey(
          partition_, descriptor.address(), key.size(), key_buffer.data()));

      if (key == string_view(key_buffer.data(), key.size())) {
        DBG("Found match for key hash 0x%08" PRIx32, hash);
        *result = &descriptor;
        return Status::OK;
      } else {
        WRN("Found key hash collision for 0x%08" PRIx32, hash);
        return Status::ALREADY_EXISTS;
      }
    }
  }
  return Status::NOT_FOUND;
}

// Searches for a KeyDescriptor that matches this key and sets *result to point
// to it if one is found.
//
//        OK: there is a matching descriptor and *result is set
// NOT_FOUND: there is no descriptor that matches this key
//
Status KeyValueStore::FindExistingKeyDescriptor(
    string_view key, const KeyDescriptor** result) const {
  Status status = FindKeyDescriptor(key, result);

  // If the key's hash collides with an existing key or if the key is deleted,
  // treat it as if it is not in the KVS.
  if (status == Status::ALREADY_EXISTS ||
      (status.ok() && (*result)->deleted())) {
    return Status::NOT_FOUND;
  }
  return status;
}

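// Writes a new version of an existing key (or its tombstone), then points the
// key descriptor at the new entry and removes the old entry's valid bytes from
// the sectors that held it.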
Status KeyValueStore::WriteEntryForExistingKey(KeyDescriptor* key_descriptor,
                                               KeyDescriptor::State new_state,
                                               string_view key,
                                               span<const byte> value) {
  Entry original_entry;
  // TODO: add support for using one of the redundant entries if reading the
  // first copy fails.
  TRY(Entry::Read(
      partition_, key_descriptor->address(), formats_, &original_entry));

  // Create a new temporary key descriptor to use while writing the new
  // key-value out to flash. Once the writing is done, update the main
  // descriptor for this key with the new information.
  KeyDescriptor new_key_descriptor(key);
  TRY(WriteEntry(&new_key_descriptor, key, value, new_state));

  // Update the main descriptor for the new key version.
  KeyDescriptor old_key_descriptor = *key_descriptor;
  *key_descriptor = new_key_descriptor;

  // Remove all the valid bytes for the old key version, which are now stale.
  for (auto& address : old_key_descriptor.addresses()) {
    SectorFromAddress(address)->RemoveValidBytes(original_entry.size());
  }

  return Status::OK;
}

Status KeyValueStore::WriteEntryForNewKey(string_view key,
                                          span<const byte> value) {
  if (key_descriptors_.full()) {
    WRN("KVS full: trying to store a new entry, but can't. Have %zu entries",
        key_descriptors_.size());
    return Status::RESOURCE_EXHAUSTED;
  }

  // Create the KeyDescriptor that will be added to the list and write it to
  // flash.
  KeyDescriptor key_descriptor(key);
  TRY(WriteEntry(&key_descriptor, key, value, KeyDescriptor::kValid));

  // Only add the entry when we are certain the write succeeded.
  key_descriptors_.push_back(key_descriptor);
  return Status::OK;
}

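// Writes kEntryRedundancy copies of the entry, each to a different sector, and
// records every written address in the key descriptor.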
Status KeyValueStore::WriteEntry(KeyDescriptor* key_descriptor,
                                 string_view key,
                                 span<const byte> value,
                                 KeyDescriptor::State new_state) {
  size_t entry_size = Entry::size(partition_, key, value);

  Entry entry = CreateEntry(0, key, value, new_state);
  *key_descriptor = entry.descriptor(key);
  key_descriptor->addresses().clear();

  // For each of the redundant entries to be written, do the following:
  // - Find a sector to write an individual entry to. This optionally will
  //   include garbage collecting one or more sectors if needed.
  // - Write the entry to the sector.
  // - Repeat for redundancy number of total entries.
  for (size_t i = 0; i < internal::kEntryRedundancy; i++) {
    SectorDescriptor* sector;
    TRY(GetSectorForWrite(&sector, entry_size, key_descriptor));

    DBG("Writing entry %zu; found sector: %u", i, SectorIndex(sector));
    const Address write_address = NextWritableAddress(sector);
    TRY(AppendEntry(write_address, entry, key, value));

    // Entry copy was written successfully; update the key descriptor to
    // reflect the new entry.
    key_descriptor->addresses().push_back(write_address);
  }

  // Once all the entries are written, add valid bytes to each of the sectors
  // that entries were written to.
  for (auto new_address : key_descriptor->addresses()) {
    SectorFromAddress(new_address)->AddValidBytes(entry.size());
  }

  return Status::OK;
}

// Finds a sector to write a new entry to. Does automatic garbage collection if
// needed and allowed.
//
//                 OK: Sector found with needed space.
// RESOURCE_EXHAUSTED: No sector available with the needed space.
Status KeyValueStore::GetSectorForWrite(SectorDescriptor** sector,
                                        size_t entry_size,
                                        KeyDescriptor* key_descriptor) {
  Status result = FindSectorWithSpace(
      sector, entry_size, kAppendEntry, key_descriptor->addresses());

  bool do_auto_gc = options_.gc_on_write != GargbageCollectOnWrite::kDisabled;

  // Do garbage collection as needed, so long as policy allows.
  while (result == Status::RESOURCE_EXHAUSTED && do_auto_gc) {
    if (options_.gc_on_write == GargbageCollectOnWrite::kOneSector) {
      // If the GC config option is kOneSector, clear the flag to not do any
      // more GC after this try.
      do_auto_gc = false;
    }
    // Garbage collect and then try again to find the best sector.
    Status gc_status = GarbageCollectPartial();
    if (!gc_status.ok()) {
      if (gc_status == Status::NOT_FOUND) {
        // Not enough space, and no reclaimable bytes; this KVS is full!
        return Status::RESOURCE_EXHAUSTED;
      }
      return gc_status;
    }

    result = FindSectorWithSpace(
        sector, entry_size, kAppendEntry, key_descriptor->addresses());
  }

  if (!result.ok()) {
    WRN("Unable to find sector to write %zu B", entry_size);
  }
  return result;
}

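// Writes the entry at write_address, updates the sector's writable byte count,
// and verifies the checksum in flash when verify_on_write is enabled.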
Status KeyValueStore::AppendEntry(Address write_address,
                                  Entry& entry,
                                  string_view key,
                                  span<const byte> value) {
  entry.UpdateAddress(write_address);

  StatusWithSize result = entry.Write(key, value);
  // Remove any bytes that were written, even if the write was not successful.
  // This is important to retain the writable space invariant on the sectors.
  SectorFromAddress(write_address)->RemoveWritableBytes(result.size());

  if (!result.ok()) {
    ERR("Failed to write %zu bytes at %#zx. %zu actually written",
        entry.size(),
        size_t(write_address),
        result.size());
    return result.status();
  }

  if (options_.verify_on_write) {
    TRY(entry.VerifyChecksumInFlash());
  }

  return Status::OK;
}

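// Moves the entry at old_address to a different sector as part of garbage
// collection, then updates the key descriptor and both sectors' valid bytes.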
Status KeyValueStore::RelocateEntry(KeyDescriptor& key_descriptor,
                                    KeyValueStore::Address old_address) {
  Entry entry;
  TRY(Entry::Read(partition_, old_address, formats_, &entry));

  // Find a new sector for the entry and write it to the new location. For
  // relocation the find should not be a sector already containing the key
  // but can be the always empty sector, since this is part of the GC process
  // that will result in a new empty sector. Also find a sector that does not
  // have reclaimable space (mostly for the full GC, where that would result in
  // an immediate extra relocation).
  SectorDescriptor* new_sector;

  TRY(FindSectorWithSpace(
      &new_sector, entry.size(), kGarbageCollect, key_descriptor.addresses()));
  const Address new_address = NextWritableAddress(new_sector);
  TRY(MoveEntry(new_address, entry));

  // TODO: Perhaps add a check that the entry matches the key descriptor (key
  // hash, ID, checksum).

  // Entry was written successfully; update the key descriptor and the sector
  // descriptors to reflect the new entry.
  key_descriptor.UpdateAddress(old_address, new_address);
  new_sector->AddValidBytes(entry.size());
  SectorFromAddress(old_address)->RemoveValidBytes(entry.size());

  return Status::OK;
}

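// Copies an entry to new_address by reading it into working_buffer_, verifying
// its checksum, writing it at the new location, and optionally verifying the
// written copy.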
Status KeyValueStore::MoveEntry(Address new_address, Entry& entry) {
  // Step 1: Read the old entry.
  struct TempEntry {
    Entry::KeyBuffer key;
    std::array<byte, sizeof(working_buffer_) - sizeof(key)> value;
  };
  auto [key_buffer, value_buffer] =
      *std::launder(reinterpret_cast<TempEntry*>(working_buffer_.data()));

  // Read the entry to be relocated. Store the entry in a local variable and
  // store the key and value in the TempEntry stored in the statically
  // allocated working_buffer_.
  TRY_ASSIGN(size_t key_length, entry.ReadKey(key_buffer));
  string_view key = string_view(key_buffer.data(), key_length);

  StatusWithSize result = entry.ReadValue(value_buffer);
  if (!result.ok()) {
    return Status::INTERNAL;
  }

  const span value = span(value_buffer.data(), result.size());
  TRY(entry.VerifyChecksum(key, value));

  DBG("Moving %zu B entry with transaction ID %zu to address %#zx",
      entry.size(),
      size_t(entry.transaction_id()),
      size_t(new_address));

  // Step 2: Write the entry to the new location.
  entry.UpdateAddress(new_address);
  result = entry.Write(key, value);

  // Remove any bytes that were written, even if the write was not successful.
  // This is important to retain the writable space invariant on the sectors.
  SectorFromAddress(new_address)->RemoveWritableBytes(result.size());

  if (!result.ok()) {
    ERR("Failed to write %zu bytes at %" PRIx32 ". %zu actually written",
        entry.size(),
        new_address,
        result.size());
    return result.status();
  }

  // Step 3: Verify the write to the new location.
  if (options_.verify_on_write) {
    TRY(entry.VerifyChecksumInFlash());
  }

  return Status::OK;
}

// Find either an existing sector with enough space that is not the sector to
// skip, or an empty sector. Maintains the invariant that there is always at
// least 1 empty sector except during GC. On GC, skip sectors that have
// reclaimable bytes.
Status KeyValueStore::FindSectorWithSpace(
    SectorDescriptor** found_sector,
    size_t size,
    FindSectorMode find_mode,
    span<const Address> addresses_to_skip) {
  SectorDescriptor* first_empty_sector = nullptr;
  bool at_least_two_empty_sectors = (find_mode == kGarbageCollect);

  // Build a vector of sectors to avoid.
  Vector<const SectorDescriptor*, internal::kEntryRedundancy> sectors_to_skip;
  for (auto& address : addresses_to_skip) {
    sectors_to_skip.push_back(SectorFromAddress(address));
  }

  DBG("Find sector with %zu bytes available, starting with sector %u",
      size,
      SectorIndex(last_new_sector_));
  for (auto& skip_sector : sectors_to_skip) {
    DBG(" Skip sector %u", SectorIndex(skip_sector));
  }

  // The last_new_sector_ is the sector that was last selected as the "new empty
  // sector" to write to. This last new sector is used as the starting point for
  // the next "find a new empty sector to write to" operation. By using the last
  // new sector as the start point we will cycle which empty sector is selected
  // next, spreading the wear across all the empty sectors and get a wear
  // leveling benefit, rather than putting more wear on the lower number
  // sectors.
  SectorDescriptor* sector = last_new_sector_;

  // Look for a sector to use with enough space. The search uses a two-tier
  // priority process.
  //
  // Tier 1 is a sector that already has valid data. During GC, only select a
  // sector that has no reclaimable bytes. Immediately use the first matching
  // sector that is found.
  //
  // Tier 2 is sectors that are empty/erased. While scanning for a partial
  // sector, keep track of the first empty sector and whether a second empty
  // sector was seen. If during GC, count the second empty sector as always
  // seen.
  for (size_t j = 0; j < sectors_.size(); j++) {
    sector += 1;
    if (sector == sectors_.end()) {
      sector = sectors_.begin();
    }

    if (std::find(sectors_to_skip.begin(), sectors_to_skip.end(), sector) !=
        sectors_to_skip.end()) {
      continue;
    }

    const size_t sector_size_bytes = partition_.sector_size_bytes();
    if (!sector->Empty(sector_size_bytes) && sector->HasSpace(size) &&
        ((find_mode == kAppendEntry) ||
         (sector->RecoverableBytes(sector_size_bytes) == 0))) {
      *found_sector = sector;
      return Status::OK;
    }

    if (sector->Empty(sector_size_bytes)) {
      if (first_empty_sector == nullptr) {
        first_empty_sector = sector;
      } else {
        at_least_two_empty_sectors = true;
      }
    }
  }

  // If the scan for a partial sector does not find a suitable sector, use the
  // first empty sector that was found. Normally it is required to keep 1 empty
  // sector after the sector found here, but that rule does not apply during GC.
  if (at_least_two_empty_sectors) {
    DBG(" Found a usable empty sector; returning the first found (%u)",
        SectorIndex(first_empty_sector));
    last_new_sector_ = first_empty_sector;
    *found_sector = first_empty_sector;
    return Status::OK;
  }

  // No sector was found.
  DBG(" Unable to find a usable sector");
  *found_sector = nullptr;
  return Status::RESOURCE_EXHAUSTED;
}

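// Chooses the garbage collection candidate: prefer a sector with reclaimable
// bytes and no valid entries; otherwise pick the sector with the most
// reclaimable bytes. Returns nullptr if no sector has anything to reclaim.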
KeyValueStore::SectorDescriptor* KeyValueStore::FindSectorToGarbageCollect() {
  const size_t sector_size_bytes = partition_.sector_size_bytes();
  SectorDescriptor* sector_candidate = nullptr;
  size_t candidate_bytes = 0;

  // Step 1: Try to find a sector with stale keys and no valid keys (no
  // relocation needed). If any such sectors are found, use the sector with the
  // most reclaimable bytes.
  for (auto& sector : sectors_) {
    if ((sector.valid_bytes() == 0) &&
        (sector.RecoverableBytes(sector_size_bytes) > candidate_bytes)) {
      sector_candidate = &sector;
      candidate_bytes = sector.RecoverableBytes(sector_size_bytes);
    }
  }

  // Step 2: If step 1 yields no sectors, just find the sector with the most
  // reclaimable bytes.
  if (sector_candidate == nullptr) {
    for (auto& sector : sectors_) {
      if (sector.RecoverableBytes(sector_size_bytes) > candidate_bytes) {
        sector_candidate = &sector;
        candidate_bytes = sector.RecoverableBytes(sector_size_bytes);
      }
    }
  }

  if (sector_candidate != nullptr) {
    DBG("Found sector %u to Garbage Collect, %zu recoverable bytes",
        SectorIndex(sector_candidate),
        sector_candidate->RecoverableBytes(sector_size_bytes));
  } else {
    DBG("Unable to find sector to garbage collect!");
  }
  return sector_candidate;
}

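// Garbage collects every sector that has reclaimable bytes, starting from the
// sector after last_new_sector_.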
Status KeyValueStore::GarbageCollectFull() {
  DBG("Garbage Collect all sectors");
  SectorDescriptor* sector = last_new_sector_;

  // TODO: look into making an iterator method for cycling through sectors
  // starting from last_new_sector_.
  for (size_t j = 0; j < sectors_.size(); j++) {
    sector += 1;
    if (sector == sectors_.end()) {
      sector = sectors_.begin();
    }

    if (sector->RecoverableBytes(partition_.sector_size_bytes()) > 0) {
      TRY(GarbageCollectSector(sector));
    }
  }

  DBG("Garbage Collect all complete");
  return Status::OK;
}

Status KeyValueStore::GarbageCollectPartial() {
  DBG("Garbage Collect a single sector");

  // Step 1: Find the sector to garbage collect.
  SectorDescriptor* sector_to_gc = FindSectorToGarbageCollect();

  if (sector_to_gc == nullptr) {
    // Nothing to GC.
    return Status::NOT_FOUND;
  }

  TRY(GarbageCollectSector(sector_to_gc));
  return Status::OK;
}

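// Relocates all valid entries out of sector_to_gc, then erases the sector and
// resets its writable byte count.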
Status KeyValueStore::GarbageCollectSector(SectorDescriptor* sector_to_gc) {
  // Step 1: Move any valid entries in the GC sector to other sectors
  if (sector_to_gc->valid_bytes() != 0) {
    for (auto& descriptor : key_descriptors_) {
      if (AddressInSector(*sector_to_gc, descriptor.address())) {
        DBG(" Relocate entry");
        TRY(RelocateEntry(descriptor, descriptor.address()));
      }
    }
  }

  if (sector_to_gc->valid_bytes() != 0) {
    ERR(" Failed to relocate valid entries from sector being garbage "
        "collected, %zu valid bytes remain",
        sector_to_gc->valid_bytes());
    return Status::INTERNAL;
  }

  // Step 2: Reinitialize the sector
  sector_to_gc->set_writable_bytes(0);
  TRY(partition_.Erase(SectorBaseAddress(sector_to_gc), 1));
  sector_to_gc->set_writable_bytes(partition_.sector_size_bytes());

  DBG(" Garbage Collect sector %u complete", SectorIndex(sector_to_gc));
  return Status::OK;
}

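// Builds a valid entry or a tombstone in the primary entry format, always
// consuming a new transaction ID (see the comment below on burning IDs).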
KeyValueStore::Entry KeyValueStore::CreateEntry(Address address,
                                                std::string_view key,
                                                span<const byte> value,
                                                KeyDescriptor::State state) {
  // Always bump the transaction ID when creating a new entry.
  //
  // Burning transaction IDs prevents inconsistencies between flash and memory
  // that could happen if a write succeeds, but for some reason the read and
  // verify step fails. Here's how this would happen:
  //
  // 1. The entry is written but for some reason the flash reports failure OR
  //    the write succeeds, but the read / verify operation fails.
  // 2. The transaction ID is NOT incremented, because of the failure.
  // 3. (later) A new entry is written, re-using the transaction ID (oops).
  //
  // By always burning transaction IDs, the above problem can't happen.
  last_transaction_id_ += 1;

  if (state == KeyDescriptor::kDeleted) {
    return Entry::Tombstone(
        partition_, address, formats_.primary(), key, last_transaction_id_);
  }
  return Entry::Valid(partition_,
                      address,
                      formats_.primary(),
                      key,
                      value,
                      last_transaction_id_);
}

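// Returns the KVS to its uninitialized state; called from the constructor and
// at the start of Init().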
void KeyValueStore::Reset() {
  initialized_ = false;
  key_descriptors_.clear();
  last_new_sector_ = nullptr;
  last_transaction_id_ = 0;
}

void KeyValueStore::LogDebugInfo() {
  const size_t sector_size_bytes = partition_.sector_size_bytes();
  DBG("====================== KEY VALUE STORE DUMP =========================");
  DBG(" ");
  DBG("Flash partition:");
  DBG(" Sector count = %zu", partition_.sector_count());
  DBG(" Sector max count = %zu", sectors_.max_size());
  DBG(" Sectors in use = %zu", sectors_.size());
  DBG(" Sector size = %zu", sector_size_bytes);
  DBG(" Total size = %zu", partition_.size_bytes());
  DBG(" Alignment = %zu", partition_.alignment_bytes());
  DBG(" ");
  DBG("Key descriptors:");
  DBG(" Entry count = %zu", key_descriptors_.size());
  DBG(" Max entry count = %zu", key_descriptors_.max_size());
  DBG(" ");
  DBG(" # hash version address address (hex)");
  for (size_t i = 0; i < key_descriptors_.size(); ++i) {
    const KeyDescriptor& kd = key_descriptors_[i];
    DBG(" |%3zu: | %8zx |%8zu | %8zu | %8zx",
        i,
        size_t(kd.hash()),
        size_t(kd.transaction_id()),
        size_t(kd.address()),
        size_t(kd.address()));
  }
  DBG(" ");

  DBG("Sector descriptors:");
  DBG(" # tail free valid has_space");
  for (size_t sector_id = 0; sector_id < sectors_.size(); ++sector_id) {
    const SectorDescriptor& sd = sectors_[sector_id];
    DBG(" |%3zu: | %8zu |%8zu | %s",
        sector_id,
        size_t(sd.writable_bytes()),
        sd.valid_bytes(),
        sd.writable_bytes() ? "YES" : "");
  }
  DBG(" ");

  // TODO: This should stop logging after some threshold.
  // size_t dumped_bytes = 0;
  DBG("Sector raw data:");
  for (size_t sector_id = 0; sector_id < sectors_.size(); ++sector_id) {
    // Read sector data. Yes, this will blow the stack on embedded.
    std::array<byte, 500> raw_sector_data;  // TODO!!!
    StatusWithSize sws =
        partition_.Read(sector_id * sector_size_bytes, raw_sector_data);
    DBG("Read: %zu bytes", sws.size());

    DBG(" base addr offs 0 1 2 3 4 5 6 7");
    for (size_t i = 0; i < sector_size_bytes; i += 8) {
      DBG(" %3zu %8zx %5zu | %02x %02x %02x %02x %02x %02x %02x %02x",
          sector_id,
          (sector_id * sector_size_bytes) + i,
          i,
          static_cast<unsigned int>(raw_sector_data[i + 0]),
          static_cast<unsigned int>(raw_sector_data[i + 1]),
          static_cast<unsigned int>(raw_sector_data[i + 2]),
          static_cast<unsigned int>(raw_sector_data[i + 3]),
          static_cast<unsigned int>(raw_sector_data[i + 4]),
          static_cast<unsigned int>(raw_sector_data[i + 5]),
          static_cast<unsigned int>(raw_sector_data[i + 6]),
          static_cast<unsigned int>(raw_sector_data[i + 7]));

      // TODO: Fix exit condition.
      if (i > 128) {
        break;
      }
    }
    DBG(" ");
  }

  DBG("////////////////////// KEY VALUE STORE DUMP END /////////////////////");
}

void KeyValueStore::LogSectors() const {
  DBG("Sector descriptors: count %zu", sectors_.size());
  for (auto& sector : sectors_) {
    DBG(" - Sector %u: valid %zu, recoverable %zu, free %zu",
        SectorIndex(&sector),
        sector.valid_bytes(),
        sector.RecoverableBytes(partition_.sector_size_bytes()),
        sector.writable_bytes());
  }
}

void KeyValueStore::LogKeyDescriptor() const {
  DBG("Key descriptors: count %zu", key_descriptors_.size());
  for (auto& key : key_descriptors_) {
    DBG(" - Key: %s, hash %#zx, transaction ID %zu, address %#zx",
        key.deleted() ? "Deleted" : "Valid",
        static_cast<size_t>(key.hash()),
        static_cast<size_t>(key.transaction_id()),
        static_cast<size_t>(key.address()));
  }
}

}  // namespace pw::kvs