Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 1 | /* |
| 2 | * fs/logfs/logfs_abi.h |
| 3 | * |
| 4 | * As should be obvious for Linux kernel code, license is GPLv2 |
| 5 | * |
| 6 | * Copyright (c) 2005-2008 Joern Engel <joern@logfs.org> |
| 7 | * |
| 8 | * Public header for logfs. |
| 9 | */ |
| 10 | #ifndef FS_LOGFS_LOGFS_ABI_H |
| 11 | #define FS_LOGFS_LOGFS_ABI_H |
| 12 | |
| 13 | /* For out-of-kernel compiles */ |
| 14 | #ifndef BUILD_BUG_ON |
| 15 | #define BUILD_BUG_ON(condition) /**/ |
| 16 | #endif |
| 17 | |
| 18 | #define SIZE_CHECK(type, size) \ |
| 19 | static inline void check_##type(void) \ |
| 20 | { \ |
| 21 | BUILD_BUG_ON(sizeof(struct type) != (size)); \ |
| 22 | } |
| 23 | |
| 24 | /* |
| 25 | * Throughout the logfs code, we're constantly dealing with blocks at |
| 26 | * various positions or offsets. To remove confusion, we stricly |
| 27 | * distinguish between a "position" - the logical position within a |
| 28 | * file and an "offset" - the physical location within the device. |
| 29 | * |
| 30 | * Any usage of the term offset for a logical location or position for |
| 31 | * a physical one is a bug and should get fixed. |
| 32 | */ |
| 33 | |
| 34 | /* |
| 35 | * Block are allocated in one of several segments depending on their |
| 36 | * level. The following levels are used: |
| 37 | * 0 - regular data block |
| 38 | * 1 - i1 indirect blocks |
| 39 | * 2 - i2 indirect blocks |
| 40 | * 3 - i3 indirect blocks |
| 41 | * 4 - i4 indirect blocks |
| 42 | * 5 - i5 indirect blocks |
| 43 | * 6 - ifile data blocks |
| 44 | * 7 - ifile i1 indirect blocks |
| 45 | * 8 - ifile i2 indirect blocks |
| 46 | * 9 - ifile i3 indirect blocks |
| 47 | * 10 - ifile i4 indirect blocks |
| 48 | * 11 - ifile i5 indirect blocks |
| 49 | * Potential levels to be used in the future: |
| 50 | * 12 - gc recycled blocks, long-lived data |
| 51 | * 13 - replacement blocks, short-lived data |
| 52 | * |
Anand Gadiyar | a8cd456 | 2010-05-10 14:51:19 +0530 | [diff] [blame] | 53 | * Levels 1-11 are necessary for robust gc operations and help separate |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 54 | * short-lived metadata from longer-lived file data. In the future, |
Anand Gadiyar | a8cd456 | 2010-05-10 14:51:19 +0530 | [diff] [blame] | 55 | * file data should get separated into several segments based on simple |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 56 | * heuristics. Old data recycled during gc operation is expected to be |
| 57 | * long-lived. New data is of uncertain life expectancy. New data |
| 58 | * used to replace older blocks in existing files is expected to be |
| 59 | * short-lived. |
| 60 | */ |
| 61 | |
| 62 | |
| 63 | /* Magic numbers. 64bit for superblock, 32bit for statfs f_type */ |
Joern Engel | c2f843f | 2010-03-06 10:03:11 +0100 | [diff] [blame] | 64 | #define LOGFS_MAGIC 0x7a3a8e5cb9d5bf67ull |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 65 | #define LOGFS_MAGIC_U32 0xc97e8168u |
| 66 | |
| 67 | /* |
| 68 | * Various blocksize related macros. Blocksize is currently fixed at 4KiB. |
| 69 | * Sooner or later that should become configurable and the macros replaced |
| 70 | * by something superblock-dependent. Pointers in indirect blocks are and |
| 71 | * will remain 64bit. |
| 72 | * |
| 73 | * LOGFS_BLOCKSIZE - self-explaining |
| 74 | * LOGFS_BLOCK_FACTOR - number of pointers per indirect block |
| 75 | * LOGFS_BLOCK_BITS - log2 of LOGFS_BLOCK_FACTOR, used for shifts |
| 76 | */ |
| 77 | #define LOGFS_BLOCKSIZE (4096ull) |
| 78 | #define LOGFS_BLOCK_FACTOR (LOGFS_BLOCKSIZE / sizeof(u64)) |
| 79 | #define LOGFS_BLOCK_BITS (9) |
| 80 | |
| 81 | /* |
| 82 | * Number of blocks at various levels of indirection. There are 16 direct |
| 83 | * block pointers plus a single indirect pointer. |
| 84 | */ |
| 85 | #define I0_BLOCKS (16) |
| 86 | #define I1_BLOCKS LOGFS_BLOCK_FACTOR |
| 87 | #define I2_BLOCKS (LOGFS_BLOCK_FACTOR * I1_BLOCKS) |
| 88 | #define I3_BLOCKS (LOGFS_BLOCK_FACTOR * I2_BLOCKS) |
| 89 | #define I4_BLOCKS (LOGFS_BLOCK_FACTOR * I3_BLOCKS) |
| 90 | #define I5_BLOCKS (LOGFS_BLOCK_FACTOR * I4_BLOCKS) |
| 91 | |
| 92 | #define INDIRECT_INDEX I0_BLOCKS |
| 93 | #define LOGFS_EMBEDDED_FIELDS (I0_BLOCKS + 1) |
| 94 | |
| 95 | /* |
| 96 | * Sizes at which files require another level of indirection. Files smaller |
| 97 | * than LOGFS_EMBEDDED_SIZE can be completely stored in the inode itself, |
| 98 | * similar like ext2 fast symlinks. |
| 99 | * |
| 100 | * Data at a position smaller than LOGFS_I0_SIZE is accessed through the |
| 101 | * direct pointers, else through the 1x indirect pointer and so forth. |
| 102 | */ |
| 103 | #define LOGFS_EMBEDDED_SIZE (LOGFS_EMBEDDED_FIELDS * sizeof(u64)) |
| 104 | #define LOGFS_I0_SIZE (I0_BLOCKS * LOGFS_BLOCKSIZE) |
| 105 | #define LOGFS_I1_SIZE (I1_BLOCKS * LOGFS_BLOCKSIZE) |
| 106 | #define LOGFS_I2_SIZE (I2_BLOCKS * LOGFS_BLOCKSIZE) |
| 107 | #define LOGFS_I3_SIZE (I3_BLOCKS * LOGFS_BLOCKSIZE) |
| 108 | #define LOGFS_I4_SIZE (I4_BLOCKS * LOGFS_BLOCKSIZE) |
| 109 | #define LOGFS_I5_SIZE (I5_BLOCKS * LOGFS_BLOCKSIZE) |
| 110 | |
| 111 | /* |
| 112 | * Each indirect block pointer must have this flag set, if all block pointers |
| 113 | * behind it are set, i.e. there is no hole hidden in the shadow of this |
| 114 | * indirect block pointer. |
| 115 | */ |
| 116 | #define LOGFS_FULLY_POPULATED (1ULL << 63) |
| 117 | #define pure_ofs(ofs) (ofs & ~LOGFS_FULLY_POPULATED) |
| 118 | |
| 119 | /* |
Anand Gadiyar | a8cd456 | 2010-05-10 14:51:19 +0530 | [diff] [blame] | 120 | * LogFS needs to separate data into levels. Each level is defined as the |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 121 | * maximal possible distance from the master inode (inode of the inode file). |
| 122 | * Data blocks reside on level 0, 1x indirect block on level 1, etc. |
| 123 | * Inodes reside on level 6, indirect blocks for the inode file on levels 7-11. |
| 124 | * This effort is necessary to guarantee garbage collection to always make |
| 125 | * progress. |
| 126 | * |
| 127 | * LOGFS_MAX_INDIRECT is the maximal indirection through indirect blocks, |
| 128 | * LOGFS_MAX_LEVELS is one more for the actual data level of a file. It is |
| 129 | * the maximal number of levels for one file. |
| 130 | * LOGFS_NO_AREAS is twice that, as the inode file and regular files are |
| 131 | * effectively stacked on top of each other. |
| 132 | */ |
| 133 | #define LOGFS_MAX_INDIRECT (5) |
| 134 | #define LOGFS_MAX_LEVELS (LOGFS_MAX_INDIRECT + 1) |
| 135 | #define LOGFS_NO_AREAS (2 * LOGFS_MAX_LEVELS) |
| 136 | |
| 137 | /* Maximum size of filenames */ |
| 138 | #define LOGFS_MAX_NAMELEN (255) |
| 139 | |
| 140 | /* Number of segments in the primary journal. */ |
| 141 | #define LOGFS_JOURNAL_SEGS (16) |
| 142 | |
| 143 | /* Maximum number of free/erased/etc. segments in journal entries */ |
| 144 | #define MAX_CACHED_SEGS (64) |
| 145 | |
| 146 | |
| 147 | /* |
| 148 | * LOGFS_OBJECT_HEADERSIZE is the size of a single header in the object store, |
| 149 | * LOGFS_MAX_OBJECTSIZE the size of the largest possible object, including |
| 150 | * its header, |
| 151 | * LOGFS_SEGMENT_RESERVE is the amount of space reserved for each segment for |
| 152 | * its segment header and the padded space at the end when no further objects |
| 153 | * fit. |
| 154 | */ |
| 155 | #define LOGFS_OBJECT_HEADERSIZE (0x1c) |
| 156 | #define LOGFS_SEGMENT_HEADERSIZE (0x18) |
| 157 | #define LOGFS_MAX_OBJECTSIZE (LOGFS_OBJECT_HEADERSIZE + LOGFS_BLOCKSIZE) |
| 158 | #define LOGFS_SEGMENT_RESERVE \ |
| 159 | (LOGFS_SEGMENT_HEADERSIZE + LOGFS_MAX_OBJECTSIZE - 1) |
| 160 | |
| 161 | /* |
| 162 | * Segment types: |
| 163 | * SEG_SUPER - Data or indirect block |
| 164 | * SEG_JOURNAL - Inode |
| 165 | * SEG_OSTORE - Dentry |
| 166 | */ |
| 167 | enum { |
| 168 | SEG_SUPER = 0x01, |
| 169 | SEG_JOURNAL = 0x02, |
| 170 | SEG_OSTORE = 0x03, |
| 171 | }; |
| 172 | |
| 173 | /** |
| 174 | * struct logfs_segment_header - per-segment header in the ostore |
| 175 | * |
| 176 | * @crc: crc32 of header (there is no data) |
| 177 | * @pad: unused, must be 0 |
| 178 | * @type: segment type, see above |
| 179 | * @level: GC level for all objects in this segment |
| 180 | * @segno: segment number |
| 181 | * @ec: erase count for this segment |
| 182 | * @gec: global erase count at time of writing |
| 183 | */ |
| 184 | struct logfs_segment_header { |
| 185 | __be32 crc; |
| 186 | __be16 pad; |
| 187 | __u8 type; |
| 188 | __u8 level; |
| 189 | __be32 segno; |
| 190 | __be32 ec; |
| 191 | __be64 gec; |
| 192 | }; |
| 193 | |
| 194 | SIZE_CHECK(logfs_segment_header, LOGFS_SEGMENT_HEADERSIZE); |
| 195 | |
Joern Engel | 6a08ab8 | 2010-03-05 16:07:04 +0100 | [diff] [blame] | 196 | #define LOGFS_FEATURES_INCOMPAT (0ull) |
| 197 | #define LOGFS_FEATURES_RO_COMPAT (0ull) |
| 198 | #define LOGFS_FEATURES_COMPAT (0ull) |
| 199 | |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 200 | /** |
| 201 | * struct logfs_disk_super - on-medium superblock |
| 202 | * |
| 203 | * @ds_magic: magic number, must equal LOGFS_MAGIC |
| 204 | * @ds_crc: crc32 of structure starting with the next field |
| 205 | * @ds_ifile_levels: maximum number of levels for ifile |
| 206 | * @ds_iblock_levels: maximum number of levels for regular files |
Anand Gadiyar | a8cd456 | 2010-05-10 14:51:19 +0530 | [diff] [blame] | 207 | * @ds_data_levels: number of separate levels for data |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 208 | * @pad0: reserved, must be 0 |
| 209 | * @ds_feature_incompat: incompatible filesystem features |
| 210 | * @ds_feature_ro_compat: read-only compatible filesystem features |
| 211 | * @ds_feature_compat: compatible filesystem features |
| 212 | * @ds_flags: flags |
| 213 | * @ds_segment_shift: log2 of segment size |
| 214 | * @ds_block_shift: log2 of block size |
| 215 | * @ds_write_shift: log2 of write size |
| 216 | * @pad1: reserved, must be 0 |
| 217 | * @ds_journal_seg: segments used by primary journal |
| 218 | * @ds_root_reserve: bytes reserved for the superuser |
| 219 | * @ds_speed_reserve: bytes reserved to speed up GC |
| 220 | * @ds_bad_seg_reserve: number of segments reserved to handle bad blocks |
| 221 | * @pad2: reserved, must be 0 |
| 222 | * @pad3: reserved, must be 0 |
| 223 | * |
| 224 | * Contains only read-only fields. Read-write fields like the amount of used |
| 225 | * space is tracked in the dynamic superblock, which is stored in the journal. |
| 226 | */ |
| 227 | struct logfs_disk_super { |
| 228 | struct logfs_segment_header ds_sh; |
| 229 | __be64 ds_magic; |
| 230 | |
| 231 | __be32 ds_crc; |
| 232 | __u8 ds_ifile_levels; |
| 233 | __u8 ds_iblock_levels; |
| 234 | __u8 ds_data_levels; |
| 235 | __u8 ds_segment_shift; |
| 236 | __u8 ds_block_shift; |
| 237 | __u8 ds_write_shift; |
| 238 | __u8 pad0[6]; |
| 239 | |
| 240 | __be64 ds_filesystem_size; |
| 241 | __be32 ds_segment_size; |
| 242 | __be32 ds_bad_seg_reserve; |
| 243 | |
| 244 | __be64 ds_feature_incompat; |
| 245 | __be64 ds_feature_ro_compat; |
| 246 | |
| 247 | __be64 ds_feature_compat; |
| 248 | __be64 ds_feature_flags; |
| 249 | |
| 250 | __be64 ds_root_reserve; |
| 251 | __be64 ds_speed_reserve; |
| 252 | |
| 253 | __be32 ds_journal_seg[LOGFS_JOURNAL_SEGS]; |
| 254 | |
| 255 | __be64 ds_super_ofs[2]; |
| 256 | __be64 pad3[8]; |
| 257 | }; |
| 258 | |
| 259 | SIZE_CHECK(logfs_disk_super, 256); |
| 260 | |
| 261 | /* |
| 262 | * Object types: |
| 263 | * OBJ_BLOCK - Data or indirect block |
| 264 | * OBJ_INODE - Inode |
| 265 | * OBJ_DENTRY - Dentry |
| 266 | */ |
| 267 | enum { |
| 268 | OBJ_BLOCK = 0x04, |
| 269 | OBJ_INODE = 0x05, |
| 270 | OBJ_DENTRY = 0x06, |
| 271 | }; |
| 272 | |
| 273 | /** |
| 274 | * struct logfs_object_header - per-object header in the ostore |
| 275 | * |
| 276 | * @crc: crc32 of header, excluding data_crc |
| 277 | * @len: length of data |
| 278 | * @type: object type, see above |
| 279 | * @compr: compression type |
| 280 | * @ino: inode number |
| 281 | * @bix: block index |
| 282 | * @data_crc: crc32 of payload |
| 283 | */ |
| 284 | struct logfs_object_header { |
| 285 | __be32 crc; |
| 286 | __be16 len; |
| 287 | __u8 type; |
| 288 | __u8 compr; |
| 289 | __be64 ino; |
| 290 | __be64 bix; |
| 291 | __be32 data_crc; |
| 292 | } __attribute__((packed)); |
| 293 | |
| 294 | SIZE_CHECK(logfs_object_header, LOGFS_OBJECT_HEADERSIZE); |
| 295 | |
| 296 | /* |
| 297 | * Reserved inode numbers: |
| 298 | * LOGFS_INO_MASTER - master inode (for inode file) |
| 299 | * LOGFS_INO_ROOT - root directory |
| 300 | * LOGFS_INO_SEGFILE - per-segment used bytes and erase count |
| 301 | */ |
| 302 | enum { |
| 303 | LOGFS_INO_MAPPING = 0x00, |
| 304 | LOGFS_INO_MASTER = 0x01, |
| 305 | LOGFS_INO_ROOT = 0x02, |
| 306 | LOGFS_INO_SEGFILE = 0x03, |
| 307 | LOGFS_RESERVED_INOS = 0x10, |
| 308 | }; |
| 309 | |
| 310 | /* |
| 311 | * Inode flags. High bits should never be written to the medium. They are |
| 312 | * reserved for in-memory usage. |
| 313 | * Low bits should either remain in sync with the corresponding FS_*_FL or |
| 314 | * reuse slots that obviously don't make sense for logfs. |
| 315 | * |
| 316 | * LOGFS_IF_DIRTY Inode must be written back |
| 317 | * LOGFS_IF_ZOMBIE Inode has been deleted |
| 318 | * LOGFS_IF_STILLBORN -ENOSPC happened when creating inode |
| 319 | */ |
| 320 | #define LOGFS_IF_COMPRESSED 0x00000004 /* == FS_COMPR_FL */ |
| 321 | #define LOGFS_IF_DIRTY 0x20000000 |
| 322 | #define LOGFS_IF_ZOMBIE 0x40000000 |
| 323 | #define LOGFS_IF_STILLBORN 0x80000000 |
| 324 | |
| 325 | /* Flags available to chattr */ |
| 326 | #define LOGFS_FL_USER_VISIBLE (LOGFS_IF_COMPRESSED) |
| 327 | #define LOGFS_FL_USER_MODIFIABLE (LOGFS_IF_COMPRESSED) |
| 328 | /* Flags inherited from parent directory on file/directory creation */ |
| 329 | #define LOGFS_FL_INHERITED (LOGFS_IF_COMPRESSED) |
| 330 | |
| 331 | /** |
| 332 | * struct logfs_disk_inode - on-medium inode |
| 333 | * |
| 334 | * @di_mode: file mode |
| 335 | * @di_pad: reserved, must be 0 |
| 336 | * @di_flags: inode flags, see above |
| 337 | * @di_uid: user id |
| 338 | * @di_gid: group id |
| 339 | * @di_ctime: change time |
| 340 | * @di_mtime: modify time |
| 341 | * @di_refcount: reference count (aka nlink or link count) |
| 342 | * @di_generation: inode generation, for nfs |
| 343 | * @di_used_bytes: number of bytes used |
| 344 | * @di_size: file size |
| 345 | * @di_data: data pointers |
| 346 | */ |
| 347 | struct logfs_disk_inode { |
| 348 | __be16 di_mode; |
| 349 | __u8 di_height; |
| 350 | __u8 di_pad; |
| 351 | __be32 di_flags; |
| 352 | __be32 di_uid; |
| 353 | __be32 di_gid; |
| 354 | |
| 355 | __be64 di_ctime; |
| 356 | __be64 di_mtime; |
| 357 | |
| 358 | __be64 di_atime; |
| 359 | __be32 di_refcount; |
| 360 | __be32 di_generation; |
| 361 | |
| 362 | __be64 di_used_bytes; |
| 363 | __be64 di_size; |
| 364 | |
| 365 | __be64 di_data[LOGFS_EMBEDDED_FIELDS]; |
| 366 | }; |
| 367 | |
| 368 | SIZE_CHECK(logfs_disk_inode, 200); |
| 369 | |
| 370 | #define INODE_POINTER_OFS \ |
| 371 | (offsetof(struct logfs_disk_inode, di_data) / sizeof(__be64)) |
| 372 | #define INODE_USED_OFS \ |
| 373 | (offsetof(struct logfs_disk_inode, di_used_bytes) / sizeof(__be64)) |
| 374 | #define INODE_SIZE_OFS \ |
| 375 | (offsetof(struct logfs_disk_inode, di_size) / sizeof(__be64)) |
| 376 | #define INODE_HEIGHT_OFS (0) |
| 377 | |
| 378 | /** |
| 379 | * struct logfs_disk_dentry - on-medium dentry structure |
| 380 | * |
| 381 | * @ino: inode number |
| 382 | * @namelen: length of file name |
| 383 | * @type: file type, identical to bits 12..15 of mode |
| 384 | * @name: file name |
| 385 | */ |
| 386 | /* FIXME: add 6 bytes of padding to remove the __packed */ |
| 387 | struct logfs_disk_dentry { |
| 388 | __be64 ino; |
| 389 | __be16 namelen; |
| 390 | __u8 type; |
| 391 | __u8 name[LOGFS_MAX_NAMELEN]; |
| 392 | } __attribute__((packed)); |
| 393 | |
| 394 | SIZE_CHECK(logfs_disk_dentry, 266); |
| 395 | |
| 396 | #define RESERVED 0xffffffff |
| 397 | #define BADSEG 0xffffffff |
| 398 | /** |
| 399 | * struct logfs_segment_entry - segment file entry |
| 400 | * |
| 401 | * @ec_level: erase count and level |
| 402 | * @valid: number of valid bytes |
| 403 | * |
| 404 | * Segment file contains one entry for every segment. ec_level contains the |
| 405 | * erasecount in the upper 28 bits and the level in the lower 4 bits. An |
| 406 | * ec_level of BADSEG (-1) identifies bad segments. valid contains the number |
| 407 | * of valid bytes or RESERVED (-1 again) if the segment is used for either the |
| 408 | * superblock or the journal, or when the segment is bad. |
| 409 | */ |
| 410 | struct logfs_segment_entry { |
| 411 | __be32 ec_level; |
| 412 | __be32 valid; |
| 413 | }; |
| 414 | |
| 415 | SIZE_CHECK(logfs_segment_entry, 8); |
| 416 | |
| 417 | /** |
| 418 | * struct logfs_journal_header - header for journal entries (JEs) |
| 419 | * |
| 420 | * @h_crc: crc32 of journal entry |
| 421 | * @h_len: length of compressed journal entry, |
| 422 | * not including header |
| 423 | * @h_datalen: length of uncompressed data |
| 424 | * @h_type: JE type |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 425 | * @h_compr: compression type |
| 426 | * @h_pad: reserved |
| 427 | */ |
| 428 | struct logfs_journal_header { |
| 429 | __be32 h_crc; |
| 430 | __be16 h_len; |
| 431 | __be16 h_datalen; |
| 432 | __be16 h_type; |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 433 | __u8 h_compr; |
Joern Engel | 9cf05b4 | 2010-03-06 10:01:46 +0100 | [diff] [blame] | 434 | __u8 h_pad[5]; |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 435 | }; |
| 436 | |
| 437 | SIZE_CHECK(logfs_journal_header, 16); |
| 438 | |
| 439 | /* |
| 440 | * Life expectency of data. |
| 441 | * VIM_DEFAULT - default vim |
| 442 | * VIM_SEGFILE - for segment file only - very short-living |
| 443 | * VIM_GC - GC'd data - likely long-living |
| 444 | */ |
| 445 | enum logfs_vim { |
| 446 | VIM_DEFAULT = 0, |
| 447 | VIM_SEGFILE = 1, |
| 448 | }; |
| 449 | |
| 450 | /** |
| 451 | * struct logfs_je_area - wbuf header |
| 452 | * |
| 453 | * @segno: segment number of area |
| 454 | * @used_bytes: number of bytes already used |
| 455 | * @gc_level: GC level |
| 456 | * @vim: life expectancy of data |
| 457 | * |
| 458 | * "Areas" are segments currently being used for writing. There is at least |
Anand Gadiyar | a8cd456 | 2010-05-10 14:51:19 +0530 | [diff] [blame] | 459 | * one area per GC level. Several may be used to separate long-living from |
Joern Engel | 5db53f3 | 2009-11-20 20:13:39 +0100 | [diff] [blame] | 460 | * short-living data. If an area with unknown vim is encountered, it can |
| 461 | * simply be closed. |
| 462 | * The write buffer immediately follow this header. |
| 463 | */ |
| 464 | struct logfs_je_area { |
| 465 | __be32 segno; |
| 466 | __be32 used_bytes; |
| 467 | __u8 gc_level; |
| 468 | __u8 vim; |
| 469 | } __attribute__((packed)); |
| 470 | |
| 471 | SIZE_CHECK(logfs_je_area, 10); |
| 472 | |
| 473 | #define MAX_JOURNAL_HEADER \ |
| 474 | (sizeof(struct logfs_journal_header) + sizeof(struct logfs_je_area)) |
| 475 | |
| 476 | /** |
| 477 | * struct logfs_je_dynsb - dynamic superblock |
| 478 | * |
| 479 | * @ds_gec: global erase count |
| 480 | * @ds_sweeper: current position of GC "sweeper" |
| 481 | * @ds_rename_dir: source directory ino (see dir.c documentation) |
| 482 | * @ds_rename_pos: position of source dd (see dir.c documentation) |
| 483 | * @ds_victim_ino: victims of incomplete dir operation (see dir.c) |
| 484 | * @ds_victim_ino: parent inode of victim (see dir.c) |
| 485 | * @ds_used_bytes: number of used bytes |
| 486 | */ |
| 487 | struct logfs_je_dynsb { |
| 488 | __be64 ds_gec; |
| 489 | __be64 ds_sweeper; |
| 490 | |
| 491 | __be64 ds_rename_dir; |
| 492 | __be64 ds_rename_pos; |
| 493 | |
| 494 | __be64 ds_victim_ino; |
| 495 | __be64 ds_victim_parent; /* XXX */ |
| 496 | |
| 497 | __be64 ds_used_bytes; |
| 498 | __be32 ds_generation; |
| 499 | __be32 pad; |
| 500 | }; |
| 501 | |
| 502 | SIZE_CHECK(logfs_je_dynsb, 64); |
| 503 | |
| 504 | /** |
| 505 | * struct logfs_je_anchor - anchor of filesystem tree, aka master inode |
| 506 | * |
| 507 | * @da_size: size of inode file |
| 508 | * @da_last_ino: last created inode |
| 509 | * @da_used_bytes: number of bytes used |
| 510 | * @da_data: data pointers |
| 511 | */ |
| 512 | struct logfs_je_anchor { |
| 513 | __be64 da_size; |
| 514 | __be64 da_last_ino; |
| 515 | |
| 516 | __be64 da_used_bytes; |
| 517 | u8 da_height; |
| 518 | u8 pad[7]; |
| 519 | |
| 520 | __be64 da_data[LOGFS_EMBEDDED_FIELDS]; |
| 521 | }; |
| 522 | |
| 523 | SIZE_CHECK(logfs_je_anchor, 168); |
| 524 | |
| 525 | /** |
| 526 | * struct logfs_je_spillout - spillout entry (from 1st to 2nd journal) |
| 527 | * |
| 528 | * @so_segment: segments used for 2nd journal |
| 529 | * |
| 530 | * Length of the array is given by h_len field in the header. |
| 531 | */ |
| 532 | struct logfs_je_spillout { |
| 533 | __be64 so_segment[0]; |
| 534 | }; |
| 535 | |
| 536 | SIZE_CHECK(logfs_je_spillout, 0); |
| 537 | |
| 538 | /** |
| 539 | * struct logfs_je_journal_ec - erase counts for all journal segments |
| 540 | * |
| 541 | * @ec: erase count |
| 542 | * |
| 543 | * Length of the array is given by h_len field in the header. |
| 544 | */ |
| 545 | struct logfs_je_journal_ec { |
| 546 | __be32 ec[0]; |
| 547 | }; |
| 548 | |
| 549 | SIZE_CHECK(logfs_je_journal_ec, 0); |
| 550 | |
| 551 | /** |
| 552 | * struct logfs_je_free_segments - list of free segmetns with erase count |
| 553 | */ |
| 554 | struct logfs_je_free_segments { |
| 555 | __be32 segno; |
| 556 | __be32 ec; |
| 557 | }; |
| 558 | |
| 559 | SIZE_CHECK(logfs_je_free_segments, 8); |
| 560 | |
| 561 | /** |
| 562 | * struct logfs_seg_alias - list of segment aliases |
| 563 | */ |
| 564 | struct logfs_seg_alias { |
| 565 | __be32 old_segno; |
| 566 | __be32 new_segno; |
| 567 | }; |
| 568 | |
| 569 | SIZE_CHECK(logfs_seg_alias, 8); |
| 570 | |
| 571 | /** |
| 572 | * struct logfs_obj_alias - list of object aliases |
| 573 | */ |
| 574 | struct logfs_obj_alias { |
| 575 | __be64 ino; |
| 576 | __be64 bix; |
| 577 | __be64 val; |
| 578 | u8 level; |
| 579 | u8 pad[5]; |
| 580 | __be16 child_no; |
| 581 | }; |
| 582 | |
| 583 | SIZE_CHECK(logfs_obj_alias, 32); |
| 584 | |
| 585 | /** |
| 586 | * Compression types. |
| 587 | * |
| 588 | * COMPR_NONE - uncompressed |
| 589 | * COMPR_ZLIB - compressed with zlib |
| 590 | */ |
| 591 | enum { |
| 592 | COMPR_NONE = 0, |
| 593 | COMPR_ZLIB = 1, |
| 594 | }; |
| 595 | |
| 596 | /* |
| 597 | * Journal entries come in groups of 16. First group contains unique |
| 598 | * entries, next groups contain one entry per level |
| 599 | * |
| 600 | * JE_FIRST - smallest possible journal entry number |
| 601 | * |
| 602 | * JEG_BASE - base group, containing unique entries |
| 603 | * JE_COMMIT - commit entry, validates all previous entries |
| 604 | * JE_DYNSB - dynamic superblock, anything that ought to be in the |
| 605 | * superblock but cannot because it is read-write data |
| 606 | * JE_ANCHOR - anchor aka master inode aka inode file's inode |
| 607 | * JE_ERASECOUNT erasecounts for all journal segments |
| 608 | * JE_SPILLOUT - unused |
| 609 | * JE_SEG_ALIAS - aliases segments |
| 610 | * JE_AREA - area description |
| 611 | * |
| 612 | * JE_LAST - largest possible journal entry number |
| 613 | */ |
| 614 | enum { |
| 615 | JE_FIRST = 0x01, |
| 616 | |
| 617 | JEG_BASE = 0x00, |
| 618 | JE_COMMIT = 0x02, |
| 619 | JE_DYNSB = 0x03, |
| 620 | JE_ANCHOR = 0x04, |
| 621 | JE_ERASECOUNT = 0x05, |
| 622 | JE_SPILLOUT = 0x06, |
| 623 | JE_OBJ_ALIAS = 0x0d, |
| 624 | JE_AREA = 0x0e, |
| 625 | |
| 626 | JE_LAST = 0x0e, |
| 627 | }; |
| 628 | |
| 629 | #endif |