Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame^] | 1 | /* |
| 2 | * JFFS2 -- Journalling Flash File System, Version 2. |
| 3 | * |
| 4 | * Copyright (C) 2001-2003 Red Hat, Inc. |
| 5 | * |
| 6 | * Created by David Woodhouse <dwmw2@infradead.org> |
| 7 | * |
| 8 | * For licensing information, see the file 'LICENCE' in this directory. |
| 9 | * |
| 10 | * $Id: build.c,v 1.69 2004/12/16 20:22:18 dmarlin Exp $ |
| 11 | * |
| 12 | */ |
| 13 | |
| 14 | #include <linux/kernel.h> |
| 15 | #include <linux/sched.h> |
| 16 | #include <linux/slab.h> |
| 17 | #include <linux/vmalloc.h> |
| 18 | #include <linux/mtd/mtd.h> |
| 19 | #include "nodelist.h" |
| 20 | |
| 21 | static void jffs2_build_remove_unlinked_inode(struct jffs2_sb_info *, struct jffs2_inode_cache *, struct jffs2_full_dirent **); |
| 22 | |
| 23 | static inline struct jffs2_inode_cache * |
| 24 | first_inode_chain(int *i, struct jffs2_sb_info *c) |
| 25 | { |
| 26 | for (; *i < INOCACHE_HASHSIZE; (*i)++) { |
| 27 | if (c->inocache_list[*i]) |
| 28 | return c->inocache_list[*i]; |
| 29 | } |
| 30 | return NULL; |
| 31 | } |
| 32 | |
| 33 | static inline struct jffs2_inode_cache * |
| 34 | next_inode(int *i, struct jffs2_inode_cache *ic, struct jffs2_sb_info *c) |
| 35 | { |
| 36 | /* More in this chain? */ |
| 37 | if (ic->next) |
| 38 | return ic->next; |
| 39 | (*i)++; |
| 40 | return first_inode_chain(i, c); |
| 41 | } |
| 42 | |
| 43 | #define for_each_inode(i, c, ic) \ |
| 44 | for (i = 0, ic = first_inode_chain(&i, (c)); \ |
| 45 | ic; \ |
| 46 | ic = next_inode(&i, ic, (c))) |
| 47 | |
| 48 | |
| 49 | static inline void jffs2_build_inode_pass1(struct jffs2_sb_info *c, struct jffs2_inode_cache *ic) |
| 50 | { |
| 51 | struct jffs2_full_dirent *fd; |
| 52 | |
| 53 | D1(printk(KERN_DEBUG "jffs2_build_inode building directory inode #%u\n", ic->ino)); |
| 54 | |
| 55 | /* For each child, increase nlink */ |
| 56 | for(fd = ic->scan_dents; fd; fd = fd->next) { |
| 57 | struct jffs2_inode_cache *child_ic; |
| 58 | if (!fd->ino) |
| 59 | continue; |
| 60 | |
| 61 | /* XXX: Can get high latency here with huge directories */ |
| 62 | |
| 63 | child_ic = jffs2_get_ino_cache(c, fd->ino); |
| 64 | if (!child_ic) { |
| 65 | printk(KERN_NOTICE "Eep. Child \"%s\" (ino #%u) of dir ino #%u doesn't exist!\n", |
| 66 | fd->name, fd->ino, ic->ino); |
| 67 | jffs2_mark_node_obsolete(c, fd->raw); |
| 68 | continue; |
| 69 | } |
| 70 | |
| 71 | if (child_ic->nlink++ && fd->type == DT_DIR) { |
| 72 | printk(KERN_NOTICE "Child dir \"%s\" (ino #%u) of dir ino #%u appears to be a hard link\n", fd->name, fd->ino, ic->ino); |
| 73 | if (fd->ino == 1 && ic->ino == 1) { |
| 74 | printk(KERN_NOTICE "This is mostly harmless, and probably caused by creating a JFFS2 image\n"); |
| 75 | printk(KERN_NOTICE "using a buggy version of mkfs.jffs2. Use at least v1.17.\n"); |
| 76 | } |
| 77 | /* What do we do about it? */ |
| 78 | } |
| 79 | D1(printk(KERN_DEBUG "Increased nlink for child \"%s\" (ino #%u)\n", fd->name, fd->ino)); |
| 80 | /* Can't free them. We might need them in pass 2 */ |
| 81 | } |
| 82 | } |
| 83 | |
| 84 | /* Scan plan: |
| 85 | - Scan physical nodes. Build map of inodes/dirents. Allocate inocaches as we go |
| 86 | - Scan directory tree from top down, setting nlink in inocaches |
| 87 | - Scan inocaches for inodes with nlink==0 |
| 88 | */ |
| 89 | static int jffs2_build_filesystem(struct jffs2_sb_info *c) |
| 90 | { |
| 91 | int ret; |
| 92 | int i; |
| 93 | struct jffs2_inode_cache *ic; |
| 94 | struct jffs2_full_dirent *fd; |
| 95 | struct jffs2_full_dirent *dead_fds = NULL; |
| 96 | |
| 97 | /* First, scan the medium and build all the inode caches with |
| 98 | lists of physical nodes */ |
| 99 | |
| 100 | c->flags |= JFFS2_SB_FLAG_MOUNTING; |
| 101 | ret = jffs2_scan_medium(c); |
| 102 | if (ret) |
| 103 | goto exit; |
| 104 | |
| 105 | D1(printk(KERN_DEBUG "Scanned flash completely\n")); |
| 106 | D2(jffs2_dump_block_lists(c)); |
| 107 | |
| 108 | /* Now scan the directory tree, increasing nlink according to every dirent found. */ |
| 109 | for_each_inode(i, c, ic) { |
| 110 | D1(printk(KERN_DEBUG "Pass 1: ino #%u\n", ic->ino)); |
| 111 | |
| 112 | D1(BUG_ON(ic->ino > c->highest_ino)); |
| 113 | |
| 114 | if (ic->scan_dents) { |
| 115 | jffs2_build_inode_pass1(c, ic); |
| 116 | cond_resched(); |
| 117 | } |
| 118 | } |
| 119 | c->flags &= ~JFFS2_SB_FLAG_MOUNTING; |
| 120 | |
| 121 | D1(printk(KERN_DEBUG "Pass 1 complete\n")); |
| 122 | |
| 123 | /* Next, scan for inodes with nlink == 0 and remove them. If |
| 124 | they were directories, then decrement the nlink of their |
| 125 | children too, and repeat the scan. As that's going to be |
| 126 | a fairly uncommon occurrence, it's not so evil to do it this |
| 127 | way. Recursion bad. */ |
| 128 | D1(printk(KERN_DEBUG "Pass 2 starting\n")); |
| 129 | |
| 130 | for_each_inode(i, c, ic) { |
| 131 | D1(printk(KERN_DEBUG "Pass 2: ino #%u, nlink %d, ic %p, nodes %p\n", ic->ino, ic->nlink, ic, ic->nodes)); |
| 132 | if (ic->nlink) |
| 133 | continue; |
| 134 | |
| 135 | jffs2_build_remove_unlinked_inode(c, ic, &dead_fds); |
| 136 | cond_resched(); |
| 137 | } |
| 138 | |
| 139 | D1(printk(KERN_DEBUG "Pass 2a starting\n")); |
| 140 | |
| 141 | while (dead_fds) { |
| 142 | fd = dead_fds; |
| 143 | dead_fds = fd->next; |
| 144 | |
| 145 | ic = jffs2_get_ino_cache(c, fd->ino); |
| 146 | D1(printk(KERN_DEBUG "Removing dead_fd ino #%u (\"%s\"), ic at %p\n", fd->ino, fd->name, ic)); |
| 147 | |
| 148 | if (ic) |
| 149 | jffs2_build_remove_unlinked_inode(c, ic, &dead_fds); |
| 150 | jffs2_free_full_dirent(fd); |
| 151 | } |
| 152 | |
| 153 | D1(printk(KERN_DEBUG "Pass 2 complete\n")); |
| 154 | |
| 155 | /* Finally, we can scan again and free the dirent structs */ |
| 156 | for_each_inode(i, c, ic) { |
| 157 | D1(printk(KERN_DEBUG "Pass 3: ino #%u, ic %p, nodes %p\n", ic->ino, ic, ic->nodes)); |
| 158 | |
| 159 | while(ic->scan_dents) { |
| 160 | fd = ic->scan_dents; |
| 161 | ic->scan_dents = fd->next; |
| 162 | jffs2_free_full_dirent(fd); |
| 163 | } |
| 164 | ic->scan_dents = NULL; |
| 165 | cond_resched(); |
| 166 | } |
| 167 | D1(printk(KERN_DEBUG "Pass 3 complete\n")); |
| 168 | D2(jffs2_dump_block_lists(c)); |
| 169 | |
| 170 | /* Rotate the lists by some number to ensure wear levelling */ |
| 171 | jffs2_rotate_lists(c); |
| 172 | |
| 173 | ret = 0; |
| 174 | |
| 175 | exit: |
| 176 | if (ret) { |
| 177 | for_each_inode(i, c, ic) { |
| 178 | while(ic->scan_dents) { |
| 179 | fd = ic->scan_dents; |
| 180 | ic->scan_dents = fd->next; |
| 181 | jffs2_free_full_dirent(fd); |
| 182 | } |
| 183 | } |
| 184 | } |
| 185 | |
| 186 | return ret; |
| 187 | } |
| 188 | |
| 189 | static void jffs2_build_remove_unlinked_inode(struct jffs2_sb_info *c, struct jffs2_inode_cache *ic, struct jffs2_full_dirent **dead_fds) |
| 190 | { |
| 191 | struct jffs2_raw_node_ref *raw; |
| 192 | struct jffs2_full_dirent *fd; |
| 193 | |
| 194 | D1(printk(KERN_DEBUG "JFFS2: Removing ino #%u with nlink == zero.\n", ic->ino)); |
| 195 | |
| 196 | raw = ic->nodes; |
| 197 | while (raw != (void *)ic) { |
| 198 | struct jffs2_raw_node_ref *next = raw->next_in_ino; |
| 199 | D1(printk(KERN_DEBUG "obsoleting node at 0x%08x\n", ref_offset(raw))); |
| 200 | jffs2_mark_node_obsolete(c, raw); |
| 201 | raw = next; |
| 202 | } |
| 203 | |
| 204 | if (ic->scan_dents) { |
| 205 | int whinged = 0; |
| 206 | D1(printk(KERN_DEBUG "Inode #%u was a directory which may have children...\n", ic->ino)); |
| 207 | |
| 208 | while(ic->scan_dents) { |
| 209 | struct jffs2_inode_cache *child_ic; |
| 210 | |
| 211 | fd = ic->scan_dents; |
| 212 | ic->scan_dents = fd->next; |
| 213 | |
| 214 | if (!fd->ino) { |
| 215 | /* It's a deletion dirent. Ignore it */ |
| 216 | D1(printk(KERN_DEBUG "Child \"%s\" is a deletion dirent, skipping...\n", fd->name)); |
| 217 | jffs2_free_full_dirent(fd); |
| 218 | continue; |
| 219 | } |
| 220 | if (!whinged) { |
| 221 | whinged = 1; |
| 222 | printk(KERN_NOTICE "Inode #%u was a directory with children - removing those too...\n", ic->ino); |
| 223 | } |
| 224 | |
| 225 | D1(printk(KERN_DEBUG "Removing child \"%s\", ino #%u\n", |
| 226 | fd->name, fd->ino)); |
| 227 | |
| 228 | child_ic = jffs2_get_ino_cache(c, fd->ino); |
| 229 | if (!child_ic) { |
| 230 | printk(KERN_NOTICE "Cannot remove child \"%s\", ino #%u, because it doesn't exist\n", fd->name, fd->ino); |
| 231 | jffs2_free_full_dirent(fd); |
| 232 | continue; |
| 233 | } |
| 234 | |
| 235 | /* Reduce nlink of the child. If it's now zero, stick it on the |
| 236 | dead_fds list to be cleaned up later. Else just free the fd */ |
| 237 | |
| 238 | child_ic->nlink--; |
| 239 | |
| 240 | if (!child_ic->nlink) { |
| 241 | D1(printk(KERN_DEBUG "Inode #%u (\"%s\") has now got zero nlink. Adding to dead_fds list.\n", |
| 242 | fd->ino, fd->name)); |
| 243 | fd->next = *dead_fds; |
| 244 | *dead_fds = fd; |
| 245 | } else { |
| 246 | D1(printk(KERN_DEBUG "Inode #%u (\"%s\") has now got nlink %d. Ignoring.\n", |
| 247 | fd->ino, fd->name, child_ic->nlink)); |
| 248 | jffs2_free_full_dirent(fd); |
| 249 | } |
| 250 | } |
| 251 | } |
| 252 | |
| 253 | /* |
| 254 | We don't delete the inocache from the hash list and free it yet. |
| 255 | The erase code will do that, when all the nodes are completely gone. |
| 256 | */ |
| 257 | } |
| 258 | |
| 259 | static void jffs2_calc_trigger_levels(struct jffs2_sb_info *c) |
| 260 | { |
| 261 | uint32_t size; |
| 262 | |
| 263 | /* Deletion should almost _always_ be allowed. We're fairly |
| 264 | buggered once we stop allowing people to delete stuff |
| 265 | because there's not enough free space... */ |
| 266 | c->resv_blocks_deletion = 2; |
| 267 | |
| 268 | /* Be conservative about how much space we need before we allow writes. |
| 269 | On top of that which is required for deletia, require an extra 2% |
| 270 | of the medium to be available, for overhead caused by nodes being |
| 271 | split across blocks, etc. */ |
| 272 | |
| 273 | size = c->flash_size / 50; /* 2% of flash size */ |
| 274 | size += c->nr_blocks * 100; /* And 100 bytes per eraseblock */ |
| 275 | size += c->sector_size - 1; /* ... and round up */ |
| 276 | |
| 277 | c->resv_blocks_write = c->resv_blocks_deletion + (size / c->sector_size); |
| 278 | |
| 279 | /* When do we let the GC thread run in the background */ |
| 280 | |
| 281 | c->resv_blocks_gctrigger = c->resv_blocks_write + 1; |
| 282 | |
| 283 | /* When do we allow garbage collection to merge nodes to make |
| 284 | long-term progress at the expense of short-term space exhaustion? */ |
| 285 | c->resv_blocks_gcmerge = c->resv_blocks_deletion + 1; |
| 286 | |
| 287 | /* When do we allow garbage collection to eat from bad blocks rather |
| 288 | than actually making progress? */ |
| 289 | c->resv_blocks_gcbad = 0;//c->resv_blocks_deletion + 2; |
| 290 | |
| 291 | /* If there's less than this amount of dirty space, don't bother |
| 292 | trying to GC to make more space. It'll be a fruitless task */ |
| 293 | c->nospc_dirty_size = c->sector_size + (c->flash_size / 100); |
| 294 | |
| 295 | D1(printk(KERN_DEBUG "JFFS2 trigger levels (size %d KiB, block size %d KiB, %d blocks)\n", |
| 296 | c->flash_size / 1024, c->sector_size / 1024, c->nr_blocks)); |
| 297 | D1(printk(KERN_DEBUG "Blocks required to allow deletion: %d (%d KiB)\n", |
| 298 | c->resv_blocks_deletion, c->resv_blocks_deletion*c->sector_size/1024)); |
| 299 | D1(printk(KERN_DEBUG "Blocks required to allow writes: %d (%d KiB)\n", |
| 300 | c->resv_blocks_write, c->resv_blocks_write*c->sector_size/1024)); |
| 301 | D1(printk(KERN_DEBUG "Blocks required to quiesce GC thread: %d (%d KiB)\n", |
| 302 | c->resv_blocks_gctrigger, c->resv_blocks_gctrigger*c->sector_size/1024)); |
| 303 | D1(printk(KERN_DEBUG "Blocks required to allow GC merges: %d (%d KiB)\n", |
| 304 | c->resv_blocks_gcmerge, c->resv_blocks_gcmerge*c->sector_size/1024)); |
| 305 | D1(printk(KERN_DEBUG "Blocks required to GC bad blocks: %d (%d KiB)\n", |
| 306 | c->resv_blocks_gcbad, c->resv_blocks_gcbad*c->sector_size/1024)); |
| 307 | D1(printk(KERN_DEBUG "Amount of dirty space required to GC: %d bytes\n", |
| 308 | c->nospc_dirty_size)); |
| 309 | } |
| 310 | |
| 311 | int jffs2_do_mount_fs(struct jffs2_sb_info *c) |
| 312 | { |
| 313 | int i; |
| 314 | |
| 315 | c->free_size = c->flash_size; |
| 316 | c->nr_blocks = c->flash_size / c->sector_size; |
| 317 | if (c->mtd->flags & MTD_NO_VIRTBLOCKS) |
| 318 | c->blocks = vmalloc(sizeof(struct jffs2_eraseblock) * c->nr_blocks); |
| 319 | else |
| 320 | c->blocks = kmalloc(sizeof(struct jffs2_eraseblock) * c->nr_blocks, GFP_KERNEL); |
| 321 | if (!c->blocks) |
| 322 | return -ENOMEM; |
| 323 | for (i=0; i<c->nr_blocks; i++) { |
| 324 | INIT_LIST_HEAD(&c->blocks[i].list); |
| 325 | c->blocks[i].offset = i * c->sector_size; |
| 326 | c->blocks[i].free_size = c->sector_size; |
| 327 | c->blocks[i].dirty_size = 0; |
| 328 | c->blocks[i].wasted_size = 0; |
| 329 | c->blocks[i].unchecked_size = 0; |
| 330 | c->blocks[i].used_size = 0; |
| 331 | c->blocks[i].first_node = NULL; |
| 332 | c->blocks[i].last_node = NULL; |
| 333 | c->blocks[i].bad_count = 0; |
| 334 | } |
| 335 | |
| 336 | init_MUTEX(&c->alloc_sem); |
| 337 | init_MUTEX(&c->erase_free_sem); |
| 338 | init_waitqueue_head(&c->erase_wait); |
| 339 | init_waitqueue_head(&c->inocache_wq); |
| 340 | spin_lock_init(&c->erase_completion_lock); |
| 341 | spin_lock_init(&c->inocache_lock); |
| 342 | |
| 343 | INIT_LIST_HEAD(&c->clean_list); |
| 344 | INIT_LIST_HEAD(&c->very_dirty_list); |
| 345 | INIT_LIST_HEAD(&c->dirty_list); |
| 346 | INIT_LIST_HEAD(&c->erasable_list); |
| 347 | INIT_LIST_HEAD(&c->erasing_list); |
| 348 | INIT_LIST_HEAD(&c->erase_pending_list); |
| 349 | INIT_LIST_HEAD(&c->erasable_pending_wbuf_list); |
| 350 | INIT_LIST_HEAD(&c->erase_complete_list); |
| 351 | INIT_LIST_HEAD(&c->free_list); |
| 352 | INIT_LIST_HEAD(&c->bad_list); |
| 353 | INIT_LIST_HEAD(&c->bad_used_list); |
| 354 | c->highest_ino = 1; |
| 355 | |
| 356 | if (jffs2_build_filesystem(c)) { |
| 357 | D1(printk(KERN_DEBUG "build_fs failed\n")); |
| 358 | jffs2_free_ino_caches(c); |
| 359 | jffs2_free_raw_node_refs(c); |
| 360 | if (c->mtd->flags & MTD_NO_VIRTBLOCKS) { |
| 361 | vfree(c->blocks); |
| 362 | } else { |
| 363 | kfree(c->blocks); |
| 364 | } |
| 365 | return -EIO; |
| 366 | } |
| 367 | |
| 368 | jffs2_calc_trigger_levels(c); |
| 369 | |
| 370 | return 0; |
| 371 | } |