Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* |
| 2 | * Copyright 1999 Hans Reiser, see reiserfs/README for licensing and copyright details |
| 3 | */ |
| 4 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 5 | #include <linux/time.h> |
| 6 | #include <linux/pagemap.h> |
| 7 | #include <linux/buffer_head.h> |
| 8 | #include <linux/reiserfs_fs.h> |
| 9 | |
/* Access to the tail: anyone who is about to read the tail must first make
   sure that no tail conversion is running. direct2indirect and
   indirect2direct cannot run concurrently. */
| 12 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 13 | /* Converts direct items to an unformatted node. Panics if file has no |
| 14 | tail. -ENOSPC if no disk space for conversion */ |
| 15 | /* path points to first direct item of the file regarless of how many of |
| 16 | them are there */ |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 17 | int direct2indirect(struct reiserfs_transaction_handle *th, struct inode *inode, |
Josef "Jeff" Sipek | fec6d05 | 2006-12-08 02:36:32 -0800 | [diff] [blame] | 18 | struct treepath *path, struct buffer_head *unbh, |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 19 | loff_t tail_offset) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 20 | { |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 21 | struct super_block *sb = inode->i_sb; |
| 22 | struct buffer_head *up_to_date_bh; |
| 23 | struct item_head *p_le_ih = PATH_PITEM_HEAD(path); |
| 24 | unsigned long total_tail = 0; |
| 25 | struct cpu_key end_key; /* Key to search for the last byte of the |
| 26 | converted item. */ |
| 27 | struct item_head ind_ih; /* new indirect item to be inserted or |
| 28 | key of unfm pointer to be pasted */ |
| 29 | int n_blk_size, n_retval; /* returned value for reiserfs_insert_item and clones */ |
| 30 | unp_t unfm_ptr; /* Handle on an unformatted node |
| 31 | that will be inserted in the |
| 32 | tree. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 33 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 34 | BUG_ON(!th->t_trans_id); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 36 | REISERFS_SB(sb)->s_direct2indirect++; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 37 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 38 | n_blk_size = sb->s_blocksize; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 39 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 40 | /* and key to search for append or insert pointer to the new |
| 41 | unformatted node. */ |
| 42 | copy_item_head(&ind_ih, p_le_ih); |
| 43 | set_le_ih_k_offset(&ind_ih, tail_offset); |
| 44 | set_le_ih_k_type(&ind_ih, TYPE_INDIRECT); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 45 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 46 | /* Set the key to search for the place for new unfm pointer */ |
| 47 | make_cpu_key(&end_key, inode, tail_offset, TYPE_INDIRECT, 4); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 48 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 49 | // FIXME: we could avoid this |
| 50 | if (search_for_position_by_key(sb, &end_key, path) == POSITION_FOUND) { |
| 51 | reiserfs_warning(sb, "PAP-14030: direct2indirect: " |
| 52 | "pasted or inserted byte exists in the tree %K. " |
| 53 | "Use fsck to repair.", &end_key); |
| 54 | pathrelse(path); |
| 55 | return -EIO; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 56 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 57 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 58 | p_le_ih = PATH_PITEM_HEAD(path); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 59 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 60 | unfm_ptr = cpu_to_le32(unbh->b_blocknr); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 61 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 62 | if (is_statdata_le_ih(p_le_ih)) { |
| 63 | /* Insert new indirect item. */ |
| 64 | set_ih_free_space(&ind_ih, 0); /* delete at nearest future */ |
| 65 | put_ih_item_len(&ind_ih, UNFM_P_SIZE); |
| 66 | PATH_LAST_POSITION(path)++; |
| 67 | n_retval = |
| 68 | reiserfs_insert_item(th, path, &end_key, &ind_ih, inode, |
| 69 | (char *)&unfm_ptr); |
| 70 | } else { |
| 71 | /* Paste into last indirect item of an object. */ |
| 72 | n_retval = reiserfs_paste_into_item(th, path, &end_key, inode, |
| 73 | (char *)&unfm_ptr, |
| 74 | UNFM_P_SIZE); |
| 75 | } |
| 76 | if (n_retval) { |
| 77 | return n_retval; |
| 78 | } |
| 79 | // note: from here there are two keys which have matching first |
| 80 | // three key components. They only differ by the fourth one. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 81 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 82 | /* Set the key to search for the direct items of the file */ |
| 83 | make_cpu_key(&end_key, inode, max_reiserfs_offset(inode), TYPE_DIRECT, |
| 84 | 4); |
| 85 | |
| 86 | /* Move bytes from the direct items to the new unformatted node |
| 87 | and delete them. */ |
| 88 | while (1) { |
| 89 | int tail_size; |
| 90 | |
| 91 | /* end_key.k_offset is set so, that we will always have found |
| 92 | last item of the file */ |
| 93 | if (search_for_position_by_key(sb, &end_key, path) == |
| 94 | POSITION_FOUND) |
| 95 | reiserfs_panic(sb, |
| 96 | "PAP-14050: direct2indirect: " |
| 97 | "direct item (%K) not found", &end_key); |
| 98 | p_le_ih = PATH_PITEM_HEAD(path); |
| 99 | RFALSE(!is_direct_le_ih(p_le_ih), |
| 100 | "vs-14055: direct item expected(%K), found %h", |
| 101 | &end_key, p_le_ih); |
| 102 | tail_size = (le_ih_k_offset(p_le_ih) & (n_blk_size - 1)) |
| 103 | + ih_item_len(p_le_ih) - 1; |
| 104 | |
| 105 | /* we only send the unbh pointer if the buffer is not up to date. |
| 106 | ** this avoids overwriting good data from writepage() with old data |
| 107 | ** from the disk or buffer cache |
| 108 | ** Special case: unbh->b_page will be NULL if we are coming through |
| 109 | ** DIRECT_IO handler here. |
| 110 | */ |
| 111 | if (!unbh->b_page || buffer_uptodate(unbh) |
| 112 | || PageUptodate(unbh->b_page)) { |
| 113 | up_to_date_bh = NULL; |
| 114 | } else { |
| 115 | up_to_date_bh = unbh; |
| 116 | } |
| 117 | n_retval = reiserfs_delete_item(th, path, &end_key, inode, |
| 118 | up_to_date_bh); |
| 119 | |
| 120 | total_tail += n_retval; |
| 121 | if (tail_size == n_retval) |
| 122 | // done: file does not have direct items anymore |
| 123 | break; |
| 124 | |
| 125 | } |
| 126 | /* if we've copied bytes from disk into the page, we need to zero |
| 127 | ** out the unused part of the block (it was not up to date before) |
| 128 | */ |
| 129 | if (up_to_date_bh) { |
| 130 | unsigned pgoff = |
| 131 | (tail_offset + total_tail - 1) & (PAGE_CACHE_SIZE - 1); |
| 132 | char *kaddr = kmap_atomic(up_to_date_bh->b_page, KM_USER0); |
| 133 | memset(kaddr + pgoff, 0, n_blk_size - total_tail); |
| 134 | kunmap_atomic(kaddr, KM_USER0); |
| 135 | } |
| 136 | |
| 137 | REISERFS_I(inode)->i_first_direct_byte = U32_MAX; |
| 138 | |
| 139 | return 0; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 140 | } |
| 141 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 142 | /* stolen from fs/buffer.c */ |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 143 | void reiserfs_unmap_buffer(struct buffer_head *bh) |
| 144 | { |
| 145 | lock_buffer(bh); |
| 146 | if (buffer_journaled(bh) || buffer_journal_dirty(bh)) { |
| 147 | BUG(); |
| 148 | } |
| 149 | clear_buffer_dirty(bh); |
| 150 | /* Remove the buffer from whatever list it belongs to. We are mostly |
| 151 | interested in removing it from per-sb j_dirty_buffers list, to avoid |
| 152 | BUG() on attempt to write not mapped buffer */ |
| 153 | if ((!list_empty(&bh->b_assoc_buffers) || bh->b_private) && bh->b_page) { |
| 154 | struct inode *inode = bh->b_page->mapping->host; |
| 155 | struct reiserfs_journal *j = SB_JOURNAL(inode->i_sb); |
| 156 | spin_lock(&j->j_dirty_buffers_lock); |
| 157 | list_del_init(&bh->b_assoc_buffers); |
| 158 | reiserfs_free_jh(bh); |
| 159 | spin_unlock(&j->j_dirty_buffers_lock); |
| 160 | } |
| 161 | clear_buffer_mapped(bh); |
| 162 | clear_buffer_req(bh); |
| 163 | clear_buffer_new(bh); |
| 164 | bh->b_bdev = NULL; |
| 165 | unlock_buffer(bh); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 166 | } |
| 167 | |
| 168 | /* this first locks inode (neither reads nor sync are permitted), |
| 169 | reads tail through page cache, insert direct item. When direct item |
| 170 | inserted successfully inode is left locked. Return value is always |
| 171 | what we expect from it (number of cut bytes). But when tail remains |
| 172 | in the unformatted node, we set mode to SKIP_BALANCING and unlock |
| 173 | inode */ |
Josef "Jeff" Sipek | fec6d05 | 2006-12-08 02:36:32 -0800 | [diff] [blame] | 174 | int indirect2direct(struct reiserfs_transaction_handle *th, struct inode *p_s_inode, struct page *page, struct treepath *p_s_path, /* path to the indirect item. */ |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 175 | const struct cpu_key *p_s_item_key, /* Key to look for unformatted node pointer to be cut. */ |
| 176 | loff_t n_new_file_size, /* New file size. */ |
| 177 | char *p_c_mode) |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 178 | { |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 179 | struct super_block *p_s_sb = p_s_inode->i_sb; |
| 180 | struct item_head s_ih; |
| 181 | unsigned long n_block_size = p_s_sb->s_blocksize; |
| 182 | char *tail; |
| 183 | int tail_len, round_tail_len; |
| 184 | loff_t pos, pos1; /* position of first byte of the tail */ |
| 185 | struct cpu_key key; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 186 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 187 | BUG_ON(!th->t_trans_id); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 188 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 189 | REISERFS_SB(p_s_sb)->s_indirect2direct++; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 190 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 191 | *p_c_mode = M_SKIP_BALANCING; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 192 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 193 | /* store item head path points to. */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 194 | copy_item_head(&s_ih, PATH_PITEM_HEAD(p_s_path)); |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 195 | |
| 196 | tail_len = (n_new_file_size & (n_block_size - 1)); |
| 197 | if (get_inode_sd_version(p_s_inode) == STAT_DATA_V2) |
| 198 | round_tail_len = ROUND_UP(tail_len); |
| 199 | else |
| 200 | round_tail_len = tail_len; |
| 201 | |
| 202 | pos = |
| 203 | le_ih_k_offset(&s_ih) - 1 + (ih_item_len(&s_ih) / UNFM_P_SIZE - |
| 204 | 1) * p_s_sb->s_blocksize; |
| 205 | pos1 = pos; |
| 206 | |
Jes Sorensen | 1b1dcc1 | 2006-01-09 15:59:24 -0800 | [diff] [blame] | 207 | // we are protected by i_mutex. The tail can not disapper, not |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 208 | // append can be done either |
| 209 | // we are in truncate or packing tail in file_release |
| 210 | |
| 211 | tail = (char *)kmap(page); /* this can schedule */ |
| 212 | |
| 213 | if (path_changed(&s_ih, p_s_path)) { |
| 214 | /* re-search indirect item */ |
| 215 | if (search_for_position_by_key(p_s_sb, p_s_item_key, p_s_path) |
| 216 | == POSITION_NOT_FOUND) |
| 217 | reiserfs_panic(p_s_sb, |
| 218 | "PAP-5520: indirect2direct: " |
| 219 | "item to be converted %K does not exist", |
| 220 | p_s_item_key); |
| 221 | copy_item_head(&s_ih, PATH_PITEM_HEAD(p_s_path)); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 222 | #ifdef CONFIG_REISERFS_CHECK |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 223 | pos = le_ih_k_offset(&s_ih) - 1 + |
| 224 | (ih_item_len(&s_ih) / UNFM_P_SIZE - |
| 225 | 1) * p_s_sb->s_blocksize; |
| 226 | if (pos != pos1) |
| 227 | reiserfs_panic(p_s_sb, "vs-5530: indirect2direct: " |
| 228 | "tail position changed while we were reading it"); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 229 | #endif |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 230 | } |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 231 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 232 | /* Set direct item header to insert. */ |
| 233 | make_le_item_head(&s_ih, NULL, get_inode_item_key_version(p_s_inode), |
| 234 | pos1 + 1, TYPE_DIRECT, round_tail_len, |
| 235 | 0xffff /*ih_free_space */ ); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 236 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 237 | /* we want a pointer to the first byte of the tail in the page. |
| 238 | ** the page was locked and this part of the page was up to date when |
| 239 | ** indirect2direct was called, so we know the bytes are still valid |
| 240 | */ |
| 241 | tail = tail + (pos & (PAGE_CACHE_SIZE - 1)); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 242 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 243 | PATH_LAST_POSITION(p_s_path)++; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 244 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 245 | key = *p_s_item_key; |
| 246 | set_cpu_key_k_type(&key, TYPE_DIRECT); |
| 247 | key.key_length = 4; |
| 248 | /* Insert tail as new direct item in the tree */ |
| 249 | if (reiserfs_insert_item(th, p_s_path, &key, &s_ih, p_s_inode, |
| 250 | tail ? tail : NULL) < 0) { |
| 251 | /* No disk memory. So we can not convert last unformatted node |
| 252 | to the direct item. In this case we used to adjust |
| 253 | indirect items's ih_free_space. Now ih_free_space is not |
| 254 | used, it would be ideal to write zeros to corresponding |
| 255 | unformatted node. For now i_size is considered as guard for |
| 256 | going out of file size */ |
| 257 | kunmap(page); |
| 258 | return n_block_size - round_tail_len; |
| 259 | } |
| 260 | kunmap(page); |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 261 | |
Linus Torvalds | bd4c625 | 2005-07-12 20:21:28 -0700 | [diff] [blame] | 262 | /* make sure to get the i_blocks changes from reiserfs_insert_item */ |
| 263 | reiserfs_update_sd(th, p_s_inode); |
| 264 | |
| 265 | // note: we have now the same as in above direct2indirect |
| 266 | // conversion: there are two keys which have matching first three |
| 267 | // key components. They only differ by the fouhth one. |
| 268 | |
| 269 | /* We have inserted new direct item and must remove last |
| 270 | unformatted node. */ |
| 271 | *p_c_mode = M_CUT; |
| 272 | |
| 273 | /* we store position of first direct item in the in-core inode */ |
| 274 | //mark_file_with_tail (p_s_inode, pos1 + 1); |
| 275 | REISERFS_I(p_s_inode)->i_first_direct_byte = pos1 + 1; |
| 276 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 277 | return n_block_size - round_tail_len; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 278 | } |