Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2007 Oracle. All rights reserved. |
| 3 | * |
| 4 | * This program is free software; you can redistribute it and/or |
| 5 | * modify it under the terms of the GNU General Public |
| 6 | * License v2 as published by the Free Software Foundation. |
| 7 | * |
| 8 | * This program is distributed in the hope that it will be useful, |
| 9 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 11 | * General Public License for more details. |
| 12 | * |
| 13 | * You should have received a copy of the GNU General Public |
| 14 | * License along with this program; if not, write to the |
| 15 | * Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
| 16 | * Boston, MA 02111-1307, USA. |
| 17 | */ |
| 18 | |
| 19 | #ifndef __BTRFS_ORDERED_DATA__ |
| 20 | #define __BTRFS_ORDERED_DATA__ |
| 21 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 22 | /* one of these per inode */ |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 23 | struct btrfs_ordered_inode_tree { |
Josef Bacik | 49958fd | 2010-02-02 21:48:28 +0000 | [diff] [blame] | 24 | spinlock_t lock; |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 25 | struct rb_root tree; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 26 | struct rb_node *last; |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 27 | }; |
| 28 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 29 | /* |
| 30 | * these are used to collect checksums done just before bios submission. |
| 31 | * They are attached via a list into the ordered extent, and |
| 32 | * checksum items are inserted into the tree after all the blocks in |
| 33 | * the ordered extent are on disk |
| 34 | */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 35 | struct btrfs_sector_sum { |
Chris Mason | d20f704 | 2008-12-08 16:58:54 -0500 | [diff] [blame] | 36 | /* bytenr on disk */ |
| 37 | u64 bytenr; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 38 | u32 sum; |
| 39 | }; |
| 40 | |
| 41 | struct btrfs_ordered_sum { |
Chris Mason | d20f704 | 2008-12-08 16:58:54 -0500 | [diff] [blame] | 42 | /* bytenr is the start of this extent on disk */ |
| 43 | u64 bytenr; |
| 44 | |
Chris Mason | 3edf7d3 | 2008-07-18 06:17:13 -0400 | [diff] [blame] | 45 | /* |
| 46 | * this is the length in bytes covered by the sums array below. |
Chris Mason | 3edf7d3 | 2008-07-18 06:17:13 -0400 | [diff] [blame] | 47 | */ |
| 48 | unsigned long len; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 49 | struct list_head list; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 50 | /* last field is a variable length array of btrfs_sector_sums */ |
Chris Mason | ed98b56 | 2008-07-22 23:06:42 -0400 | [diff] [blame] | 51 | struct btrfs_sector_sum sums[]; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 52 | }; |
| 53 | |
/*
 * bits for the flags field of struct btrfs_ordered_extent:
 *
 * BTRFS_ORDERED_IO_DONE is set when all of the blocks are written.
 * It is used to make sure metadata is inserted into the tree only once
 * per extent.
 *
 * BTRFS_ORDERED_COMPLETE is set when the extent is removed from the
 * rbtree, just before waking any waiters.  It is used to indicate the
 * IO is done and any metadata is inserted into the tree.
 */
#define BTRFS_ORDERED_IO_DONE 0 /* set when all the pages are written */

#define BTRFS_ORDERED_COMPLETE 1 /* set when removed from the tree */

#define BTRFS_ORDERED_NOCOW 2 /* set when we want to write in place */

#define BTRFS_ORDERED_COMPRESSED 3 /* writing a compressed extent */

#define BTRFS_ORDERED_PREALLOC 4 /* set when writing to prealloced extent */

#define BTRFS_ORDERED_DIRECT 5 /* set when we're doing DIO with this extent */

#define BTRFS_ORDERED_IOERR 6 /* We had an io error when writing this out */

#define BTRFS_ORDERED_UPDATED_ISIZE 7 /* indicates whether this ordered extent
				       * has done its due diligence in updating
				       * the isize. */

#define BTRFS_ORDERED_LOGGED_CSUM 8 /* We've logged the csums on this
				     * ordered extent */
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 84 | |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 85 | struct btrfs_ordered_extent { |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 86 | /* logical offset in the file */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 87 | u64 file_offset; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 88 | |
| 89 | /* disk byte number */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 90 | u64 start; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 91 | |
Chris Mason | c8b9781 | 2008-10-29 14:49:59 -0400 | [diff] [blame] | 92 | /* ram length of the extent in bytes */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 93 | u64 len; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 94 | |
Chris Mason | c8b9781 | 2008-10-29 14:49:59 -0400 | [diff] [blame] | 95 | /* extent length on disk */ |
| 96 | u64 disk_len; |
| 97 | |
Chris Mason | 8b62b72 | 2009-09-02 16:53:46 -0400 | [diff] [blame] | 98 | /* number of bytes that still need writing */ |
| 99 | u64 bytes_left; |
| 100 | |
Josef Bacik | 2ab28f3 | 2012-10-12 15:27:49 -0400 | [diff] [blame] | 101 | /* number of bytes that still need csumming */ |
| 102 | u64 csum_bytes_left; |
| 103 | |
Miao Xie | b9a8cc5 | 2012-09-06 04:01:21 -0600 | [diff] [blame] | 104 | /* |
| 105 | * the end of the ordered extent which is behind it but |
| 106 | * didn't update disk_i_size. Please see the comment of |
| 107 | * btrfs_ordered_update_i_size(); |
| 108 | */ |
| 109 | u64 outstanding_isize; |
| 110 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 111 | /* flags (described above) */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 112 | unsigned long flags; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 113 | |
Li Zefan | 261507a0 | 2010-12-17 14:21:50 +0800 | [diff] [blame] | 114 | /* compression algorithm */ |
| 115 | int compress_type; |
| 116 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 117 | /* reference count */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 118 | atomic_t refs; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 119 | |
Chris Mason | 3eaa288 | 2008-07-24 11:57:52 -0400 | [diff] [blame] | 120 | /* the inode we belong to */ |
| 121 | struct inode *inode; |
| 122 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 123 | /* list of checksums for insertion when the extent io is done */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 124 | struct list_head list; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 125 | |
Josef Bacik | 2ab28f3 | 2012-10-12 15:27:49 -0400 | [diff] [blame] | 126 | /* If we need to wait on this to be done */ |
| 127 | struct list_head log_list; |
| 128 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 129 | /* used to wait for the BTRFS_ORDERED_COMPLETE bit */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 130 | wait_queue_head_t wait; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 131 | |
| 132 | /* our friendly rbtree entry */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 133 | struct rb_node rb_node; |
Chris Mason | 3eaa288 | 2008-07-24 11:57:52 -0400 | [diff] [blame] | 134 | |
| 135 | /* a per root list of all the pending ordered extents */ |
| 136 | struct list_head root_extent_list; |
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 137 | |
| 138 | struct btrfs_work work; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 139 | |
Miao Xie | 9afab88 | 2012-10-25 09:41:36 +0000 | [diff] [blame] | 140 | struct completion completion; |
| 141 | struct btrfs_work flush_work; |
| 142 | struct list_head work_list; |
| 143 | }; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 144 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 145 | /* |
| 146 | * calculates the total size you need to allocate for an ordered sum |
| 147 | * structure spanning 'bytes' in the file |
| 148 | */ |
Chris Mason | 9ba4611 | 2008-07-23 09:26:26 -0400 | [diff] [blame] | 149 | static inline int btrfs_ordered_sum_size(struct btrfs_root *root, |
| 150 | unsigned long bytes) |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 151 | { |
| 152 | unsigned long num_sectors = (bytes + root->sectorsize - 1) / |
| 153 | root->sectorsize; |
Chris Mason | 3edf7d3 | 2008-07-18 06:17:13 -0400 | [diff] [blame] | 154 | num_sectors++; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 155 | return sizeof(struct btrfs_ordered_sum) + |
| 156 | num_sectors * sizeof(struct btrfs_sector_sum); |
| 157 | } |
| 158 | |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 159 | static inline void |
| 160 | btrfs_ordered_inode_tree_init(struct btrfs_ordered_inode_tree *t) |
| 161 | { |
Josef Bacik | 49958fd | 2010-02-02 21:48:28 +0000 | [diff] [blame] | 162 | spin_lock_init(&t->lock); |
Eric Paris | 6bef4d3 | 2010-02-23 19:43:04 +0000 | [diff] [blame] | 163 | t->tree = RB_ROOT; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 164 | t->last = NULL; |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 165 | } |
| 166 | |
Jeff Mahoney | 143bede | 2012-03-01 14:56:26 +0100 | [diff] [blame] | 167 | void btrfs_put_ordered_extent(struct btrfs_ordered_extent *entry); |
| 168 | void btrfs_remove_ordered_extent(struct inode *inode, |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 169 | struct btrfs_ordered_extent *entry); |
| 170 | int btrfs_dec_test_ordered_pending(struct inode *inode, |
Josef Bacik | 5a1a3df | 2010-02-02 20:51:14 +0000 | [diff] [blame] | 171 | struct btrfs_ordered_extent **cached, |
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 172 | u64 file_offset, u64 io_size, int uptodate); |
Chris Mason | 163cf09 | 2010-11-28 19:56:33 -0500 | [diff] [blame] | 173 | int btrfs_dec_test_first_ordered_pending(struct inode *inode, |
| 174 | struct btrfs_ordered_extent **cached, |
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 175 | u64 *file_offset, u64 io_size, |
| 176 | int uptodate); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 177 | int btrfs_add_ordered_extent(struct inode *inode, u64 file_offset, |
Josef Bacik | 4b46fce | 2010-05-23 11:00:55 -0400 | [diff] [blame] | 178 | u64 start, u64 len, u64 disk_len, int type); |
| 179 | int btrfs_add_ordered_extent_dio(struct inode *inode, u64 file_offset, |
| 180 | u64 start, u64 len, u64 disk_len, int type); |
Li Zefan | 261507a0 | 2010-12-17 14:21:50 +0800 | [diff] [blame] | 181 | int btrfs_add_ordered_extent_compress(struct inode *inode, u64 file_offset, |
| 182 | u64 start, u64 len, u64 disk_len, |
| 183 | int type, int compress_type); |
Jeff Mahoney | 143bede | 2012-03-01 14:56:26 +0100 | [diff] [blame] | 184 | void btrfs_add_ordered_sum(struct inode *inode, |
| 185 | struct btrfs_ordered_extent *entry, |
| 186 | struct btrfs_ordered_sum *sum); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 187 | struct btrfs_ordered_extent *btrfs_lookup_ordered_extent(struct inode *inode, |
| 188 | u64 file_offset); |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 189 | void btrfs_start_ordered_extent(struct inode *inode, |
| 190 | struct btrfs_ordered_extent *entry, int wait); |
Jeff Mahoney | 143bede | 2012-03-01 14:56:26 +0100 | [diff] [blame] | 191 | void btrfs_wait_ordered_range(struct inode *inode, u64 start, u64 len); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 192 | struct btrfs_ordered_extent * |
| 193 | btrfs_lookup_first_ordered_extent(struct inode * inode, u64 file_offset); |
Josef Bacik | 4b46fce | 2010-05-23 11:00:55 -0400 | [diff] [blame] | 194 | struct btrfs_ordered_extent *btrfs_lookup_ordered_range(struct inode *inode, |
| 195 | u64 file_offset, |
| 196 | u64 len); |
Yan, Zheng | c216775 | 2009-11-12 09:34:21 +0000 | [diff] [blame] | 197 | int btrfs_ordered_update_i_size(struct inode *inode, u64 offset, |
Chris Mason | dbe674a | 2008-07-17 12:54:05 -0400 | [diff] [blame] | 198 | struct btrfs_ordered_extent *ordered); |
Miao Xie | e4100d9 | 2013-04-05 07:20:56 +0000 | [diff] [blame] | 199 | int btrfs_find_ordered_sum(struct inode *inode, u64 offset, u64 disk_bytenr, |
| 200 | u32 *sum, int len); |
Josef Bacik | 569e0f3 | 2013-02-13 11:09:14 -0500 | [diff] [blame] | 201 | int btrfs_run_ordered_operations(struct btrfs_trans_handle *trans, |
| 202 | struct btrfs_root *root, int wait); |
Jeff Mahoney | 143bede | 2012-03-01 14:56:26 +0100 | [diff] [blame] | 203 | void btrfs_add_ordered_operation(struct btrfs_trans_handle *trans, |
| 204 | struct btrfs_root *root, |
| 205 | struct inode *inode); |
Liu Bo | 6bbe3a9 | 2012-09-14 02:58:07 -0600 | [diff] [blame] | 206 | void btrfs_wait_ordered_extents(struct btrfs_root *root, int delay_iput); |
Josef Bacik | 2ab28f3 | 2012-10-12 15:27:49 -0400 | [diff] [blame] | 207 | void btrfs_get_logged_extents(struct btrfs_root *log, struct inode *inode); |
| 208 | void btrfs_wait_logged_extents(struct btrfs_root *log, u64 transid); |
| 209 | void btrfs_free_logged_extents(struct btrfs_root *log, u64 transid); |
Miao Xie | 6352b91 | 2012-09-06 04:01:51 -0600 | [diff] [blame] | 210 | int __init ordered_data_init(void); |
| 211 | void ordered_data_exit(void); |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 212 | #endif |