Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2007 Oracle. All rights reserved. |
| 3 | * |
| 4 | * This program is free software; you can redistribute it and/or |
| 5 | * modify it under the terms of the GNU General Public |
| 6 | * License v2 as published by the Free Software Foundation. |
| 7 | * |
| 8 | * This program is distributed in the hope that it will be useful, |
| 9 | * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| 10 | * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| 11 | * General Public License for more details. |
| 12 | * |
| 13 | * You should have received a copy of the GNU General Public |
| 14 | * License along with this program; if not, write to the |
| 15 | * Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
| 16 | * Boston, MA 02111-1307, USA. |
| 17 | */ |
| 18 | |
| 19 | #ifndef __BTRFS_ORDERED_DATA__ |
| 20 | #define __BTRFS_ORDERED_DATA__ |
| 21 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 22 | /* one of these per inode */ |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 23 | struct btrfs_ordered_inode_tree { |
Josef Bacik | 49958fd | 2010-02-02 21:48:28 +0000 | [diff] [blame] | 24 | spinlock_t lock; |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 25 | struct rb_root tree; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 26 | struct rb_node *last; |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 27 | }; |
| 28 | |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 29 | struct btrfs_ordered_sum { |
Chris Mason | d20f704 | 2008-12-08 16:58:54 -0500 | [diff] [blame] | 30 | /* bytenr is the start of this extent on disk */ |
| 31 | u64 bytenr; |
| 32 | |
Chris Mason | 3edf7d3 | 2008-07-18 06:17:13 -0400 | [diff] [blame] | 33 | /* |
| 34 | * this is the length in bytes covered by the sums array below. |
Chris Mason | 3edf7d3 | 2008-07-18 06:17:13 -0400 | [diff] [blame] | 35 | */ |
Miao Xie | f51a4a1 | 2013-06-19 10:36:09 +0800 | [diff] [blame] | 36 | int len; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 37 | struct list_head list; |
Miao Xie | f51a4a1 | 2013-06-19 10:36:09 +0800 | [diff] [blame] | 38 | /* last field is a variable length array of csums */ |
| 39 | u32 sums[]; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 40 | }; |
| 41 | |
/*
 * Bits for the 'flags' field of struct btrfs_ordered_extent.
 *
 * Two of them deserve a longer explanation:
 *
 * BTRFS_ORDERED_IO_DONE is set once all of the blocks have been written.
 * It makes sure metadata is inserted into the tree only once per extent.
 *
 * BTRFS_ORDERED_COMPLETE is set when the extent is removed from the
 * rbtree, just before any waiters are woken.  It indicates that the IO is
 * done and any metadata has been inserted into the tree.
 */

/* set when all the pages are written */
#define BTRFS_ORDERED_IO_DONE		0

/* set when removed from the tree */
#define BTRFS_ORDERED_COMPLETE		1

/* set when we want to write in place */
#define BTRFS_ORDERED_NOCOW		2

/* writing a compressed extent */
#define BTRFS_ORDERED_COMPRESSED	3

/* set when writing to a preallocated extent */
#define BTRFS_ORDERED_PREALLOC		4

/* set when we're doing DIO with this extent */
#define BTRFS_ORDERED_DIRECT		5

/* we had an io error when writing this out */
#define BTRFS_ORDERED_IOERR		6

/*
 * indicates whether this ordered extent has done its due diligence in
 * updating the isize
 */
#define BTRFS_ORDERED_UPDATED_ISIZE	7

/* we've logged the csums on this ordered extent */
#define BTRFS_ORDERED_LOGGED_CSUM	8

/* set when we have to truncate an extent */
#define BTRFS_ORDERED_TRUNCATED		9

/* set when we've waited on this ordered extent in the logging code */
#define BTRFS_ORDERED_LOGGED		10

/* we are waiting for this ordered extent to complete in the current transaction */
#define BTRFS_ORDERED_PENDING		11

/* regular IO for COW */
#define BTRFS_ORDERED_REGULAR		12
| 79 | |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 80 | struct btrfs_ordered_extent { |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 81 | /* logical offset in the file */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 82 | u64 file_offset; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 83 | |
| 84 | /* disk byte number */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 85 | u64 start; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 86 | |
Chris Mason | c8b9781 | 2008-10-29 14:49:59 -0400 | [diff] [blame] | 87 | /* ram length of the extent in bytes */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 88 | u64 len; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 89 | |
Chris Mason | c8b9781 | 2008-10-29 14:49:59 -0400 | [diff] [blame] | 90 | /* extent length on disk */ |
| 91 | u64 disk_len; |
| 92 | |
Chris Mason | 8b62b72 | 2009-09-02 16:53:46 -0400 | [diff] [blame] | 93 | /* number of bytes that still need writing */ |
| 94 | u64 bytes_left; |
| 95 | |
Miao Xie | b9a8cc5 | 2012-09-06 04:01:21 -0600 | [diff] [blame] | 96 | /* |
| 97 | * the end of the ordered extent which is behind it but |
| 98 | * didn't update disk_i_size. Please see the comment of |
| 99 | * btrfs_ordered_update_i_size(); |
| 100 | */ |
| 101 | u64 outstanding_isize; |
| 102 | |
Josef Bacik | 77cef2e | 2013-08-29 13:57:21 -0400 | [diff] [blame] | 103 | /* |
| 104 | * If we get truncated we need to adjust the file extent we enter for |
| 105 | * this ordered extent so that we do not expose stale data. |
| 106 | */ |
| 107 | u64 truncated_len; |
| 108 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 109 | /* flags (described above) */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 110 | unsigned long flags; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 111 | |
Li Zefan | 261507a0 | 2010-12-17 14:21:50 +0800 | [diff] [blame] | 112 | /* compression algorithm */ |
| 113 | int compress_type; |
| 114 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 115 | /* reference count */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 116 | atomic_t refs; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 117 | |
Chris Mason | 3eaa288 | 2008-07-24 11:57:52 -0400 | [diff] [blame] | 118 | /* the inode we belong to */ |
| 119 | struct inode *inode; |
| 120 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 121 | /* list of checksums for insertion when the extent io is done */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 122 | struct list_head list; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 123 | |
Josef Bacik | 2ab28f3 | 2012-10-12 15:27:49 -0400 | [diff] [blame] | 124 | /* If we need to wait on this to be done */ |
| 125 | struct list_head log_list; |
| 126 | |
Josef Bacik | 50d9aa9 | 2014-11-21 14:52:38 -0500 | [diff] [blame] | 127 | /* If the transaction needs to wait on this ordered extent */ |
| 128 | struct list_head trans_list; |
| 129 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 130 | /* used to wait for the BTRFS_ORDERED_COMPLETE bit */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 131 | wait_queue_head_t wait; |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 132 | |
| 133 | /* our friendly rbtree entry */ |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 134 | struct rb_node rb_node; |
Chris Mason | 3eaa288 | 2008-07-24 11:57:52 -0400 | [diff] [blame] | 135 | |
| 136 | /* a per root list of all the pending ordered extents */ |
| 137 | struct list_head root_extent_list; |
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 138 | |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 139 | struct btrfs_work work; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 140 | |
Miao Xie | 9afab88 | 2012-10-25 09:41:36 +0000 | [diff] [blame] | 141 | struct completion completion; |
Qu Wenruo | d458b05 | 2014-02-28 10:46:19 +0800 | [diff] [blame] | 142 | struct btrfs_work flush_work; |
Miao Xie | 9afab88 | 2012-10-25 09:41:36 +0000 | [diff] [blame] | 143 | struct list_head work_list; |
| 144 | }; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 145 | |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 146 | /* |
| 147 | * calculates the total size you need to allocate for an ordered sum |
| 148 | * structure spanning 'bytes' in the file |
| 149 | */ |
Jeff Mahoney | da17066 | 2016-06-15 09:22:56 -0400 | [diff] [blame] | 150 | static inline int btrfs_ordered_sum_size(struct btrfs_fs_info *fs_info, |
Chris Mason | 9ba4611 | 2008-07-23 09:26:26 -0400 | [diff] [blame] | 151 | unsigned long bytes) |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 152 | { |
Jeff Mahoney | da17066 | 2016-06-15 09:22:56 -0400 | [diff] [blame] | 153 | int num_sectors = (int)DIV_ROUND_UP(bytes, fs_info->sectorsize); |
Miao Xie | f51a4a1 | 2013-06-19 10:36:09 +0800 | [diff] [blame] | 154 | return sizeof(struct btrfs_ordered_sum) + num_sectors * sizeof(u32); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 155 | } |
| 156 | |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 157 | static inline void |
| 158 | btrfs_ordered_inode_tree_init(struct btrfs_ordered_inode_tree *t) |
| 159 | { |
Josef Bacik | 49958fd | 2010-02-02 21:48:28 +0000 | [diff] [blame] | 160 | spin_lock_init(&t->lock); |
Eric Paris | 6bef4d3 | 2010-02-23 19:43:04 +0000 | [diff] [blame] | 161 | t->tree = RB_ROOT; |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 162 | t->last = NULL; |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 163 | } |
| 164 | |
Jeff Mahoney | 143bede | 2012-03-01 14:56:26 +0100 | [diff] [blame] | 165 | void btrfs_put_ordered_extent(struct btrfs_ordered_extent *entry); |
| 166 | void btrfs_remove_ordered_extent(struct inode *inode, |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 167 | struct btrfs_ordered_extent *entry); |
| 168 | int btrfs_dec_test_ordered_pending(struct inode *inode, |
Josef Bacik | 5a1a3df | 2010-02-02 20:51:14 +0000 | [diff] [blame] | 169 | struct btrfs_ordered_extent **cached, |
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 170 | u64 file_offset, u64 io_size, int uptodate); |
Chris Mason | 163cf09 | 2010-11-28 19:56:33 -0500 | [diff] [blame] | 171 | int btrfs_dec_test_first_ordered_pending(struct inode *inode, |
| 172 | struct btrfs_ordered_extent **cached, |
Josef Bacik | 5fd0204 | 2012-05-02 14:00:54 -0400 | [diff] [blame] | 173 | u64 *file_offset, u64 io_size, |
| 174 | int uptodate); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 175 | int btrfs_add_ordered_extent(struct inode *inode, u64 file_offset, |
Josef Bacik | 4b46fce | 2010-05-23 11:00:55 -0400 | [diff] [blame] | 176 | u64 start, u64 len, u64 disk_len, int type); |
| 177 | int btrfs_add_ordered_extent_dio(struct inode *inode, u64 file_offset, |
| 178 | u64 start, u64 len, u64 disk_len, int type); |
Li Zefan | 261507a0 | 2010-12-17 14:21:50 +0800 | [diff] [blame] | 179 | int btrfs_add_ordered_extent_compress(struct inode *inode, u64 file_offset, |
| 180 | u64 start, u64 len, u64 disk_len, |
| 181 | int type, int compress_type); |
Jeff Mahoney | 143bede | 2012-03-01 14:56:26 +0100 | [diff] [blame] | 182 | void btrfs_add_ordered_sum(struct inode *inode, |
| 183 | struct btrfs_ordered_extent *entry, |
| 184 | struct btrfs_ordered_sum *sum); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 185 | struct btrfs_ordered_extent *btrfs_lookup_ordered_extent(struct inode *inode, |
| 186 | u64 file_offset); |
Chris Mason | eb84ae0 | 2008-07-17 13:53:27 -0400 | [diff] [blame] | 187 | void btrfs_start_ordered_extent(struct inode *inode, |
| 188 | struct btrfs_ordered_extent *entry, int wait); |
Josef Bacik | 0ef8b72 | 2013-10-25 16:13:35 -0400 | [diff] [blame] | 189 | int btrfs_wait_ordered_range(struct inode *inode, u64 start, u64 len); |
Chris Mason | e6dcd2d | 2008-07-17 12:53:50 -0400 | [diff] [blame] | 190 | struct btrfs_ordered_extent * |
| 191 | btrfs_lookup_first_ordered_extent(struct inode * inode, u64 file_offset); |
Nikolay Borisov | a776c6f | 2017-02-20 13:50:49 +0200 | [diff] [blame] | 192 | struct btrfs_ordered_extent *btrfs_lookup_ordered_range( |
| 193 | struct btrfs_inode *inode, |
| 194 | u64 file_offset, |
| 195 | u64 len); |
Filipe Manana | b659ef0 | 2015-03-31 14:16:52 +0100 | [diff] [blame] | 196 | bool btrfs_have_ordered_extents_in_range(struct inode *inode, |
| 197 | u64 file_offset, |
| 198 | u64 len); |
Yan, Zheng | c216775 | 2009-11-12 09:34:21 +0000 | [diff] [blame] | 199 | int btrfs_ordered_update_i_size(struct inode *inode, u64 offset, |
Chris Mason | dbe674a | 2008-07-17 12:54:05 -0400 | [diff] [blame] | 200 | struct btrfs_ordered_extent *ordered); |
Miao Xie | e4100d9 | 2013-04-05 07:20:56 +0000 | [diff] [blame] | 201 | int btrfs_find_ordered_sum(struct inode *inode, u64 offset, u64 disk_bytenr, |
| 202 | u32 *sum, int len); |
Filipe Manana | 578def7 | 2016-04-26 15:36:38 +0100 | [diff] [blame] | 203 | int btrfs_wait_ordered_extents(struct btrfs_root *root, int nr, |
| 204 | const u64 range_start, const u64 range_len); |
Filipe Manana | f0e9b7d | 2016-05-14 09:12:53 +0100 | [diff] [blame] | 205 | int btrfs_wait_ordered_roots(struct btrfs_fs_info *fs_info, int nr, |
Filipe Manana | 578def7 | 2016-04-26 15:36:38 +0100 | [diff] [blame] | 206 | const u64 range_start, const u64 range_len); |
Nikolay Borisov | 2234663 | 2017-01-18 00:31:39 +0200 | [diff] [blame] | 207 | void btrfs_get_logged_extents(struct btrfs_inode *inode, |
Filipe Manana | 0870295 | 2014-11-13 17:00:35 +0000 | [diff] [blame] | 208 | struct list_head *logged_list, |
| 209 | const loff_t start, |
| 210 | const loff_t end); |
Miao Xie | 827463c | 2014-01-14 20:31:51 +0800 | [diff] [blame] | 211 | void btrfs_put_logged_extents(struct list_head *logged_list); |
| 212 | void btrfs_submit_logged_extents(struct list_head *logged_list, |
| 213 | struct btrfs_root *log); |
Josef Bacik | 50d9aa9 | 2014-11-21 14:52:38 -0500 | [diff] [blame] | 214 | void btrfs_wait_logged_extents(struct btrfs_trans_handle *trans, |
| 215 | struct btrfs_root *log, u64 transid); |
Josef Bacik | 2ab28f3 | 2012-10-12 15:27:49 -0400 | [diff] [blame] | 216 | void btrfs_free_logged_extents(struct btrfs_root *log, u64 transid); |
Miao Xie | 6352b91 | 2012-09-06 04:01:51 -0600 | [diff] [blame] | 217 | int __init ordered_data_init(void); |
| 218 | void ordered_data_exit(void); |
Chris Mason | dc17ff8 | 2008-01-08 15:46:30 -0500 | [diff] [blame] | 219 | #endif |