Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | #ifndef _RAID10_H |
| 2 | #define _RAID10_H |
| 3 | |
Jonathan Brassow | dc280d98 | 2012-07-31 10:03:52 +1000 | [diff] [blame] | 4 | struct raid10_info { |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 5 | struct md_rdev *rdev, *replacement; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 6 | sector_t head_position; |
NeilBrown | 2bb7773 | 2011-07-27 11:00:36 +1000 | [diff] [blame] | 7 | int recovery_disabled; /* matches |
| 8 | * mddev->recovery_disabled |
| 9 | * when we shouldn't try |
| 10 | * recovering this device. |
| 11 | */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 12 | }; |
| 13 | |
NeilBrown | e879a87 | 2011-10-11 16:49:02 +1100 | [diff] [blame] | 14 | struct r10conf { |
NeilBrown | fd01b88 | 2011-10-11 16:47:53 +1100 | [diff] [blame] | 15 | struct mddev *mddev; |
Jonathan Brassow | dc280d98 | 2012-07-31 10:03:52 +1000 | [diff] [blame] | 16 | struct raid10_info *mirrors; |
| 17 | struct raid10_info *mirrors_new, *mirrors_old; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 18 | spinlock_t device_lock; |
| 19 | |
| 20 | /* geometry */ |
NeilBrown | 5cf00fc | 2012-05-21 09:28:20 +1000 | [diff] [blame] | 21 | struct geom { |
| 22 | int raid_disks; |
| 23 | int near_copies; /* number of copies laid out |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 24 | * raid0 style */ |
NeilBrown | 5cf00fc | 2012-05-21 09:28:20 +1000 | [diff] [blame] | 25 | int far_copies; /* number of copies laid out |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 26 | * at large strides across drives |
| 27 | */ |
NeilBrown | 5cf00fc | 2012-05-21 09:28:20 +1000 | [diff] [blame] | 28 | int far_offset; /* far_copies are offset by 1 |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 29 | * stripe instead of many |
NeilBrown | c93983b | 2006-06-26 00:27:41 -0700 | [diff] [blame] | 30 | */ |
NeilBrown | 5cf00fc | 2012-05-21 09:28:20 +1000 | [diff] [blame] | 31 | sector_t stride; /* distance between far copies. |
NeilBrown | c93983b | 2006-06-26 00:27:41 -0700 | [diff] [blame] | 32 | * This is size / far_copies unless |
| 33 | * far_offset, in which case it is |
| 34 | * 1 stripe. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 35 | */ |
Jonathan Brassow | 475901a | 2013-02-21 13:28:10 +1100 | [diff] [blame] | 36 | int far_set_size; /* The number of devices in a set, |
| 37 | * where a 'set' are devices that |
| 38 | * contain far/offset copies of |
| 39 | * each other. |
| 40 | */ |
NeilBrown | 5cf00fc | 2012-05-21 09:28:20 +1000 | [diff] [blame] | 41 | int chunk_shift; /* shift from chunks to sectors */ |
| 42 | sector_t chunk_mask; |
NeilBrown | f8c9e74 | 2012-05-21 09:28:33 +1000 | [diff] [blame] | 43 | } prev, geo; |
NeilBrown | 5cf00fc | 2012-05-21 09:28:20 +1000 | [diff] [blame] | 44 | int copies; /* near_copies * far_copies. |
| 45 | * must be <= raid_disks |
| 46 | */ |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 47 | |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 48 | sector_t dev_sectors; /* temp copy of |
| 49 | * mddev->dev_sectors */ |
NeilBrown | f8c9e74 | 2012-05-21 09:28:33 +1000 | [diff] [blame] | 50 | sector_t reshape_progress; |
NeilBrown | 3ea7daa | 2012-05-22 13:53:47 +1000 | [diff] [blame] | 51 | sector_t reshape_safe; |
| 52 | unsigned long reshape_checkpoint; |
| 53 | sector_t offset_diff; |
Trela, Maciej | dab8b29 | 2010-03-08 16:02:45 +1100 | [diff] [blame] | 54 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 55 | struct list_head retry_list; |
NeilBrown | 6cce3b2 | 2006-01-06 00:20:16 -0800 | [diff] [blame] | 56 | /* queue pending writes and submit them on unplug */ |
| 57 | struct bio_list pending_bio_list; |
NeilBrown | 34db0cd | 2011-10-11 16:50:01 +1100 | [diff] [blame] | 58 | int pending_count; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 59 | |
| 60 | spinlock_t resync_lock; |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 61 | int nr_pending; |
| 62 | int nr_waiting; |
| 63 | int nr_queued; |
| 64 | int barrier; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 65 | sector_t next_resync; |
NeilBrown | 6cce3b2 | 2006-01-06 00:20:16 -0800 | [diff] [blame] | 66 | int fullsync; /* set to 1 if a full sync is needed, |
| 67 | * (fresh device added). |
| 68 | * Cleared when a sync completes. |
| 69 | */ |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 70 | int have_replacement; /* There is at least one |
| 71 | * replacement device. |
| 72 | */ |
NeilBrown | 0a27ec9 | 2006-01-06 00:20:13 -0800 | [diff] [blame] | 73 | wait_queue_head_t wait_barrier; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 74 | |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 75 | mempool_t *r10bio_pool; |
| 76 | mempool_t *r10buf_pool; |
NeilBrown | 4443ae1 | 2006-01-06 00:20:28 -0800 | [diff] [blame] | 77 | struct page *tmppage; |
Trela, Maciej | dab8b29 | 2010-03-08 16:02:45 +1100 | [diff] [blame] | 78 | |
| 79 | /* When taking over an array from a different personality, we store |
| 80 | * the new thread here until we fully activate the array. |
| 81 | */ |
NeilBrown | 2b8bf34 | 2011-10-11 16:48:23 +1100 | [diff] [blame] | 82 | struct md_thread *thread; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 83 | }; |
| 84 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 85 | /* |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 86 | * this is our 'private' RAID10 bio. |
| 87 | * |
| 88 | * it contains information about what kind of IO operations were started |
| 89 | * for this RAID10 operation, and about their status: |
| 90 | */ |
| 91 | |
NeilBrown | 9f2c9d1 | 2011-10-11 16:48:43 +1100 | [diff] [blame] | 92 | struct r10bio { |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 93 | atomic_t remaining; /* 'have we finished' count, |
| 94 | * used from IRQ handlers |
| 95 | */ |
| 96 | sector_t sector; /* virtual sector number */ |
| 97 | int sectors; |
| 98 | unsigned long state; |
NeilBrown | fd01b88 | 2011-10-11 16:47:53 +1100 | [diff] [blame] | 99 | struct mddev *mddev; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 100 | /* |
| 101 | * original bio going to /dev/mdx |
| 102 | */ |
| 103 | struct bio *master_bio; |
| 104 | /* |
| 105 | * if the IO is in READ direction, then this is where we read |
| 106 | */ |
| 107 | int read_slot; |
| 108 | |
| 109 | struct list_head retry_list; |
| 110 | /* |
| 111 | * if the IO is in WRITE direction, then multiple bios are used, |
| 112 | * one for each copy. |
| 113 | * When resyncing we also use one for each copy. |
| 114 | * When reconstructing, we use 2 bios, one for read, one for write. |
| 115 | * We choose the number when they are allocated. |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 116 | * We sometimes need an extra bio to write to the replacement. |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 117 | */ |
NeilBrown | e0ee778 | 2012-08-18 09:51:42 +1000 | [diff] [blame] | 118 | struct r10dev { |
NeilBrown | 69335ef | 2011-12-23 10:17:54 +1100 | [diff] [blame] | 119 | struct bio *bio; |
| 120 | union { |
| 121 | struct bio *repl_bio; /* used for resync and |
| 122 | * writes */ |
| 123 | struct md_rdev *rdev; /* used for reads |
| 124 | * (read_slot >= 0) */ |
| 125 | }; |
| 126 | sector_t addr; |
| 127 | int devnum; |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 128 | } devs[0]; |
| 129 | }; |
| 130 | |
/*
 * Bit numbers used in r10bio.state.
 */
enum r10bio_state {
	R10BIO_Uptodate = 0,
	R10BIO_IsSync,
	R10BIO_IsRecover,
	R10BIO_IsReshape,
	R10BIO_Degraded,
	/*
	 * ReadError is set on bios that experience a read error so
	 * that raid10d knows what to do with them.
	 */
	R10BIO_ReadError,
	/*
	 * MadeGood is set if a write for this request means we can
	 * clear some known-bad-block records.
	 */
	R10BIO_MadeGood,
	R10BIO_WriteError,
	/*
	 * Previous is set when, during a reshape, the IO is being
	 * performed on the 'previous' part of the array.
	 */
	R10BIO_Previous,
};
Jonathan Brassow | cc4d1ef | 2012-07-31 10:03:53 +1000 | [diff] [blame] | 153 | |
/*
 * Prototype only; the definition is not part of this header.
 * NOTE(review): the meaning of 'bits' and of the return value is not
 * visible from here - confirm against the definition.
 */
int md_raid10_congested(struct mddev *mddev, int bits);
| 155 | |
Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 156 | #endif |