/*
 * Copyright (C) 2003 Sistina Software Limited.
 * Copyright (C) 2004-2005 Red Hat, Inc. All rights reserved.
 *
 * This file is released under the GPL.
 */

#include <linux/device-mapper.h>

#include "dm.h"
#include "dm-path-selector.h"
#include "dm-uevent.h"

#include <linux/ctype.h>
#include <linux/init.h>
#include <linux/mempool.h>
#include <linux/module.h>
#include <linux/pagemap.h>
#include <linux/slab.h>
#include <linux/time.h>
#include <linux/workqueue.h>
#include <linux/delay.h>
#include <scsi/scsi_dh.h>
#include <linux/atomic.h>

#define DM_MSG_PREFIX "multipath"
#define DM_PG_INIT_DELAY_MSECS 2000
#define DM_PG_INIT_DELAY_DEFAULT ((unsigned) -1)

/* Path properties */
struct pgpath {
	struct list_head list;

	struct priority_group *pg;	/* Owning PG */
	unsigned is_active;		/* Path status */
	unsigned fail_count;		/* Cumulative failure count */

	struct dm_path path;
	struct delayed_work activate_path;
};

#define path_to_pgpath(__pgp) container_of((__pgp), struct pgpath, path)

/*
 * Paths are grouped into Priority Groups and numbered from 1 upwards.
 * Each has a path selector which controls which path gets used.
 */
struct priority_group {
	struct list_head list;

	struct multipath *m;		/* Owning multipath instance */
	struct path_selector ps;

	unsigned pg_num;		/* Reference number */
	unsigned bypassed;		/* Temporarily bypass this PG? */

	unsigned nr_pgpaths;		/* Number of paths in PG */
	struct list_head pgpaths;
};

/* Multipath context */
struct multipath {
	struct list_head list;
	struct dm_target *ti;

	const char *hw_handler_name;
	char *hw_handler_params;

	spinlock_t lock;

	unsigned nr_priority_groups;
	struct list_head priority_groups;

	wait_queue_head_t pg_init_wait;	/* Wait for pg_init completion */

	unsigned pg_init_required;	/* pg_init needs calling? */
	unsigned pg_init_in_progress;	/* Only one pg_init allowed at once */
	unsigned pg_init_delay_retry;	/* Delay pg_init retry? */

	unsigned nr_valid_paths;	/* Total number of usable paths */
	struct pgpath *current_pgpath;
	struct priority_group *current_pg;
	struct priority_group *next_pg;	/* Switch to this PG if set */
	unsigned repeat_count;		/* I/Os left before calling PS again */

	unsigned queue_io:1;		/* Must we queue all I/O? */
	unsigned queue_if_no_path:1;	/* Queue I/O if last path fails? */
	unsigned saved_queue_if_no_path:1; /* Saved state during suspension */
	unsigned retain_attached_hw_handler:1; /* If there's already a hw_handler present, don't change it. */
	unsigned pg_init_disabled:1;	/* pg_init is not currently allowed */

	unsigned pg_init_retries;	/* Number of times to retry pg_init */
	unsigned pg_init_count;		/* Number of times pg_init called */
	unsigned pg_init_delay_msecs;	/* Number of msecs before pg_init retry */

	unsigned queue_size;
	struct work_struct process_queued_ios;
	struct list_head queued_ios;

	struct work_struct trigger_event;

	/*
	 * We must use a mempool of dm_mpath_io structs so that we
	 * can resubmit bios on error.
	 */
	mempool_t *mpio_pool;

	struct mutex work_mutex;
};

/*
 * Context information attached to each bio we process.
 */
struct dm_mpath_io {
	struct pgpath *pgpath;
	size_t nr_bytes;
};

typedef int (*action_fn) (struct pgpath *pgpath);

static struct kmem_cache *_mpio_cache;

static struct workqueue_struct *kmultipathd, *kmpath_handlerd;
static void process_queued_ios(struct work_struct *work);
static void trigger_event(struct work_struct *work);
static void activate_path(struct work_struct *work);


/*-----------------------------------------------
 * Allocation routines
 *-----------------------------------------------*/

static struct pgpath *alloc_pgpath(void)
{
	struct pgpath *pgpath = kzalloc(sizeof(*pgpath), GFP_KERNEL);

	if (pgpath) {
		pgpath->is_active = 1;
		INIT_DELAYED_WORK(&pgpath->activate_path, activate_path);
	}

	return pgpath;
}

static void free_pgpath(struct pgpath *pgpath)
{
	kfree(pgpath);
}

static struct priority_group *alloc_priority_group(void)
{
	struct priority_group *pg;

	pg = kzalloc(sizeof(*pg), GFP_KERNEL);

	if (pg)
		INIT_LIST_HEAD(&pg->pgpaths);

	return pg;
}

static void free_pgpaths(struct list_head *pgpaths, struct dm_target *ti)
{
	struct pgpath *pgpath, *tmp;
	struct multipath *m = ti->private;

	list_for_each_entry_safe(pgpath, tmp, pgpaths, list) {
		list_del(&pgpath->list);
		if (m->hw_handler_name)
			scsi_dh_detach(bdev_get_queue(pgpath->path.dev->bdev));
		dm_put_device(ti, pgpath->path.dev);
		free_pgpath(pgpath);
	}
}

static void free_priority_group(struct priority_group *pg,
				struct dm_target *ti)
{
	struct path_selector *ps = &pg->ps;

	if (ps->type) {
		ps->type->destroy(ps);
		dm_put_path_selector(ps->type);
	}

	free_pgpaths(&pg->pgpaths, ti);
	kfree(pg);
}

static struct multipath *alloc_multipath(struct dm_target *ti)
{
	struct multipath *m;
	unsigned min_ios = dm_get_reserved_rq_based_ios();

	m = kzalloc(sizeof(*m), GFP_KERNEL);
	if (m) {
		INIT_LIST_HEAD(&m->priority_groups);
		INIT_LIST_HEAD(&m->queued_ios);
		spin_lock_init(&m->lock);
		m->queue_io = 1;
		m->pg_init_delay_msecs = DM_PG_INIT_DELAY_DEFAULT;
		INIT_WORK(&m->process_queued_ios, process_queued_ios);
		INIT_WORK(&m->trigger_event, trigger_event);
		init_waitqueue_head(&m->pg_init_wait);
		mutex_init(&m->work_mutex);
		m->mpio_pool = mempool_create_slab_pool(min_ios, _mpio_cache);
		if (!m->mpio_pool) {
			kfree(m);
			return NULL;
		}
		m->ti = ti;
		ti->private = m;
	}

	return m;
}

static void free_multipath(struct multipath *m)
{
	struct priority_group *pg, *tmp;

	list_for_each_entry_safe(pg, tmp, &m->priority_groups, list) {
		list_del(&pg->list);
		free_priority_group(pg, m->ti);
	}

	kfree(m->hw_handler_name);
	kfree(m->hw_handler_params);
	mempool_destroy(m->mpio_pool);
	kfree(m);
}

static int set_mapinfo(struct multipath *m, union map_info *info)
{
	struct dm_mpath_io *mpio;

	mpio = mempool_alloc(m->mpio_pool, GFP_ATOMIC);
	if (!mpio)
		return -ENOMEM;

	memset(mpio, 0, sizeof(*mpio));
	info->ptr = mpio;

	return 0;
}

static void clear_mapinfo(struct multipath *m, union map_info *info)
{
	struct dm_mpath_io *mpio = info->ptr;

	info->ptr = NULL;
	mempool_free(mpio, m->mpio_pool);
}

/*-----------------------------------------------
 * Path selection
 *-----------------------------------------------*/

static void __pg_init_all_paths(struct multipath *m)
{
	struct pgpath *pgpath;
	unsigned long pg_init_delay = 0;

	if (m->pg_init_in_progress || m->pg_init_disabled)
		return;

	m->pg_init_count++;
	m->pg_init_required = 0;
	if (m->pg_init_delay_retry)
		pg_init_delay = msecs_to_jiffies(m->pg_init_delay_msecs != DM_PG_INIT_DELAY_DEFAULT ?
						 m->pg_init_delay_msecs : DM_PG_INIT_DELAY_MSECS);
	list_for_each_entry(pgpath, &m->current_pg->pgpaths, list) {
		/* Skip failed paths */
		if (!pgpath->is_active)
			continue;
		if (queue_delayed_work(kmpath_handlerd, &pgpath->activate_path,
				       pg_init_delay))
			m->pg_init_in_progress++;
	}
}

static void __switch_pg(struct multipath *m, struct pgpath *pgpath)
{
	m->current_pg = pgpath->pg;

	/* Must we initialise the PG first, and queue I/O till it's ready? */
	if (m->hw_handler_name) {
		m->pg_init_required = 1;
		m->queue_io = 1;
	} else {
		m->pg_init_required = 0;
		m->queue_io = 0;
	}

	m->pg_init_count = 0;
}

static int __choose_path_in_pg(struct multipath *m, struct priority_group *pg,
			       size_t nr_bytes)
{
	struct dm_path *path;

	path = pg->ps.type->select_path(&pg->ps, &m->repeat_count, nr_bytes);
	if (!path)
		return -ENXIO;

	m->current_pgpath = path_to_pgpath(path);

	if (m->current_pg != pg)
		__switch_pg(m, m->current_pgpath);

	return 0;
}

static void __choose_pgpath(struct multipath *m, size_t nr_bytes)
{
	struct priority_group *pg;
	unsigned bypassed = 1;

	if (!m->nr_valid_paths)
		goto failed;

	/* Were we instructed to switch PG? */
	if (m->next_pg) {
		pg = m->next_pg;
		m->next_pg = NULL;
		if (!__choose_path_in_pg(m, pg, nr_bytes))
			return;
	}

	/* Don't change PG until it has no remaining paths */
	if (m->current_pg && !__choose_path_in_pg(m, m->current_pg, nr_bytes))
		return;

	/*
	 * Loop through priority groups until we find a valid path.
	 * First time we skip PGs marked 'bypassed'.
	 * Second time we only try the ones we skipped, but set
	 * pg_init_delay_retry so we do not hammer controllers.
	 */
	do {
		list_for_each_entry(pg, &m->priority_groups, list) {
			if (pg->bypassed == bypassed)
				continue;
			if (!__choose_path_in_pg(m, pg, nr_bytes)) {
				if (!bypassed)
					m->pg_init_delay_retry = 1;
				return;
			}
		}
	} while (bypassed--);

failed:
	m->current_pgpath = NULL;
	m->current_pg = NULL;
}

/*
 * Check whether bios must be queued in the device-mapper core rather
 * than here in the target.
 *
 * m->lock must be held on entry.
 *
 * If m->queue_if_no_path and m->saved_queue_if_no_path hold the
 * same value then we are not between multipath_presuspend()
 * and multipath_resume() calls and we have no need to check
 * for the DMF_NOFLUSH_SUSPENDING flag.
 */
static int __must_push_back(struct multipath *m)
{
	return (m->queue_if_no_path != m->saved_queue_if_no_path &&
		dm_noflush_suspending(m->ti));
}

static int map_io(struct multipath *m, struct request *clone,
		  union map_info *map_context, unsigned was_queued)
{
	int r = DM_MAPIO_REMAPPED;
	size_t nr_bytes = blk_rq_bytes(clone);
	unsigned long flags;
	struct pgpath *pgpath;
	struct block_device *bdev;
	struct dm_mpath_io *mpio = map_context->ptr;

	spin_lock_irqsave(&m->lock, flags);

	/* Do we need to select a new pgpath? */
	if (!m->current_pgpath ||
	    (!m->queue_io && (m->repeat_count && --m->repeat_count == 0)))
		__choose_pgpath(m, nr_bytes);

	pgpath = m->current_pgpath;

	if (was_queued)
		m->queue_size--;

	if (m->pg_init_required) {
		if (!m->pg_init_in_progress)
			queue_work(kmultipathd, &m->process_queued_ios);
		r = DM_MAPIO_REQUEUE;
	} else if ((pgpath && m->queue_io) ||
		   (!pgpath && m->queue_if_no_path)) {
		/* Queue for the daemon to resubmit */
		list_add_tail(&clone->queuelist, &m->queued_ios);
		m->queue_size++;
		if (!m->queue_io)
			queue_work(kmultipathd, &m->process_queued_ios);
		pgpath = NULL;
		r = DM_MAPIO_SUBMITTED;
	} else if (pgpath) {
		bdev = pgpath->path.dev->bdev;
		clone->q = bdev_get_queue(bdev);
		clone->rq_disk = bdev->bd_disk;
	} else if (__must_push_back(m))
		r = DM_MAPIO_REQUEUE;
	else
		r = -EIO;	/* Failed */

	mpio->pgpath = pgpath;
	mpio->nr_bytes = nr_bytes;

	if (r == DM_MAPIO_REMAPPED && pgpath->pg->ps.type->start_io)
		pgpath->pg->ps.type->start_io(&pgpath->pg->ps, &pgpath->path,
					      nr_bytes);

	spin_unlock_irqrestore(&m->lock, flags);

	return r;
}

/*
 * If we run out of usable paths, should we queue I/O or error it?
 */
static int queue_if_no_path(struct multipath *m, unsigned queue_if_no_path,
			    unsigned save_old_value)
{
	unsigned long flags;

	spin_lock_irqsave(&m->lock, flags);

	if (save_old_value)
		m->saved_queue_if_no_path = m->queue_if_no_path;
	else
		m->saved_queue_if_no_path = queue_if_no_path;
	m->queue_if_no_path = queue_if_no_path;
	if (!m->queue_if_no_path && m->queue_size)
		queue_work(kmultipathd, &m->process_queued_ios);

	spin_unlock_irqrestore(&m->lock, flags);

	return 0;
}

/*-----------------------------------------------------------------
 * The multipath daemon is responsible for resubmitting queued ios.
 *---------------------------------------------------------------*/

static void dispatch_queued_ios(struct multipath *m)
{
	int r;
	unsigned long flags;
	union map_info *info;
	struct request *clone, *n;
	LIST_HEAD(cl);

	spin_lock_irqsave(&m->lock, flags);
	list_splice_init(&m->queued_ios, &cl);
	spin_unlock_irqrestore(&m->lock, flags);

	list_for_each_entry_safe(clone, n, &cl, queuelist) {
		list_del_init(&clone->queuelist);

		info = dm_get_rq_mapinfo(clone);

		r = map_io(m, clone, info, 1);
		if (r < 0) {
			clear_mapinfo(m, info);
			dm_kill_unmapped_request(clone, r);
		} else if (r == DM_MAPIO_REMAPPED)
			dm_dispatch_request(clone);
		else if (r == DM_MAPIO_REQUEUE) {
			clear_mapinfo(m, info);
			dm_requeue_unmapped_request(clone);
		}
	}
}

static void process_queued_ios(struct work_struct *work)
{
	struct multipath *m =
		container_of(work, struct multipath, process_queued_ios);
	struct pgpath *pgpath = NULL;
	unsigned must_queue = 1;
	unsigned long flags;

	spin_lock_irqsave(&m->lock, flags);

	if (!m->current_pgpath)
		__choose_pgpath(m, 0);

	pgpath = m->current_pgpath;

	if ((pgpath && !m->queue_io) ||
	    (!pgpath && !m->queue_if_no_path))
		must_queue = 0;

	if (pgpath && m->pg_init_required)
		__pg_init_all_paths(m);

	spin_unlock_irqrestore(&m->lock, flags);
	if (!must_queue)
		dispatch_queued_ios(m);
}

/*
 * An event is triggered whenever a path is taken out of use.
 * Includes path failure and PG bypass.
 */
static void trigger_event(struct work_struct *work)
{
	struct multipath *m =
		container_of(work, struct multipath, trigger_event);

	dm_table_event(m->ti->table);
}

/*-----------------------------------------------------------------
 * Constructor/argument parsing:
 * <#multipath feature args> [<arg>]*
 * <#hw_handler args> [hw_handler [<arg>]*]
 * <#priority groups>
 * <initial priority group>
 *     [<selector> <#selector args> [<arg>]*
 *      <#paths> <#per-path selector args>
 *         [<path> [<arg>]* ]+ ]+
 *---------------------------------------------------------------*/
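/*
 * Purely illustrative example (device numbers are hypothetical, not taken
 * from this file): with no feature args, no hardware handler and two
 * round-robin priority groups, a table line conforming to the format above
 * could look like:
 *
 *   0 0 2 1 round-robin 0 2 1 8:16 1000 8:32 1000 round-robin 0 1 1 8:48 1000
 */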
static int parse_path_selector(struct dm_arg_set *as, struct priority_group *pg,
			       struct dm_target *ti)
{
	int r;
	struct path_selector_type *pst;
	unsigned ps_argc;

	static struct dm_arg _args[] = {
		{0, 1024, "invalid number of path selector args"},
	};

	pst = dm_get_path_selector(dm_shift_arg(as));
	if (!pst) {
		ti->error = "unknown path selector type";
		return -EINVAL;
	}

	r = dm_read_arg_group(_args, as, &ps_argc, &ti->error);
	if (r) {
		dm_put_path_selector(pst);
		return -EINVAL;
	}

	r = pst->create(&pg->ps, ps_argc, as->argv);
	if (r) {
		dm_put_path_selector(pst);
		ti->error = "path selector constructor failed";
		return r;
	}

	pg->ps.type = pst;
	dm_consume_args(as, ps_argc);

	return 0;
}

static struct pgpath *parse_path(struct dm_arg_set *as, struct path_selector *ps,
			       struct dm_target *ti)
{
	int r;
	struct pgpath *p;
	struct multipath *m = ti->private;
	struct request_queue *q = NULL;
	const char *attached_handler_name;

	/* we need at least a path arg */
	if (as->argc < 1) {
		ti->error = "no device given";
		return ERR_PTR(-EINVAL);
	}

	p = alloc_pgpath();
	if (!p)
		return ERR_PTR(-ENOMEM);

	r = dm_get_device(ti, dm_shift_arg(as), dm_table_get_mode(ti->table),
			  &p->path.dev);
	if (r) {
		ti->error = "error getting device";
		goto bad;
	}

	if (m->retain_attached_hw_handler || m->hw_handler_name)
		q = bdev_get_queue(p->path.dev->bdev);

	if (m->retain_attached_hw_handler) {
		attached_handler_name = scsi_dh_attached_handler_name(q, GFP_KERNEL);
		if (attached_handler_name) {
			/*
			 * Reset hw_handler_name to match the attached handler
			 * and clear any hw_handler_params associated with the
			 * ignored handler.
			 *
			 * NB. This modifies the table line to show the actual
			 * handler instead of the original table passed in.
			 */
			kfree(m->hw_handler_name);
			m->hw_handler_name = attached_handler_name;

			kfree(m->hw_handler_params);
			m->hw_handler_params = NULL;
		}
	}

	if (m->hw_handler_name) {
		/*
		 * Increments scsi_dh reference, even when using an
		 * already-attached handler.
		 */
		r = scsi_dh_attach(q, m->hw_handler_name);
		if (r == -EBUSY) {
			/*
			 * Already attached to different hw_handler:
			 * try to reattach with correct one.
			 */
			scsi_dh_detach(q);
			r = scsi_dh_attach(q, m->hw_handler_name);
		}

		if (r < 0) {
			ti->error = "error attaching hardware handler";
			dm_put_device(ti, p->path.dev);
			goto bad;
		}

		if (m->hw_handler_params) {
			r = scsi_dh_set_params(q, m->hw_handler_params);
			if (r < 0) {
				ti->error = "unable to set hardware "
							"handler parameters";
				scsi_dh_detach(q);
				dm_put_device(ti, p->path.dev);
				goto bad;
			}
		}
	}

	r = ps->type->add_path(ps, &p->path, as->argc, as->argv, &ti->error);
	if (r) {
		dm_put_device(ti, p->path.dev);
		goto bad;
	}

	return p;

 bad:
	free_pgpath(p);
	return ERR_PTR(r);
}

static struct priority_group *parse_priority_group(struct dm_arg_set *as,
						   struct multipath *m)
{
	static struct dm_arg _args[] = {
		{1, 1024, "invalid number of paths"},
		{0, 1024, "invalid number of selector args"}
	};

	int r;
	unsigned i, nr_selector_args, nr_args;
	struct priority_group *pg;
	struct dm_target *ti = m->ti;

	if (as->argc < 2) {
		as->argc = 0;
		ti->error = "not enough priority group arguments";
		return ERR_PTR(-EINVAL);
	}

	pg = alloc_priority_group();
	if (!pg) {
		ti->error = "couldn't allocate priority group";
		return ERR_PTR(-ENOMEM);
	}
	pg->m = m;

	r = parse_path_selector(as, pg, ti);
	if (r)
		goto bad;

	/*
	 * read the paths
	 */
	r = dm_read_arg(_args, as, &pg->nr_pgpaths, &ti->error);
	if (r)
		goto bad;

	r = dm_read_arg(_args + 1, as, &nr_selector_args, &ti->error);
	if (r)
		goto bad;

	nr_args = 1 + nr_selector_args;
	for (i = 0; i < pg->nr_pgpaths; i++) {
		struct pgpath *pgpath;
		struct dm_arg_set path_args;

		if (as->argc < nr_args) {
			ti->error = "not enough path parameters";
			r = -EINVAL;
			goto bad;
		}

		path_args.argc = nr_args;
		path_args.argv = as->argv;

		pgpath = parse_path(&path_args, &pg->ps, ti);
		if (IS_ERR(pgpath)) {
			r = PTR_ERR(pgpath);
			goto bad;
		}

		pgpath->pg = pg;
		list_add_tail(&pgpath->list, &pg->pgpaths);
		dm_consume_args(as, nr_args);
	}

	return pg;

 bad:
	free_priority_group(pg, ti);
	return ERR_PTR(r);
}

static int parse_hw_handler(struct dm_arg_set *as, struct multipath *m)
{
	unsigned hw_argc;
	int ret;
	struct dm_target *ti = m->ti;

	static struct dm_arg _args[] = {
		{0, 1024, "invalid number of hardware handler args"},
	};

	if (dm_read_arg_group(_args, as, &hw_argc, &ti->error))
		return -EINVAL;

	if (!hw_argc)
		return 0;

	m->hw_handler_name = kstrdup(dm_shift_arg(as), GFP_KERNEL);
	if (!try_then_request_module(scsi_dh_handler_exist(m->hw_handler_name),
				     "scsi_dh_%s", m->hw_handler_name)) {
		ti->error = "unknown hardware handler type";
		ret = -EINVAL;
		goto fail;
	}

	if (hw_argc > 1) {
		char *p;
		int i, j, len = 4;

		for (i = 0; i <= hw_argc - 2; i++)
			len += strlen(as->argv[i]) + 1;
		p = m->hw_handler_params = kzalloc(len, GFP_KERNEL);
		if (!p) {
			ti->error = "memory allocation failed";
			ret = -ENOMEM;
			goto fail;
		}
		j = sprintf(p, "%d", hw_argc - 1);
		for (i = 0, p+=j+1; i <= hw_argc - 2; i++, p+=j+1)
			j = sprintf(p, "%s", as->argv[i]);
	}
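	/*
	 * Note: the loop above leaves hw_handler_params holding the argument
	 * count followed by each argument, each terminated by '\0' (the
	 * "p += j + 1" steps skip past the terminators).  For example, a
	 * table that supplied two handler arguments would yield
	 * "2\0arg1\0arg2" (argument names here are illustrative only).
	 */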
Mike Snitzer498f0102011-08-02 12:32:04 +0100780 dm_consume_args(as, hw_argc - 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700781
782 return 0;
Chandra Seetharaman2bfd2e12009-08-03 12:42:45 -0700783fail:
784 kfree(m->hw_handler_name);
785 m->hw_handler_name = NULL;
786 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700787}
788
Mike Snitzer498f0102011-08-02 12:32:04 +0100789static int parse_features(struct dm_arg_set *as, struct multipath *m)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700790{
791 int r;
792 unsigned argc;
Micha³ Miros³aw28f16c22006-10-03 01:15:33 -0700793 struct dm_target *ti = m->ti;
Mike Snitzer498f0102011-08-02 12:32:04 +0100794 const char *arg_name;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700795
Mike Snitzer498f0102011-08-02 12:32:04 +0100796 static struct dm_arg _args[] = {
Mike Snitzera58a9352012-07-27 15:08:04 +0100797 {0, 6, "invalid number of feature args"},
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100798 {1, 50, "pg_init_retries must be between 1 and 50"},
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +0000799 {0, 60000, "pg_init_delay_msecs must be between 0 and 60000"},
Linus Torvalds1da177e2005-04-16 15:20:36 -0700800 };
801
Mike Snitzer498f0102011-08-02 12:32:04 +0100802 r = dm_read_arg_group(_args, as, &argc, &ti->error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700803 if (r)
804 return -EINVAL;
805
806 if (!argc)
807 return 0;
808
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100809 do {
Mike Snitzer498f0102011-08-02 12:32:04 +0100810 arg_name = dm_shift_arg(as);
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100811 argc--;
812
Mike Snitzer498f0102011-08-02 12:32:04 +0100813 if (!strcasecmp(arg_name, "queue_if_no_path")) {
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100814 r = queue_if_no_path(m, 1, 0);
815 continue;
816 }
817
Mike Snitzera58a9352012-07-27 15:08:04 +0100818 if (!strcasecmp(arg_name, "retain_attached_hw_handler")) {
819 m->retain_attached_hw_handler = 1;
820 continue;
821 }
822
Mike Snitzer498f0102011-08-02 12:32:04 +0100823 if (!strcasecmp(arg_name, "pg_init_retries") &&
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100824 (argc >= 1)) {
Mike Snitzer498f0102011-08-02 12:32:04 +0100825 r = dm_read_arg(_args + 1, as, &m->pg_init_retries, &ti->error);
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100826 argc--;
827 continue;
828 }
829
Mike Snitzer498f0102011-08-02 12:32:04 +0100830 if (!strcasecmp(arg_name, "pg_init_delay_msecs") &&
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +0000831 (argc >= 1)) {
Mike Snitzer498f0102011-08-02 12:32:04 +0100832 r = dm_read_arg(_args + 2, as, &m->pg_init_delay_msecs, &ti->error);
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +0000833 argc--;
834 continue;
835 }
836
Linus Torvalds1da177e2005-04-16 15:20:36 -0700837 ti->error = "Unrecognised multipath feature request";
Dave Wysochanskic9e45582007-10-19 22:47:53 +0100838 r = -EINVAL;
839 } while (argc && !r);
840
841 return r;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700842}
843
844static int multipath_ctr(struct dm_target *ti, unsigned int argc,
845 char **argv)
846{
Mike Snitzer498f0102011-08-02 12:32:04 +0100847 /* target arguments */
848 static struct dm_arg _args[] = {
Mike Snitzera490a072011-03-24 13:54:33 +0000849 {0, 1024, "invalid number of priority groups"},
850 {0, 1024, "invalid initial priority group number"},
Linus Torvalds1da177e2005-04-16 15:20:36 -0700851 };
852
853 int r;
854 struct multipath *m;
Mike Snitzer498f0102011-08-02 12:32:04 +0100855 struct dm_arg_set as;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700856 unsigned pg_count = 0;
857 unsigned next_pg_num;
858
859 as.argc = argc;
860 as.argv = argv;
861
Micha³ Miros³aw28f16c22006-10-03 01:15:33 -0700862 m = alloc_multipath(ti);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700863 if (!m) {
Alasdair G Kergon72d94862006-06-26 00:27:35 -0700864 ti->error = "can't allocate multipath";
Linus Torvalds1da177e2005-04-16 15:20:36 -0700865 return -EINVAL;
866 }
867
Micha³ Miros³aw28f16c22006-10-03 01:15:33 -0700868 r = parse_features(&as, m);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700869 if (r)
870 goto bad;
871
Micha³ Miros³aw28f16c22006-10-03 01:15:33 -0700872 r = parse_hw_handler(&as, m);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700873 if (r)
874 goto bad;
875
Mike Snitzer498f0102011-08-02 12:32:04 +0100876 r = dm_read_arg(_args, &as, &m->nr_priority_groups, &ti->error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700877 if (r)
878 goto bad;
879
Mike Snitzer498f0102011-08-02 12:32:04 +0100880 r = dm_read_arg(_args + 1, &as, &next_pg_num, &ti->error);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700881 if (r)
882 goto bad;
883
Mike Snitzera490a072011-03-24 13:54:33 +0000884 if ((!m->nr_priority_groups && next_pg_num) ||
885 (m->nr_priority_groups && !next_pg_num)) {
886 ti->error = "invalid initial priority group";
887 r = -EINVAL;
888 goto bad;
889 }
890
Linus Torvalds1da177e2005-04-16 15:20:36 -0700891 /* parse the priority groups */
892 while (as.argc) {
893 struct priority_group *pg;
894
Micha³ Miros³aw28f16c22006-10-03 01:15:33 -0700895 pg = parse_priority_group(&as, m);
Benjamin Marzinski01460f32008-10-10 13:36:57 +0100896 if (IS_ERR(pg)) {
897 r = PTR_ERR(pg);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700898 goto bad;
899 }
900
901 m->nr_valid_paths += pg->nr_pgpaths;
902 list_add_tail(&pg->list, &m->priority_groups);
903 pg_count++;
904 pg->pg_num = pg_count;
905 if (!--next_pg_num)
906 m->next_pg = pg;
907 }
908
909 if (pg_count != m->nr_priority_groups) {
Alasdair G Kergon72d94862006-06-26 00:27:35 -0700910 ti->error = "priority group count mismatch";
Linus Torvalds1da177e2005-04-16 15:20:36 -0700911 r = -EINVAL;
912 goto bad;
913 }
914
Alasdair G Kergon55a62ee2013-03-01 22:45:47 +0000915 ti->num_flush_bios = 1;
916 ti->num_discard_bios = 1;
Mike Snitzer042bcef2013-05-10 14:37:16 +0100917 ti->num_write_same_bios = 1;
Mikulas Patocka86279212009-06-22 10:12:24 +0100918
Linus Torvalds1da177e2005-04-16 15:20:36 -0700919 return 0;
920
921 bad:
922 free_multipath(m);
923 return r;
924}
925
Kiyoshi Ueda2bded7b2010-03-06 02:32:13 +0000926static void multipath_wait_for_pg_init_completion(struct multipath *m)
927{
928 DECLARE_WAITQUEUE(wait, current);
929 unsigned long flags;
930
931 add_wait_queue(&m->pg_init_wait, &wait);
932
933 while (1) {
934 set_current_state(TASK_UNINTERRUPTIBLE);
935
936 spin_lock_irqsave(&m->lock, flags);
937 if (!m->pg_init_in_progress) {
938 spin_unlock_irqrestore(&m->lock, flags);
939 break;
940 }
941 spin_unlock_irqrestore(&m->lock, flags);
942
943 io_schedule();
944 }
945 set_current_state(TASK_RUNNING);
946
947 remove_wait_queue(&m->pg_init_wait, &wait);
948}
949
950static void flush_multipath_work(struct multipath *m)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700951{
Shiva Krishna Merla954a73d2013-10-30 03:26:38 +0000952 unsigned long flags;
953
954 spin_lock_irqsave(&m->lock, flags);
955 m->pg_init_disabled = 1;
956 spin_unlock_irqrestore(&m->lock, flags);
957
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -0700958 flush_workqueue(kmpath_handlerd);
Kiyoshi Ueda2bded7b2010-03-06 02:32:13 +0000959 multipath_wait_for_pg_init_completion(m);
Alasdair G Kergona044d012005-07-12 15:53:02 -0700960 flush_workqueue(kmultipathd);
Tejun Heo43829732012-08-20 14:51:24 -0700961 flush_work(&m->trigger_event);
Shiva Krishna Merla954a73d2013-10-30 03:26:38 +0000962
963 spin_lock_irqsave(&m->lock, flags);
964 m->pg_init_disabled = 0;
965 spin_unlock_irqrestore(&m->lock, flags);
Kiyoshi Ueda6df400a2009-12-10 23:52:19 +0000966}
967
968static void multipath_dtr(struct dm_target *ti)
969{
970 struct multipath *m = ti->private;
971
Kiyoshi Ueda2bded7b2010-03-06 02:32:13 +0000972 flush_multipath_work(m);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700973 free_multipath(m);
974}
975
976/*
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +0100977 * Map cloned requests
Linus Torvalds1da177e2005-04-16 15:20:36 -0700978 */
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +0100979static int multipath_map(struct dm_target *ti, struct request *clone,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700980 union map_info *map_context)
981{
982 int r;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700983 struct multipath *m = (struct multipath *) ti->private;
984
Jun'ichi Nomura466891f2012-03-28 18:41:25 +0100985 if (set_mapinfo(m, map_context) < 0)
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +0100986 /* ENOMEM, requeue */
987 return DM_MAPIO_REQUEUE;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700988
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +0100989 clone->cmd_flags |= REQ_FAILFAST_TRANSPORT;
Jun'ichi Nomura466891f2012-03-28 18:41:25 +0100990 r = map_io(m, clone, map_context, 0);
Kiyoshi Ueda45e15722006-12-08 02:41:10 -0800991 if (r < 0 || r == DM_MAPIO_REQUEUE)
Jun'ichi Nomura466891f2012-03-28 18:41:25 +0100992 clear_mapinfo(m, map_context);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700993
994 return r;
995}
996
997/*
998 * Take a path out of use.
999 */
1000static int fail_path(struct pgpath *pgpath)
1001{
1002 unsigned long flags;
1003 struct multipath *m = pgpath->pg->m;
1004
1005 spin_lock_irqsave(&m->lock, flags);
1006
Kiyoshi Ueda66800732008-10-10 13:36:58 +01001007 if (!pgpath->is_active)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001008 goto out;
1009
Alasdair G Kergon72d94862006-06-26 00:27:35 -07001010 DMWARN("Failing path %s.", pgpath->path.dev->name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001011
1012 pgpath->pg->ps.type->fail_path(&pgpath->pg->ps, &pgpath->path);
Kiyoshi Ueda66800732008-10-10 13:36:58 +01001013 pgpath->is_active = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001014 pgpath->fail_count++;
1015
1016 m->nr_valid_paths--;
1017
1018 if (pgpath == m->current_pgpath)
1019 m->current_pgpath = NULL;
1020
Mike Andersonb15546f2007-10-19 22:48:02 +01001021 dm_path_uevent(DM_UEVENT_PATH_FAILED, m->ti,
1022 pgpath->path.dev->name, m->nr_valid_paths);
1023
Alasdair G Kergonfe9cf302009-01-06 03:05:13 +00001024 schedule_work(&m->trigger_event);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001025
1026out:
1027 spin_unlock_irqrestore(&m->lock, flags);
1028
1029 return 0;
1030}
1031
1032/*
1033 * Reinstate a previously-failed path
1034 */
1035static int reinstate_path(struct pgpath *pgpath)
1036{
1037 int r = 0;
1038 unsigned long flags;
1039 struct multipath *m = pgpath->pg->m;
1040
1041 spin_lock_irqsave(&m->lock, flags);
1042
Kiyoshi Ueda66800732008-10-10 13:36:58 +01001043 if (pgpath->is_active)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001044 goto out;
1045
Alasdair G Kergondef052d2008-07-21 12:00:31 +01001046 if (!pgpath->pg->ps.type->reinstate_path) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001047 DMWARN("Reinstate path not supported by path selector %s",
1048 pgpath->pg->ps.type->name);
1049 r = -EINVAL;
1050 goto out;
1051 }
1052
1053 r = pgpath->pg->ps.type->reinstate_path(&pgpath->pg->ps, &pgpath->path);
1054 if (r)
1055 goto out;
1056
Kiyoshi Ueda66800732008-10-10 13:36:58 +01001057 pgpath->is_active = 1;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001058
Chandra Seetharamane54f77d2009-06-22 10:12:12 +01001059 if (!m->nr_valid_paths++ && m->queue_size) {
1060 m->current_pgpath = NULL;
Alasdair G Kergonc5573082005-05-05 16:16:07 -07001061 queue_work(kmultipathd, &m->process_queued_ios);
Chandra Seetharamane54f77d2009-06-22 10:12:12 +01001062 } else if (m->hw_handler_name && (m->current_pg == pgpath->pg)) {
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001063 if (queue_work(kmpath_handlerd, &pgpath->activate_path.work))
Chandra Seetharamane54f77d2009-06-22 10:12:12 +01001064 m->pg_init_in_progress++;
1065 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001066
Mike Andersonb15546f2007-10-19 22:48:02 +01001067 dm_path_uevent(DM_UEVENT_PATH_REINSTATED, m->ti,
1068 pgpath->path.dev->name, m->nr_valid_paths);
1069
Alasdair G Kergonfe9cf302009-01-06 03:05:13 +00001070 schedule_work(&m->trigger_event);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001071
1072out:
1073 spin_unlock_irqrestore(&m->lock, flags);
1074
1075 return r;
1076}
1077
1078/*
1079 * Fail or reinstate all paths that match the provided struct dm_dev.
1080 */
1081static int action_dev(struct multipath *m, struct dm_dev *dev,
1082 action_fn action)
1083{
Mike Snitzer19040c02011-03-24 13:54:31 +00001084 int r = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001085 struct pgpath *pgpath;
1086 struct priority_group *pg;
1087
1088 list_for_each_entry(pg, &m->priority_groups, list) {
1089 list_for_each_entry(pgpath, &pg->pgpaths, list) {
1090 if (pgpath->path.dev == dev)
1091 r = action(pgpath);
1092 }
1093 }
1094
1095 return r;
1096}
1097
1098/*
1099 * Temporarily try to avoid having to use the specified PG
1100 */
1101static void bypass_pg(struct multipath *m, struct priority_group *pg,
1102 int bypassed)
1103{
1104 unsigned long flags;
1105
1106 spin_lock_irqsave(&m->lock, flags);
1107
1108 pg->bypassed = bypassed;
1109 m->current_pgpath = NULL;
1110 m->current_pg = NULL;
1111
1112 spin_unlock_irqrestore(&m->lock, flags);
1113
Alasdair G Kergonfe9cf302009-01-06 03:05:13 +00001114 schedule_work(&m->trigger_event);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001115}
1116
1117/*
1118 * Switch to using the specified PG from the next I/O that gets mapped
1119 */
1120static int switch_pg_num(struct multipath *m, const char *pgstr)
1121{
1122 struct priority_group *pg;
1123 unsigned pgnum;
1124 unsigned long flags;
Mikulas Patocka31998ef2012-03-28 18:41:26 +01001125 char dummy;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001126
Mikulas Patocka31998ef2012-03-28 18:41:26 +01001127 if (!pgstr || (sscanf(pgstr, "%u%c", &pgnum, &dummy) != 1) || !pgnum ||
Linus Torvalds1da177e2005-04-16 15:20:36 -07001128 (pgnum > m->nr_priority_groups)) {
1129 DMWARN("invalid PG number supplied to switch_pg_num");
1130 return -EINVAL;
1131 }
1132
1133 spin_lock_irqsave(&m->lock, flags);
1134 list_for_each_entry(pg, &m->priority_groups, list) {
1135 pg->bypassed = 0;
1136 if (--pgnum)
1137 continue;
1138
1139 m->current_pgpath = NULL;
1140 m->current_pg = NULL;
1141 m->next_pg = pg;
1142 }
1143 spin_unlock_irqrestore(&m->lock, flags);
1144
Alasdair G Kergonfe9cf302009-01-06 03:05:13 +00001145 schedule_work(&m->trigger_event);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001146 return 0;
1147}
1148
1149/*
1150 * Set/clear bypassed status of a PG.
1151 * PGs are numbered upwards from 1 in the order they were declared.
1152 */
1153static int bypass_pg_num(struct multipath *m, const char *pgstr, int bypassed)
1154{
1155 struct priority_group *pg;
1156 unsigned pgnum;
Mikulas Patocka31998ef2012-03-28 18:41:26 +01001157 char dummy;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001158
Mikulas Patocka31998ef2012-03-28 18:41:26 +01001159 if (!pgstr || (sscanf(pgstr, "%u%c", &pgnum, &dummy) != 1) || !pgnum ||
Linus Torvalds1da177e2005-04-16 15:20:36 -07001160 (pgnum > m->nr_priority_groups)) {
1161 DMWARN("invalid PG number supplied to bypass_pg");
1162 return -EINVAL;
1163 }
1164
1165 list_for_each_entry(pg, &m->priority_groups, list) {
1166 if (!--pgnum)
1167 break;
1168 }
1169
1170 bypass_pg(m, pg, bypassed);
1171 return 0;
1172}
1173
1174/*
Dave Wysochanskic9e45582007-10-19 22:47:53 +01001175 * Should we retry pg_init immediately?
1176 */
1177static int pg_init_limit_reached(struct multipath *m, struct pgpath *pgpath)
1178{
1179 unsigned long flags;
1180 int limit_reached = 0;
1181
1182 spin_lock_irqsave(&m->lock, flags);
1183
Shiva Krishna Merla954a73d2013-10-30 03:26:38 +00001184 if (m->pg_init_count <= m->pg_init_retries && !m->pg_init_disabled)
Dave Wysochanskic9e45582007-10-19 22:47:53 +01001185 m->pg_init_required = 1;
1186 else
1187 limit_reached = 1;
1188
1189 spin_unlock_irqrestore(&m->lock, flags);
1190
1191 return limit_reached;
1192}
1193
Chandra Seetharaman3ae31f62009-10-21 09:22:46 -07001194static void pg_init_done(void *data, int errors)
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001195{
Moger, Babu83c0d5d2010-03-06 02:29:45 +00001196 struct pgpath *pgpath = data;
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001197 struct priority_group *pg = pgpath->pg;
1198 struct multipath *m = pg->m;
1199 unsigned long flags;
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001200 unsigned delay_retry = 0;
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001201
1202 /* device or driver problems */
1203 switch (errors) {
1204 case SCSI_DH_OK:
1205 break;
1206 case SCSI_DH_NOSYS:
1207 if (!m->hw_handler_name) {
1208 errors = 0;
1209 break;
1210 }
Moger, Babuf7b934c2010-03-06 02:29:49 +00001211 DMERR("Could not failover the device: Handler scsi_dh_%s "
1212 "Error %d.", m->hw_handler_name, errors);
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001213 /*
1214 * Fail path for now, so we do not ping pong
1215 */
1216 fail_path(pgpath);
1217 break;
1218 case SCSI_DH_DEV_TEMP_BUSY:
1219 /*
1220 * Probably doing something like FW upgrade on the
1221 * controller so try the other pg.
1222 */
1223 bypass_pg(m, pg, 1);
1224 break;
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001225 case SCSI_DH_RETRY:
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001226 /* Wait before retrying. */
1227 delay_retry = 1;
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001228 case SCSI_DH_IMM_RETRY:
1229 case SCSI_DH_RES_TEMP_UNAVAIL:
1230 if (pg_init_limit_reached(m, pgpath))
1231 fail_path(pgpath);
1232 errors = 0;
1233 break;
1234 default:
1235 /*
1236 * We probably do not want to fail the path for a device
1237 * error, but this is what the old dm did. In future
1238 * patches we can do more advanced handling.
1239 */
1240 fail_path(pgpath);
1241 }
1242
1243 spin_lock_irqsave(&m->lock, flags);
1244 if (errors) {
Chandra Seetharamane54f77d2009-06-22 10:12:12 +01001245 if (pgpath == m->current_pgpath) {
1246 DMERR("Could not failover device. Error %d.", errors);
1247 m->current_pgpath = NULL;
1248 m->current_pg = NULL;
1249 }
Kiyoshi Uedad0259bf2010-03-06 02:30:02 +00001250 } else if (!m->pg_init_required)
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001251 pg->bypassed = 0;
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001252
Kiyoshi Uedad0259bf2010-03-06 02:30:02 +00001253 if (--m->pg_init_in_progress)
1254 /* Activations of other paths are still on going */
1255 goto out;
1256
1257 if (!m->pg_init_required)
1258 m->queue_io = 0;
1259
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001260 m->pg_init_delay_retry = delay_retry;
Kiyoshi Uedad0259bf2010-03-06 02:30:02 +00001261 queue_work(kmultipathd, &m->process_queued_ios);
1262
Kiyoshi Ueda2bded7b2010-03-06 02:32:13 +00001263 /*
1264 * Wake up any thread waiting to suspend.
1265 */
1266 wake_up(&m->pg_init_wait);
1267
Kiyoshi Uedad0259bf2010-03-06 02:30:02 +00001268out:
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001269 spin_unlock_irqrestore(&m->lock, flags);
1270}
1271
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -07001272static void activate_path(struct work_struct *work)
1273{
Chandra Seetharamane54f77d2009-06-22 10:12:12 +01001274 struct pgpath *pgpath =
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001275 container_of(work, struct pgpath, activate_path.work);
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -07001276
Chandra Seetharaman3ae31f62009-10-21 09:22:46 -07001277 scsi_dh_activate(bdev_get_queue(pgpath->path.dev->bdev),
Moger, Babu83c0d5d2010-03-06 02:29:45 +00001278 pg_init_done, pgpath);
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -07001279}
1280
Hannes Reinecke7e782af2013-07-01 15:16:26 +02001281static int noretry_error(int error)
1282{
1283 switch (error) {
1284 case -EOPNOTSUPP:
1285 case -EREMOTEIO:
1286 case -EILSEQ:
1287 case -ENODATA:
Jun'ichi Nomuracc9d3c32013-09-13 14:54:30 +09001288 case -ENOSPC:
Hannes Reinecke7e782af2013-07-01 15:16:26 +02001289 return 1;
1290 }
1291
1292 /* Anything else could be a path failure, so should be retried */
1293 return 0;
1294}
1295
Linus Torvalds1da177e2005-04-16 15:20:36 -07001296/*
1297 * end_io handling
1298 */
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001299static int do_end_io(struct multipath *m, struct request *clone,
Alasdair G Kergon028867a2007-07-12 17:26:32 +01001300 int error, struct dm_mpath_io *mpio)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001301{
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001302 /*
1303 * We don't queue any clone request inside the multipath target
1304 * during end I/O handling, since those clone requests don't have
1305 * bio clones. If we queue them inside the multipath target,
1306 * we need to make bio clones, that requires memory allocation.
1307 * (See drivers/md/dm.c:end_clone_bio() about why the clone requests
1308 * don't have bio clones.)
1309 * Instead of queueing the clone request here, we queue the original
1310 * request into dm core, which will remake a clone request and
1311 * clone bios for it and resubmit it later.
1312 */
1313 int r = DM_ENDIO_REQUEUE;
Stefan Bader640eb3b2005-11-21 21:32:35 -08001314 unsigned long flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001315
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001316 if (!error && !clone->errors)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001317 return 0; /* I/O complete */
1318
Mike Snitzerf84cb8a2013-09-19 12:13:58 -04001319 if (noretry_error(error)) {
1320 if ((clone->cmd_flags & REQ_WRITE_SAME) &&
1321 !clone->q->limits.max_write_same_sectors) {
1322 struct queue_limits *limits;
1323
1324 /* device doesn't really support WRITE SAME, disable it */
1325 limits = dm_get_queue_limits(dm_table_get_md(m->ti->table));
1326 limits->max_write_same_sectors = 0;
1327 }
Mike Snitzer959eb4e2010-08-12 04:14:32 +01001328 return error;
Mike Snitzerf84cb8a2013-09-19 12:13:58 -04001329 }
Mike Snitzer959eb4e2010-08-12 04:14:32 +01001330
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001331 if (mpio->pgpath)
1332 fail_path(mpio->pgpath);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001333
Stefan Bader640eb3b2005-11-21 21:32:35 -08001334 spin_lock_irqsave(&m->lock, flags);
Hannes Reinecke751b2a72011-01-18 10:13:12 +01001335 if (!m->nr_valid_paths) {
1336 if (!m->queue_if_no_path) {
1337 if (!__must_push_back(m))
1338 r = -EIO;
1339 } else {
1340 if (error == -EBADE)
1341 r = error;
1342 }
1343 }
Stefan Bader640eb3b2005-11-21 21:32:35 -08001344 spin_unlock_irqrestore(&m->lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001345
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001346 return r;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001347}
1348
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001349static int multipath_end_io(struct dm_target *ti, struct request *clone,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001350 int error, union map_info *map_context)
1351{
Alasdair G Kergon028867a2007-07-12 17:26:32 +01001352 struct multipath *m = ti->private;
1353 struct dm_mpath_io *mpio = map_context->ptr;
Wei Yongjuna71a2612012-10-12 16:59:42 +01001354 struct pgpath *pgpath;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001355 struct path_selector *ps;
1356 int r;
1357
Jun'ichi Nomura466891f2012-03-28 18:41:25 +01001358 BUG_ON(!mpio);
1359
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001360 r = do_end_io(m, clone, error, mpio);
Wei Yongjuna71a2612012-10-12 16:59:42 +01001361 pgpath = mpio->pgpath;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001362 if (pgpath) {
1363 ps = &pgpath->pg->ps;
1364 if (ps->type->end_io)
Kiyoshi Ueda02ab8232009-06-22 10:12:27 +01001365 ps->type->end_io(ps, &pgpath->path, mpio->nr_bytes);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001366 }
Jun'ichi Nomura466891f2012-03-28 18:41:25 +01001367 clear_mapinfo(m, map_context);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001368
1369 return r;
1370}
1371
1372/*
1373 * Suspend can't complete until all the I/O is processed, so if
Alasdair G Kergon436d4102005-07-12 15:53:03 -07001374 * the last path fails we must error any remaining I/O.
1375 * Note that if freeze_bdev fails while suspending, the
1376 * queue_if_no_path state is lost - userspace should reset it.
Linus Torvalds1da177e2005-04-16 15:20:36 -07001377 */
1378static void multipath_presuspend(struct dm_target *ti)
1379{
1380 struct multipath *m = (struct multipath *) ti->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001381
Alasdair G Kergon485ef692005-09-27 21:45:45 -07001382 queue_if_no_path(m, 0, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001383}
1384
Kiyoshi Ueda6df400a2009-12-10 23:52:19 +00001385static void multipath_postsuspend(struct dm_target *ti)
1386{
Mike Anderson6380f262009-12-10 23:52:21 +00001387 struct multipath *m = ti->private;
1388
1389 mutex_lock(&m->work_mutex);
Kiyoshi Ueda2bded7b2010-03-06 02:32:13 +00001390 flush_multipath_work(m);
Mike Anderson6380f262009-12-10 23:52:21 +00001391 mutex_unlock(&m->work_mutex);
Kiyoshi Ueda6df400a2009-12-10 23:52:19 +00001392}
1393
Alasdair G Kergon436d4102005-07-12 15:53:03 -07001394/*
1395 * Restore the queue_if_no_path setting.
1396 */
Linus Torvalds1da177e2005-04-16 15:20:36 -07001397static void multipath_resume(struct dm_target *ti)
1398{
1399 struct multipath *m = (struct multipath *) ti->private;
1400 unsigned long flags;
1401
1402 spin_lock_irqsave(&m->lock, flags);
Alasdair G Kergon436d4102005-07-12 15:53:03 -07001403 m->queue_if_no_path = m->saved_queue_if_no_path;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001404 spin_unlock_irqrestore(&m->lock, flags);
1405}
1406
1407/*
1408 * Info output has the following format:
1409 * num_multipath_feature_args [multipath_feature_args]*
1410 * num_handler_status_args [handler_status_args]*
1411 * num_groups init_group_number
1412 * [A|D|E num_ps_status_args [ps_status_args]*
1413 * num_paths num_selector_args
1414 * [path_dev A|F fail_count [selector_args]* ]+ ]+
1415 *
1416 * Table output has the following format (identical to the constructor string):
1417 * num_feature_args [features_args]*
1418 * num_handler_args hw_handler [hw_handler_args]*
1419 * num_groups init_group_number
1420 * [priority selector-name num_ps_args [ps_args]*
1421 * num_paths num_selector_args [path_dev [selector_args]* ]+ ]+
1422 */
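
/*
 * For illustration, a table line for a single round-robin group with
 * two paths, no features and no hardware handler could look like this
 * (device numbers and repeat counts are hypothetical):
 *
 *     0 0 1 1 round-robin 0 2 1 8:16 1 8:32 1
 */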
Mikulas Patockafd7c0922013-03-01 22:45:44 +00001423static void multipath_status(struct dm_target *ti, status_type_t type,
1424 unsigned status_flags, char *result, unsigned maxlen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001425{
1426 int sz = 0;
1427 unsigned long flags;
1428 struct multipath *m = (struct multipath *) ti->private;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001429 struct priority_group *pg;
1430 struct pgpath *p;
1431 unsigned pg_num;
1432 char state;
1433
1434 spin_lock_irqsave(&m->lock, flags);
1435
1436 /* Features */
1437 if (type == STATUSTYPE_INFO)
Dave Wysochanskic9e45582007-10-19 22:47:53 +01001438 DMEMIT("2 %u %u ", m->queue_size, m->pg_init_count);
1439 else {
1440 DMEMIT("%u ", m->queue_if_no_path +
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001441 (m->pg_init_retries > 0) * 2 +
Mike Snitzera58a9352012-07-27 15:08:04 +01001442 (m->pg_init_delay_msecs != DM_PG_INIT_DELAY_DEFAULT) * 2 +
1443 m->retain_attached_hw_handler);
Dave Wysochanskic9e45582007-10-19 22:47:53 +01001444 if (m->queue_if_no_path)
1445 DMEMIT("queue_if_no_path ");
1446 if (m->pg_init_retries)
1447 DMEMIT("pg_init_retries %u ", m->pg_init_retries);
Chandra Seetharaman4e2d19e2011-01-13 20:00:01 +00001448 if (m->pg_init_delay_msecs != DM_PG_INIT_DELAY_DEFAULT)
1449 DMEMIT("pg_init_delay_msecs %u ", m->pg_init_delay_msecs);
Mike Snitzera58a9352012-07-27 15:08:04 +01001450 if (m->retain_attached_hw_handler)
1451 DMEMIT("retain_attached_hw_handler ");
Dave Wysochanskic9e45582007-10-19 22:47:53 +01001452 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001453
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001454 if (!m->hw_handler_name || type == STATUSTYPE_INFO)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001455 DMEMIT("0 ");
1456 else
Chandra Seetharamancfae5c92008-05-01 14:50:11 -07001457 DMEMIT("1 %s ", m->hw_handler_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001458
1459 DMEMIT("%u ", m->nr_priority_groups);
1460
1461 if (m->next_pg)
1462 pg_num = m->next_pg->pg_num;
1463 else if (m->current_pg)
1464 pg_num = m->current_pg->pg_num;
1465 else
Mike Snitzera490a072011-03-24 13:54:33 +00001466 pg_num = (m->nr_priority_groups ? 1 : 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001467
1468 DMEMIT("%u ", pg_num);
1469
1470 switch (type) {
1471 case STATUSTYPE_INFO:
1472 list_for_each_entry(pg, &m->priority_groups, list) {
1473 if (pg->bypassed)
1474 state = 'D'; /* Disabled */
1475 else if (pg == m->current_pg)
1476 state = 'A'; /* Currently Active */
1477 else
1478 state = 'E'; /* Enabled */
1479
1480 DMEMIT("%c ", state);
1481
1482 if (pg->ps.type->status)
1483 sz += pg->ps.type->status(&pg->ps, NULL, type,
1484 result + sz,
1485 maxlen - sz);
1486 else
1487 DMEMIT("0 ");
1488
1489 DMEMIT("%u %u ", pg->nr_pgpaths,
1490 pg->ps.type->info_args);
1491
1492 list_for_each_entry(p, &pg->pgpaths, list) {
1493 DMEMIT("%s %s %u ", p->path.dev->name,
Kiyoshi Ueda66800732008-10-10 13:36:58 +01001494 p->is_active ? "A" : "F",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001495 p->fail_count);
1496 if (pg->ps.type->status)
1497 sz += pg->ps.type->status(&pg->ps,
1498 &p->path, type, result + sz,
1499 maxlen - sz);
1500 }
1501 }
1502 break;
1503
1504 case STATUSTYPE_TABLE:
1505 list_for_each_entry(pg, &m->priority_groups, list) {
1506 DMEMIT("%s ", pg->ps.type->name);
1507
1508 if (pg->ps.type->status)
1509 sz += pg->ps.type->status(&pg->ps, NULL, type,
1510 result + sz,
1511 maxlen - sz);
1512 else
1513 DMEMIT("0 ");
1514
1515 DMEMIT("%u %u ", pg->nr_pgpaths,
1516 pg->ps.type->table_args);
1517
1518 list_for_each_entry(p, &pg->pgpaths, list) {
1519 DMEMIT("%s ", p->path.dev->name);
1520 if (pg->ps.type->status)
1521 sz += pg->ps.type->status(&pg->ps,
1522 &p->path, type, result + sz,
1523 maxlen - sz);
1524 }
1525 }
1526 break;
1527 }
1528
1529 spin_unlock_irqrestore(&m->lock, flags);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001530}
1531
1532static int multipath_message(struct dm_target *ti, unsigned argc, char **argv)
1533{
Mike Anderson6380f262009-12-10 23:52:21 +00001534 int r = -EINVAL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001535 struct dm_dev *dev;
1536 struct multipath *m = (struct multipath *) ti->private;
1537 action_fn action;
1538
Mike Anderson6380f262009-12-10 23:52:21 +00001539 mutex_lock(&m->work_mutex);
1540
Kiyoshi Uedac2f3d242009-12-10 23:52:27 +00001541 if (dm_suspended(ti)) {
1542 r = -EBUSY;
1543 goto out;
1544 }
1545
Linus Torvalds1da177e2005-04-16 15:20:36 -07001546 if (argc == 1) {
Mike Snitzer498f0102011-08-02 12:32:04 +01001547 if (!strcasecmp(argv[0], "queue_if_no_path")) {
Mike Anderson6380f262009-12-10 23:52:21 +00001548 r = queue_if_no_path(m, 1, 0);
1549 goto out;
Mike Snitzer498f0102011-08-02 12:32:04 +01001550 } else if (!strcasecmp(argv[0], "fail_if_no_path")) {
Mike Anderson6380f262009-12-10 23:52:21 +00001551 r = queue_if_no_path(m, 0, 0);
1552 goto out;
1553 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001554 }
1555
Mike Anderson6380f262009-12-10 23:52:21 +00001556 if (argc != 2) {
1557 DMWARN("Unrecognised multipath message received.");
1558 goto out;
1559 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001560
Mike Snitzer498f0102011-08-02 12:32:04 +01001561 if (!strcasecmp(argv[0], "disable_group")) {
Mike Anderson6380f262009-12-10 23:52:21 +00001562 r = bypass_pg_num(m, argv[1], 1);
1563 goto out;
Mike Snitzer498f0102011-08-02 12:32:04 +01001564 } else if (!strcasecmp(argv[0], "enable_group")) {
Mike Anderson6380f262009-12-10 23:52:21 +00001565 r = bypass_pg_num(m, argv[1], 0);
1566 goto out;
Mike Snitzer498f0102011-08-02 12:32:04 +01001567 } else if (!strcasecmp(argv[0], "switch_group")) {
Mike Anderson6380f262009-12-10 23:52:21 +00001568 r = switch_pg_num(m, argv[1]);
1569 goto out;
Mike Snitzer498f0102011-08-02 12:32:04 +01001570 } else if (!strcasecmp(argv[0], "reinstate_path"))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001571 action = reinstate_path;
Mike Snitzer498f0102011-08-02 12:32:04 +01001572 else if (!strcasecmp(argv[0], "fail_path"))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001573 action = fail_path;
Mike Anderson6380f262009-12-10 23:52:21 +00001574 else {
1575 DMWARN("Unrecognised multipath message received.");
1576 goto out;
1577 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001578
Nikanth Karthikesan8215d6e2010-03-06 02:32:27 +00001579 r = dm_get_device(ti, argv[1], dm_table_get_mode(ti->table), &dev);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001580 if (r) {
Alasdair G Kergon72d94862006-06-26 00:27:35 -07001581 DMWARN("message: error getting device %s",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001582 argv[1]);
Mike Anderson6380f262009-12-10 23:52:21 +00001583 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001584 }
1585
1586 r = action_dev(m, dev, action);
1587
1588 dm_put_device(ti, dev);
1589
Mike Anderson6380f262009-12-10 23:52:21 +00001590out:
1591 mutex_unlock(&m->work_mutex);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001592 return r;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001593}
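
/*
 * These messages are normally delivered with dmsetup, e.g. (device
 * and path names below are only illustrative):
 *
 *     dmsetup message mpath0 0 fail_path 8:32
 *     dmsetup message mpath0 0 reinstate_path 8:32
 *     dmsetup message mpath0 0 queue_if_no_path
 */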
1594
Al Viro647b3d02007-08-28 22:15:59 -04001595static int multipath_ioctl(struct dm_target *ti, unsigned int cmd,
Milan Broz9af4aa32006-10-03 01:15:20 -07001596 unsigned long arg)
1597{
Mikulas Patocka35991652012-06-03 00:29:58 +01001598 struct multipath *m = ti->private;
Mike Snitzer7ba10aa2012-09-26 23:45:41 +01001599 struct pgpath *pgpath;
Mikulas Patocka35991652012-06-03 00:29:58 +01001600 struct block_device *bdev;
1601 fmode_t mode;
Milan Broz9af4aa32006-10-03 01:15:20 -07001602 unsigned long flags;
Mikulas Patocka35991652012-06-03 00:29:58 +01001603 int r;
1604
Mikulas Patocka35991652012-06-03 00:29:58 +01001605 bdev = NULL;
1606 mode = 0;
1607 r = 0;
Milan Broz9af4aa32006-10-03 01:15:20 -07001608
1609 spin_lock_irqsave(&m->lock, flags);
1610
1611 if (!m->current_pgpath)
Kiyoshi Ueda02ab8232009-06-22 10:12:27 +01001612 __choose_pgpath(m, 0);
Milan Broz9af4aa32006-10-03 01:15:20 -07001613
Mike Snitzer7ba10aa2012-09-26 23:45:41 +01001614 pgpath = m->current_pgpath;
1615
1616 if (pgpath) {
1617 bdev = pgpath->path.dev->bdev;
1618 mode = pgpath->path.dev->mode;
Milan Broze90dae12006-10-03 01:15:22 -07001619 }
Milan Broz9af4aa32006-10-03 01:15:20 -07001620
Mike Snitzer7ba10aa2012-09-26 23:45:41 +01001621 if ((pgpath && m->queue_io) || (!pgpath && m->queue_if_no_path))
Hannes Reinecke6c182cd2013-07-10 23:41:15 +01001622 r = -ENOTCONN;
Milan Broz9af4aa32006-10-03 01:15:20 -07001623 else if (!bdev)
1624 r = -EIO;
1625
1626 spin_unlock_irqrestore(&m->lock, flags);
1627
Paolo Bonziniec8013b2012-01-12 16:01:29 +01001628	/*
1629	 * Only pass ioctls through unchecked if the device sizes match
1630	 * exactly; otherwise require them to pass scsi_verify_blk_ioctl().
1631	 */
Hannes Reineckea1989b32014-02-26 10:07:04 +01001631 if (!bdev || ti->len != i_size_read(bdev->bd_inode) >> SECTOR_SHIFT) {
1632 int err = scsi_verify_blk_ioctl(NULL, cmd);
1633 if (err)
1634 r = err;
1635 }
Paolo Bonziniec8013b2012-01-12 16:01:29 +01001636
Hannes Reinecke6c182cd2013-07-10 23:41:15 +01001637 if (r == -ENOTCONN && !fatal_signal_pending(current))
Mikulas Patocka35991652012-06-03 00:29:58 +01001638 queue_work(kmultipathd, &m->process_queued_ios);
Mikulas Patocka35991652012-06-03 00:29:58 +01001639
Al Viro633a08b2007-08-29 20:34:12 -04001640 return r ? : __blkdev_driver_ioctl(bdev, mode, cmd, arg);
Milan Broz9af4aa32006-10-03 01:15:20 -07001641}
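
/*
 * A note on the -ENOTCONN case above: it means no usable path was
 * available yet (pg initialization still in flight, or no valid paths
 * while queue_if_no_path is set). Kicking process_queued_ios lets path
 * initialization make progress, and dm core retries the ioctl unless
 * a fatal signal is pending.
 */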
1642
Mike Snitzeraf4874e2009-06-22 10:12:33 +01001643static int multipath_iterate_devices(struct dm_target *ti,
1644 iterate_devices_callout_fn fn, void *data)
1645{
1646 struct multipath *m = ti->private;
1647 struct priority_group *pg;
1648 struct pgpath *p;
1649 int ret = 0;
1650
1651 list_for_each_entry(pg, &m->priority_groups, list) {
1652 list_for_each_entry(p, &pg->pgpaths, list) {
Mike Snitzer5dea2712009-07-23 20:30:42 +01001653 ret = fn(ti, p->path.dev, ti->begin, ti->len, data);
Mike Snitzeraf4874e2009-06-22 10:12:33 +01001654 if (ret)
1655 goto out;
1656 }
1657 }
1658
1659out:
1660 return ret;
1661}
1662
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001663static int __pgpath_busy(struct pgpath *pgpath)
1664{
1665 struct request_queue *q = bdev_get_queue(pgpath->path.dev->bdev);
1666
1667 return dm_underlying_device_busy(q);
1668}
1669
1670/*
1671 * We return "busy" only when we can map I/Os but the underlying
1672 * devices are busy (so even if we mapped the I/Os now, they would
1673 * just wait on the underlying queue).
1674 * In other words, if we want to kill I/Os or queue them inside the
1675 * target because no map is available, we must not return "busy";
1676 * otherwise dm core won't give us the I/Os and we can't do what we want.
1677 */
1678static int multipath_busy(struct dm_target *ti)
1679{
1680 int busy = 0, has_active = 0;
1681 struct multipath *m = ti->private;
1682 struct priority_group *pg;
1683 struct pgpath *pgpath;
1684 unsigned long flags;
1685
1686 spin_lock_irqsave(&m->lock, flags);
1687
Hannes Reineckeb63349a2013-10-01 11:49:56 +02001688 /* pg_init in progress, requeue until done */
1689 if (m->pg_init_in_progress) {
1690 busy = 1;
1691 goto out;
1692 }
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001693 /* Guess which priority_group will be used at next mapping time */
1694 if (unlikely(!m->current_pgpath && m->next_pg))
1695 pg = m->next_pg;
1696 else if (likely(m->current_pg))
1697 pg = m->current_pg;
1698 else
1699		/*
1700		 * We don't know which pg will be used at the next mapping time.
1701		 * We don't call __choose_pgpath() here to avoid triggering
1702		 * pg_init just by checking for busyness.
1703		 * So we can't tell whether the underlying devices we will be
1704		 * using at the next mapping time are busy; just try mapping.
1705		 */
1706 goto out;
1707
1708	/*
1709	 * If there is at least one non-busy active path, the path selector
1710	 * will be able to select it, so we consider such a pg as not busy.
1711	 */
1712 busy = 1;
1713 list_for_each_entry(pgpath, &pg->pgpaths, list)
1714 if (pgpath->is_active) {
1715 has_active = 1;
1716
1717 if (!__pgpath_busy(pgpath)) {
1718 busy = 0;
1719 break;
1720 }
1721 }
1722
1723 if (!has_active)
1724		/*
1725		 * No active path in this pg, so this pg won't be used and
1726		 * current_pg will be changed at the next mapping time.
1727		 * We need to try mapping to determine which pg will be used.
1728		 */
1729 busy = 0;
1730
1731out:
1732 spin_unlock_irqrestore(&m->lock, flags);
1733
1734 return busy;
1735}
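
/*
 * When multipath_busy() returns non-zero, dm core leaves the request
 * on its own queue and retries the dispatch later rather than pushing
 * it to a priority group whose underlying queues are congested.
 */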
1736
Linus Torvalds1da177e2005-04-16 15:20:36 -07001737/*-----------------------------------------------------------------
1738 * Module setup
1739 *---------------------------------------------------------------*/
1740static struct target_type multipath_target = {
1741 .name = "multipath",
Shiva Krishna Merla954a73d2013-10-30 03:26:38 +00001742 .version = {1, 6, 0},
Linus Torvalds1da177e2005-04-16 15:20:36 -07001743 .module = THIS_MODULE,
1744 .ctr = multipath_ctr,
1745 .dtr = multipath_dtr,
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001746 .map_rq = multipath_map,
1747 .rq_end_io = multipath_end_io,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001748 .presuspend = multipath_presuspend,
Kiyoshi Ueda6df400a2009-12-10 23:52:19 +00001749 .postsuspend = multipath_postsuspend,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001750 .resume = multipath_resume,
1751 .status = multipath_status,
1752 .message = multipath_message,
Milan Broz9af4aa32006-10-03 01:15:20 -07001753 .ioctl = multipath_ioctl,
Mike Snitzeraf4874e2009-06-22 10:12:33 +01001754 .iterate_devices = multipath_iterate_devices,
Kiyoshi Uedaf40c67f2009-06-22 10:12:37 +01001755 .busy = multipath_busy,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001756};
1757
1758static int __init dm_multipath_init(void)
1759{
1760 int r;
1761
1762	/* allocate a slab for the dm_mpath_io structs */
Alasdair G Kergon028867a2007-07-12 17:26:32 +01001763 _mpio_cache = KMEM_CACHE(dm_mpath_io, 0);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001764 if (!_mpio_cache)
1765 return -ENOMEM;
1766
1767 r = dm_register_target(&multipath_target);
1768 if (r < 0) {
Alasdair G Kergon0cd33122007-07-12 17:27:01 +01001769 DMERR("register failed %d", r);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001770 kmem_cache_destroy(_mpio_cache);
1771 return -EINVAL;
1772 }
1773
Tejun Heo4d4d66a2011-01-13 19:59:57 +00001774 kmultipathd = alloc_workqueue("kmpathd", WQ_MEM_RECLAIM, 0);
Alasdair G Kergonc5573082005-05-05 16:16:07 -07001775 if (!kmultipathd) {
Alasdair G Kergon0cd33122007-07-12 17:27:01 +01001776 DMERR("failed to create workqueue kmpathd");
Alasdair G Kergonc5573082005-05-05 16:16:07 -07001777 dm_unregister_target(&multipath_target);
1778 kmem_cache_destroy(_mpio_cache);
1779 return -ENOMEM;
1780 }
1781
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -07001782	/*
1783	 * A separate workqueue is used to handle the device handlers,
1784	 * to avoid overloading the existing workqueue. Overloading the
1785	 * old workqueue would also create a bottleneck in the
1786	 * activation path of the storage hardware devices.
1787	 */
Tejun Heo4d4d66a2011-01-13 19:59:57 +00001788 kmpath_handlerd = alloc_ordered_workqueue("kmpath_handlerd",
1789 WQ_MEM_RECLAIM);
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -07001790 if (!kmpath_handlerd) {
1791 DMERR("failed to create workqueue kmpath_handlerd");
1792 destroy_workqueue(kmultipathd);
1793 dm_unregister_target(&multipath_target);
1794 kmem_cache_destroy(_mpio_cache);
1795 return -ENOMEM;
1796 }
1797
Alasdair G Kergon72d94862006-06-26 00:27:35 -07001798 DMINFO("version %u.%u.%u loaded",
Linus Torvalds1da177e2005-04-16 15:20:36 -07001799 multipath_target.version[0], multipath_target.version[1],
1800 multipath_target.version[2]);
1801
1802 return r;
1803}
1804
1805static void __exit dm_multipath_exit(void)
1806{
Chandra Seetharamanbab7cfc2008-05-01 14:50:22 -07001807 destroy_workqueue(kmpath_handlerd);
Alasdair G Kergonc5573082005-05-05 16:16:07 -07001808 destroy_workqueue(kmultipathd);
1809
Mikulas Patocka10d3bd02009-01-06 03:04:58 +00001810 dm_unregister_target(&multipath_target);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001811 kmem_cache_destroy(_mpio_cache);
1812}
1813
Linus Torvalds1da177e2005-04-16 15:20:36 -07001814module_init(dm_multipath_init);
1815module_exit(dm_multipath_exit);
1816
1817MODULE_DESCRIPTION(DM_NAME " multipath target");
1818MODULE_AUTHOR("Sistina Software <dm-devel@redhat.com>");
1819MODULE_LICENSE("GPL");