blob: 693187df76012e1ace1f3c9b58fd4e78d6ec3aab [file] [log] [blame]
Rusty Russelle467cde2007-10-22 11:03:38 +10001//#define DEBUG
#include <linux/spinlock.h>
#include <linux/slab.h>
#include <linux/blkdev.h>
#include <linux/hdreg.h>
#include <linux/module.h>
#include <linux/mutex.h>
#include <linux/virtio.h>
#include <linux/virtio_blk.h>
#include <linux/scatterlist.h>
#include <linux/string_helpers.h>
#include <linux/math64.h>
#include <linux/idr.h>
#include <scsi/scsi_cmnd.h>
Jens Axboe3d1266c2007-10-24 13:21:21 +020014
/* Shift used to convert between a disk index and its first minor number. */
#define PART_BITS 4

/* Block major number, assigned by register_blkdev() at module init. */
static int major;

/* Allocator for per-disk indexes (see virtblk_probe/virtblk_remove). */
static DEFINE_IDA(vd_index_ida);

/* Workqueue on which config-change work items are queued. */
struct workqueue_struct *virtblk_wq;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +010021
Rusty Russelle467cde2007-10-22 11:03:38 +100022struct virtio_blk
23{
24 spinlock_t lock;
25
26 struct virtio_device *vdev;
27 struct virtqueue *vq;
28
29 /* The disk structure for the kernel. */
30 struct gendisk *disk;
31
Rusty Russelle467cde2007-10-22 11:03:38 +100032 mempool_t *pool;
33
Christoph Hellwig7a7c9242011-02-01 21:43:48 +010034 /* Process context for config space updates */
35 struct work_struct config_work;
36
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +103037 /* Lock for config space updates */
38 struct mutex config_lock;
39
40 /* enable config space updates */
41 bool config_enable;
42
Rusty Russell0864b792008-12-30 09:26:05 -060043 /* What host tells us, plus 2 for header & tailer. */
44 unsigned int sg_elems;
45
Michael S. Tsirkin5087a502011-10-30 21:29:59 +020046 /* Ida index - used to track minor number allocations. */
47 int index;
48
Rusty Russelle467cde2007-10-22 11:03:38 +100049 /* Scatterlist: can be too big for stack. */
Rusty Russell0864b792008-12-30 09:26:05 -060050 struct scatterlist sg[/*sg_elems*/];
Rusty Russelle467cde2007-10-22 11:03:38 +100051};
52
53struct virtblk_req
54{
Rusty Russelle467cde2007-10-22 11:03:38 +100055 struct request *req;
56 struct virtio_blk_outhdr out_hdr;
Hannes Reinecke1cde26f2009-05-18 14:41:30 +020057 struct virtio_scsi_inhdr in_hdr;
Rusty Russellcb38fa22008-05-02 21:50:45 -050058 u8 status;
Rusty Russelle467cde2007-10-22 11:03:38 +100059};
60
Rusty Russell18445c42008-02-04 23:49:57 -050061static void blk_done(struct virtqueue *vq)
Rusty Russelle467cde2007-10-22 11:03:38 +100062{
63 struct virtio_blk *vblk = vq->vdev->priv;
64 struct virtblk_req *vbr;
65 unsigned int len;
66 unsigned long flags;
67
68 spin_lock_irqsave(&vblk->lock, flags);
Michael S. Tsirkin09ec6b62010-04-12 16:18:36 +030069 while ((vbr = virtqueue_get_buf(vblk->vq, &len)) != NULL) {
Kiyoshi Ueda83169822008-10-01 10:11:20 -040070 int error;
Hannes Reinecke1cde26f2009-05-18 14:41:30 +020071
Rusty Russellcb38fa22008-05-02 21:50:45 -050072 switch (vbr->status) {
Rusty Russelle467cde2007-10-22 11:03:38 +100073 case VIRTIO_BLK_S_OK:
Kiyoshi Ueda83169822008-10-01 10:11:20 -040074 error = 0;
Rusty Russelle467cde2007-10-22 11:03:38 +100075 break;
76 case VIRTIO_BLK_S_UNSUPP:
Kiyoshi Ueda83169822008-10-01 10:11:20 -040077 error = -ENOTTY;
Rusty Russelle467cde2007-10-22 11:03:38 +100078 break;
79 default:
Kiyoshi Ueda83169822008-10-01 10:11:20 -040080 error = -EIO;
Rusty Russelle467cde2007-10-22 11:03:38 +100081 break;
82 }
83
Christoph Hellwig33659eb2010-08-07 18:17:56 +020084 switch (vbr->req->cmd_type) {
85 case REQ_TYPE_BLOCK_PC:
Hannes Reinecke1cde26f2009-05-18 14:41:30 +020086 vbr->req->resid_len = vbr->in_hdr.residual;
87 vbr->req->sense_len = vbr->in_hdr.sense_len;
88 vbr->req->errors = vbr->in_hdr.errors;
Christoph Hellwig33659eb2010-08-07 18:17:56 +020089 break;
90 case REQ_TYPE_SPECIAL:
john cooper4cb2ea22010-03-25 01:33:33 -040091 vbr->req->errors = (error != 0);
Christoph Hellwig33659eb2010-08-07 18:17:56 +020092 break;
Jens Axboe15fa6e82010-06-18 12:10:18 +020093 default:
94 break;
Christoph Hellwig33659eb2010-08-07 18:17:56 +020095 }
Hannes Reinecke1cde26f2009-05-18 14:41:30 +020096
Tejun Heo40cbbb72009-04-23 11:05:19 +090097 __blk_end_request_all(vbr->req, error);
Rusty Russelle467cde2007-10-22 11:03:38 +100098 mempool_free(vbr, vblk->pool);
99 }
100 /* In case queue is stopped waiting for more buffers. */
101 blk_start_queue(vblk->disk->queue);
102 spin_unlock_irqrestore(&vblk->lock, flags);
Rusty Russelle467cde2007-10-22 11:03:38 +1000103}
104
105static bool do_req(struct request_queue *q, struct virtio_blk *vblk,
106 struct request *req)
107{
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200108 unsigned long num, out = 0, in = 0;
Rusty Russelle467cde2007-10-22 11:03:38 +1000109 struct virtblk_req *vbr;
110
111 vbr = mempool_alloc(vblk->pool, GFP_ATOMIC);
112 if (!vbr)
113 /* When another request finishes we'll try again. */
114 return false;
115
116 vbr->req = req;
FUJITA Tomonoridd40e452010-07-03 17:45:38 +0900117
118 if (req->cmd_flags & REQ_FLUSH) {
119 vbr->out_hdr.type = VIRTIO_BLK_T_FLUSH;
Rusty Russelle467cde2007-10-22 11:03:38 +1000120 vbr->out_hdr.sector = 0;
Fernando Luis Vázquez Cao766ca442008-08-14 09:59:13 +0200121 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
FUJITA Tomonoridd40e452010-07-03 17:45:38 +0900122 } else {
123 switch (req->cmd_type) {
124 case REQ_TYPE_FS:
125 vbr->out_hdr.type = 0;
126 vbr->out_hdr.sector = blk_rq_pos(vbr->req);
127 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
128 break;
129 case REQ_TYPE_BLOCK_PC:
130 vbr->out_hdr.type = VIRTIO_BLK_T_SCSI_CMD;
Christoph Hellwigf1b0ef062009-09-17 19:57:42 +0200131 vbr->out_hdr.sector = 0;
132 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
133 break;
FUJITA Tomonoridd40e452010-07-03 17:45:38 +0900134 case REQ_TYPE_SPECIAL:
135 vbr->out_hdr.type = VIRTIO_BLK_T_GET_ID;
136 vbr->out_hdr.sector = 0;
137 vbr->out_hdr.ioprio = req_get_ioprio(vbr->req);
138 break;
139 default:
140 /* We don't put anything else in the queue. */
141 BUG();
Christoph Hellwigf1b0ef062009-09-17 19:57:42 +0200142 }
Rusty Russelle467cde2007-10-22 11:03:38 +1000143 }
144
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200145 sg_set_buf(&vblk->sg[out++], &vbr->out_hdr, sizeof(vbr->out_hdr));
Rusty Russelle467cde2007-10-22 11:03:38 +1000146
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200147 /*
148 * If this is a packet command we need a couple of additional headers.
149 * Behind the normal outhdr we put a segment with the scsi command
150 * block, and before the normal inhdr we put the sense data and the
151 * inhdr with additional status information before the normal inhdr.
152 */
Christoph Hellwig33659eb2010-08-07 18:17:56 +0200153 if (vbr->req->cmd_type == REQ_TYPE_BLOCK_PC)
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200154 sg_set_buf(&vblk->sg[out++], vbr->req->cmd, vbr->req->cmd_len);
155
156 num = blk_rq_map_sg(q, vbr->req, vblk->sg + out);
157
Christoph Hellwig33659eb2010-08-07 18:17:56 +0200158 if (vbr->req->cmd_type == REQ_TYPE_BLOCK_PC) {
Liu Yuan6917f832011-04-24 02:49:26 +0800159 sg_set_buf(&vblk->sg[num + out + in++], vbr->req->sense, SCSI_SENSE_BUFFERSIZE);
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200160 sg_set_buf(&vblk->sg[num + out + in++], &vbr->in_hdr,
161 sizeof(vbr->in_hdr));
162 }
163
164 sg_set_buf(&vblk->sg[num + out + in++], &vbr->status,
165 sizeof(vbr->status));
166
167 if (num) {
168 if (rq_data_dir(vbr->req) == WRITE) {
169 vbr->out_hdr.type |= VIRTIO_BLK_T_OUT;
170 out += num;
171 } else {
172 vbr->out_hdr.type |= VIRTIO_BLK_T_IN;
173 in += num;
174 }
Rusty Russelle467cde2007-10-22 11:03:38 +1000175 }
176
Rusty Russellf96fde42012-01-12 15:44:42 +1030177 if (virtqueue_add_buf(vblk->vq, vblk->sg, out, in, vbr, GFP_ATOMIC)<0) {
Rusty Russelle467cde2007-10-22 11:03:38 +1000178 mempool_free(vbr, vblk->pool);
179 return false;
180 }
181
Rusty Russelle467cde2007-10-22 11:03:38 +1000182 return true;
183}
184
185static void do_virtblk_request(struct request_queue *q)
186{
Christoph Hellwig6c3b46f2009-05-18 14:38:28 +0200187 struct virtio_blk *vblk = q->queuedata;
Rusty Russelle467cde2007-10-22 11:03:38 +1000188 struct request *req;
189 unsigned int issued = 0;
190
Tejun Heo9934c8c2009-05-08 11:54:16 +0900191 while ((req = blk_peek_request(q)) != NULL) {
Rusty Russell0864b792008-12-30 09:26:05 -0600192 BUG_ON(req->nr_phys_segments + 2 > vblk->sg_elems);
Rusty Russelle467cde2007-10-22 11:03:38 +1000193
194 /* If this request fails, stop queue and wait for something to
195 finish to restart it. */
196 if (!do_req(q, vblk, req)) {
197 blk_stop_queue(q);
198 break;
199 }
Tejun Heo9934c8c2009-05-08 11:54:16 +0900200 blk_start_request(req);
Rusty Russelle467cde2007-10-22 11:03:38 +1000201 issued++;
202 }
203
204 if (issued)
Michael S. Tsirkin09ec6b62010-04-12 16:18:36 +0300205 virtqueue_kick(vblk->vq);
Rusty Russelle467cde2007-10-22 11:03:38 +1000206}
207
john cooper4cb2ea22010-03-25 01:33:33 -0400208/* return id (s/n) string for *disk to *id_str
209 */
210static int virtblk_get_id(struct gendisk *disk, char *id_str)
211{
212 struct virtio_blk *vblk = disk->private_data;
213 struct request *req;
214 struct bio *bio;
Mike Snitzere4c47762010-10-09 12:12:13 +1030215 int err;
john cooper4cb2ea22010-03-25 01:33:33 -0400216
217 bio = bio_map_kern(vblk->disk->queue, id_str, VIRTIO_BLK_ID_BYTES,
218 GFP_KERNEL);
219 if (IS_ERR(bio))
220 return PTR_ERR(bio);
221
222 req = blk_make_request(vblk->disk->queue, bio, GFP_KERNEL);
223 if (IS_ERR(req)) {
224 bio_put(bio);
225 return PTR_ERR(req);
226 }
227
228 req->cmd_type = REQ_TYPE_SPECIAL;
Mike Snitzere4c47762010-10-09 12:12:13 +1030229 err = blk_execute_rq(vblk->disk->queue, vblk->disk, req, false);
230 blk_put_request(req);
231
232 return err;
john cooper4cb2ea22010-03-25 01:33:33 -0400233}
234
Christoph Hellwigfe5a50a2010-09-15 01:27:23 +0200235static int virtblk_ioctl(struct block_device *bdev, fmode_t mode,
236 unsigned int cmd, unsigned long data)
Rusty Russelle467cde2007-10-22 11:03:38 +1000237{
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200238 struct gendisk *disk = bdev->bd_disk;
239 struct virtio_blk *vblk = disk->private_data;
240
241 /*
242 * Only allow the generic SCSI ioctls if the host can support it.
243 */
244 if (!virtio_has_feature(vblk->vdev, VIRTIO_BLK_F_SCSI))
Christoph Hellwigd9ecdea2009-06-20 21:29:41 +0200245 return -ENOTTY;
Hannes Reinecke1cde26f2009-05-18 14:41:30 +0200246
Paolo Bonzini577ebb32012-01-12 16:01:27 +0100247 return scsi_cmd_blk_ioctl(bdev, mode, cmd,
248 (void __user *)data);
Rusty Russelle467cde2007-10-22 11:03:38 +1000249}
250
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100251/* We provide getgeo only to please some old bootloader/partitioning tools */
252static int virtblk_getgeo(struct block_device *bd, struct hd_geometry *geo)
253{
Ryan Harper48e40432008-04-16 13:56:37 -0500254 struct virtio_blk *vblk = bd->bd_disk->private_data;
255 struct virtio_blk_geometry vgeo;
256 int err;
257
258 /* see if the host passed in geometry config */
259 err = virtio_config_val(vblk->vdev, VIRTIO_BLK_F_GEOMETRY,
260 offsetof(struct virtio_blk_config, geometry),
261 &vgeo);
262
263 if (!err) {
264 geo->heads = vgeo.heads;
265 geo->sectors = vgeo.sectors;
266 geo->cylinders = vgeo.cylinders;
267 } else {
268 /* some standard values, similar to sd */
269 geo->heads = 1 << 6;
270 geo->sectors = 1 << 5;
271 geo->cylinders = get_capacity(bd->bd_disk) >> 11;
272 }
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100273 return 0;
274}
275
Alexey Dobriyan83d5cde2009-09-21 17:01:13 -0700276static const struct block_device_operations virtblk_fops = {
Arnd Bergmann8a6cfeb2010-07-08 10:18:46 +0200277 .ioctl = virtblk_ioctl,
Christian Borntraeger135da0b2008-01-23 17:56:50 +0100278 .owner = THIS_MODULE,
279 .getgeo = virtblk_getgeo,
Rusty Russelle467cde2007-10-22 11:03:38 +1000280};
281
Christian Borntraegerd50ed902008-02-01 09:05:00 +0100282static int index_to_minor(int index)
283{
284 return index << PART_BITS;
285}
286
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200287static int minor_to_index(int minor)
288{
289 return minor >> PART_BITS;
290}
291
Ryan Harpera5eb9e42010-06-23 22:19:57 -0500292static ssize_t virtblk_serial_show(struct device *dev,
293 struct device_attribute *attr, char *buf)
294{
295 struct gendisk *disk = dev_to_disk(dev);
296 int err;
297
298 /* sysfs gives us a PAGE_SIZE buffer */
299 BUILD_BUG_ON(PAGE_SIZE < VIRTIO_BLK_ID_BYTES);
300
301 buf[VIRTIO_BLK_ID_BYTES] = '\0';
302 err = virtblk_get_id(disk, buf);
303 if (!err)
304 return strlen(buf);
305
306 if (err == -EIO) /* Unsupported? Make it empty. */
307 return 0;
308
309 return err;
310}
311DEVICE_ATTR(serial, S_IRUGO, virtblk_serial_show, NULL);
312
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100313static void virtblk_config_changed_work(struct work_struct *work)
314{
315 struct virtio_blk *vblk =
316 container_of(work, struct virtio_blk, config_work);
317 struct virtio_device *vdev = vblk->vdev;
318 struct request_queue *q = vblk->disk->queue;
319 char cap_str_2[10], cap_str_10[10];
320 u64 capacity, size;
321
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +1030322 mutex_lock(&vblk->config_lock);
323 if (!vblk->config_enable)
324 goto done;
325
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100326 /* Host must always specify the capacity. */
327 vdev->config->get(vdev, offsetof(struct virtio_blk_config, capacity),
328 &capacity, sizeof(capacity));
329
330 /* If capacity is too big, truncate with warning. */
331 if ((sector_t)capacity != capacity) {
332 dev_warn(&vdev->dev, "Capacity %llu too large: truncating\n",
333 (unsigned long long)capacity);
334 capacity = (sector_t)-1;
335 }
336
337 size = capacity * queue_logical_block_size(q);
338 string_get_size(size, STRING_UNITS_2, cap_str_2, sizeof(cap_str_2));
339 string_get_size(size, STRING_UNITS_10, cap_str_10, sizeof(cap_str_10));
340
341 dev_notice(&vdev->dev,
342 "new size: %llu %d-byte logical blocks (%s/%s)\n",
343 (unsigned long long)capacity,
344 queue_logical_block_size(q),
345 cap_str_10, cap_str_2);
346
347 set_capacity(vblk->disk, capacity);
Vivek Goyale9986f32012-03-29 10:09:44 +0200348 revalidate_disk(vblk->disk);
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +1030349done:
350 mutex_unlock(&vblk->config_lock);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100351}
352
353static void virtblk_config_changed(struct virtio_device *vdev)
354{
355 struct virtio_blk *vblk = vdev->priv;
356
357 queue_work(virtblk_wq, &vblk->config_work);
358}
359
Amit Shah6abd6e52011-12-22 16:58:29 +0530360static int init_vq(struct virtio_blk *vblk)
361{
362 int err = 0;
363
364 /* We expect one virtqueue, for output. */
365 vblk->vq = virtio_find_single_vq(vblk->vdev, blk_done, "requests");
366 if (IS_ERR(vblk->vq))
367 err = PTR_ERR(vblk->vq);
368
369 return err;
370}
371
/*
 * Legacy naming scheme used for virtio devices.  We are stuck with it for
 * virtio blk but don't ever use it for any new driver.
 *
 * Writes @prefix followed by a letter suffix for @index into @buf:
 * 0 -> "a", 25 -> "z", 26 -> "aa", 701 -> "zz", 702 -> "aaa", ...
 *
 * @prefix: string placed in front of the suffix (e.g. "vd")
 * @index:  zero-based disk index; must not be negative
 * @buf:    destination buffer
 * @buflen: size of @buf in bytes, including room for the trailing NUL
 *
 * Returns 0 on success, -EINVAL if @index is negative or the name does not
 * fit into @buf (the buffer content is unspecified in that case).
 */
static int virtblk_name_format(const char *prefix, int index, char *buf,
			       int buflen)
{
	const int base = 'z' - 'a' + 1;
	size_t prefix_len = strlen(prefix);
	char *begin, *end, *p;

	/*
	 * Need room for the prefix, at least one letter and the NUL.
	 * Without this check a too-small buffer would place 'begin' at or
	 * past 'end' and the loop below would write in front of @buf.
	 */
	if (index < 0 || buflen < 0 || (size_t)buflen < prefix_len + 2)
		return -EINVAL;

	begin = buf + prefix_len;
	end = buf + buflen;

	/* Build the suffix right-aligned at the end of the buffer. */
	p = end - 1;
	*p = '\0';
	do {
		if (p == begin)
			return -EINVAL;
		*--p = 'a' + (index % base);
		index = (index / base) - 1;
	} while (index >= 0);

	/* Slide the suffix (with its NUL) behind the prefix slot. */
	memmove(begin, p, end - p);
	memcpy(buf, prefix, prefix_len);

	return 0;
}
399
Mike Frysinger98e94442009-05-18 03:39:09 -0400400static int __devinit virtblk_probe(struct virtio_device *vdev)
Rusty Russelle467cde2007-10-22 11:03:38 +1000401{
402 struct virtio_blk *vblk;
Christoph Hellwig69740c82010-02-24 14:22:25 -0600403 struct request_queue *q;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200404 int err, index;
Rusty Russelle467cde2007-10-22 11:03:38 +1000405 u64 cap;
Christoph Hellwig69740c82010-02-24 14:22:25 -0600406 u32 v, blk_size, sg_elems, opt_io_size;
407 u16 min_io_size;
408 u8 physical_block_exp, alignment_offset;
Rusty Russelle467cde2007-10-22 11:03:38 +1000409
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200410 err = ida_simple_get(&vd_index_ida, 0, minor_to_index(1 << MINORBITS),
411 GFP_KERNEL);
412 if (err < 0)
413 goto out;
414 index = err;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100415
Rusty Russell0864b792008-12-30 09:26:05 -0600416 /* We need to know how many segments before we allocate. */
417 err = virtio_config_val(vdev, VIRTIO_BLK_F_SEG_MAX,
418 offsetof(struct virtio_blk_config, seg_max),
419 &sg_elems);
Christoph Hellwiga5b365a2010-05-25 14:17:54 +0200420
421 /* We need at least one SG element, whatever they say. */
422 if (err || !sg_elems)
Rusty Russell0864b792008-12-30 09:26:05 -0600423 sg_elems = 1;
424
425 /* We need an extra sg elements at head and tail. */
426 sg_elems += 2;
427 vdev->priv = vblk = kmalloc(sizeof(*vblk) +
428 sizeof(vblk->sg[0]) * sg_elems, GFP_KERNEL);
Rusty Russelle467cde2007-10-22 11:03:38 +1000429 if (!vblk) {
430 err = -ENOMEM;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200431 goto out_free_index;
Rusty Russelle467cde2007-10-22 11:03:38 +1000432 }
433
Rusty Russelle467cde2007-10-22 11:03:38 +1000434 spin_lock_init(&vblk->lock);
435 vblk->vdev = vdev;
Rusty Russell0864b792008-12-30 09:26:05 -0600436 vblk->sg_elems = sg_elems;
437 sg_init_table(vblk->sg, vblk->sg_elems);
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +1030438 mutex_init(&vblk->config_lock);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100439 INIT_WORK(&vblk->config_work, virtblk_config_changed_work);
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +1030440 vblk->config_enable = true;
Rusty Russelle467cde2007-10-22 11:03:38 +1000441
Amit Shah6abd6e52011-12-22 16:58:29 +0530442 err = init_vq(vblk);
443 if (err)
Rusty Russelle467cde2007-10-22 11:03:38 +1000444 goto out_free_vblk;
Rusty Russelle467cde2007-10-22 11:03:38 +1000445
446 vblk->pool = mempool_create_kmalloc_pool(1,sizeof(struct virtblk_req));
447 if (!vblk->pool) {
448 err = -ENOMEM;
449 goto out_free_vq;
450 }
451
Rusty Russelle467cde2007-10-22 11:03:38 +1000452 /* FIXME: How many partitions? How long is a piece of string? */
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100453 vblk->disk = alloc_disk(1 << PART_BITS);
Rusty Russelle467cde2007-10-22 11:03:38 +1000454 if (!vblk->disk) {
455 err = -ENOMEM;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100456 goto out_mempool;
Rusty Russelle467cde2007-10-22 11:03:38 +1000457 }
458
Christoph Hellwig69740c82010-02-24 14:22:25 -0600459 q = vblk->disk->queue = blk_init_queue(do_virtblk_request, &vblk->lock);
460 if (!q) {
Rusty Russelle467cde2007-10-22 11:03:38 +1000461 err = -ENOMEM;
462 goto out_put_disk;
463 }
464
Christoph Hellwig69740c82010-02-24 14:22:25 -0600465 q->queuedata = vblk;
Fernando Luis Vázquez Cao7d116b62008-10-27 18:45:15 +0900466
Ren Mingxinc0aa3e02012-04-10 15:28:05 +0800467 virtblk_name_format("vd", index, vblk->disk->disk_name, DISK_NAME_LEN);
Christian Borntraegerd50ed902008-02-01 09:05:00 +0100468
Rusty Russelle467cde2007-10-22 11:03:38 +1000469 vblk->disk->major = major;
Christian Borntraegerd50ed902008-02-01 09:05:00 +0100470 vblk->disk->first_minor = index_to_minor(index);
Rusty Russelle467cde2007-10-22 11:03:38 +1000471 vblk->disk->private_data = vblk;
472 vblk->disk->fops = &virtblk_fops;
Jeremy Katzc4839342008-03-02 17:00:15 -0500473 vblk->disk->driverfs_dev = &vdev->dev;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200474 vblk->index = index;
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100475
Tejun Heo02c42b72010-09-03 11:56:18 +0200476 /* configure queue flush support */
Tejun Heo4913efe2010-09-03 11:56:16 +0200477 if (virtio_has_feature(vdev, VIRTIO_BLK_F_FLUSH))
478 blk_queue_flush(q, REQ_FLUSH);
Rusty Russelle467cde2007-10-22 11:03:38 +1000479
Christian Borntraeger3ef53602008-05-16 11:17:03 +0200480 /* If disk is read-only in the host, the guest should obey */
481 if (virtio_has_feature(vdev, VIRTIO_BLK_F_RO))
482 set_disk_ro(vblk->disk, 1);
483
Rusty Russella586d4f2008-02-04 23:49:56 -0500484 /* Host must always specify the capacity. */
Rusty Russell72e61eb2008-05-02 21:50:49 -0500485 vdev->config->get(vdev, offsetof(struct virtio_blk_config, capacity),
486 &cap, sizeof(cap));
Rusty Russelle467cde2007-10-22 11:03:38 +1000487
488 /* If capacity is too big, truncate with warning. */
489 if ((sector_t)cap != cap) {
490 dev_warn(&vdev->dev, "Capacity %llu too large: truncating\n",
491 (unsigned long long)cap);
492 cap = (sector_t)-1;
493 }
494 set_capacity(vblk->disk, cap);
495
Rusty Russell0864b792008-12-30 09:26:05 -0600496 /* We can handle whatever the host told us to handle. */
Martin K. Petersenee714f22010-03-10 00:48:32 -0500497 blk_queue_max_segments(q, vblk->sg_elems-2);
Rusty Russell0864b792008-12-30 09:26:05 -0600498
Christoph Hellwig4eff3ca2009-07-17 21:47:45 -0600499 /* No need to bounce any requests */
Christoph Hellwig69740c82010-02-24 14:22:25 -0600500 blk_queue_bounce_limit(q, BLK_BOUNCE_ANY);
Christoph Hellwig4eff3ca2009-07-17 21:47:45 -0600501
Rusty Russell4b7f7e22008-12-30 09:26:04 -0600502 /* No real sector limit. */
Martin K. Petersenee714f22010-03-10 00:48:32 -0500503 blk_queue_max_hw_sectors(q, -1U);
Rusty Russell4b7f7e22008-12-30 09:26:04 -0600504
Rusty Russella586d4f2008-02-04 23:49:56 -0500505 /* Host can optionally specify maximum segment size and number of
506 * segments. */
507 err = virtio_config_val(vdev, VIRTIO_BLK_F_SIZE_MAX,
508 offsetof(struct virtio_blk_config, size_max),
509 &v);
Rusty Russelle467cde2007-10-22 11:03:38 +1000510 if (!err)
Christoph Hellwig69740c82010-02-24 14:22:25 -0600511 blk_queue_max_segment_size(q, v);
Rusty Russell4b7f7e22008-12-30 09:26:04 -0600512 else
Christoph Hellwig69740c82010-02-24 14:22:25 -0600513 blk_queue_max_segment_size(q, -1U);
Rusty Russelle467cde2007-10-22 11:03:38 +1000514
Christian Borntraeger066f4d82008-05-29 11:08:26 +0200515 /* Host can optionally specify the block size of the device */
516 err = virtio_config_val(vdev, VIRTIO_BLK_F_BLK_SIZE,
517 offsetof(struct virtio_blk_config, blk_size),
518 &blk_size);
519 if (!err)
Christoph Hellwig69740c82010-02-24 14:22:25 -0600520 blk_queue_logical_block_size(q, blk_size);
521 else
522 blk_size = queue_logical_block_size(q);
523
524 /* Use topology information if available */
525 err = virtio_config_val(vdev, VIRTIO_BLK_F_TOPOLOGY,
526 offsetof(struct virtio_blk_config, physical_block_exp),
527 &physical_block_exp);
528 if (!err && physical_block_exp)
529 blk_queue_physical_block_size(q,
530 blk_size * (1 << physical_block_exp));
531
532 err = virtio_config_val(vdev, VIRTIO_BLK_F_TOPOLOGY,
533 offsetof(struct virtio_blk_config, alignment_offset),
534 &alignment_offset);
535 if (!err && alignment_offset)
536 blk_queue_alignment_offset(q, blk_size * alignment_offset);
537
538 err = virtio_config_val(vdev, VIRTIO_BLK_F_TOPOLOGY,
539 offsetof(struct virtio_blk_config, min_io_size),
540 &min_io_size);
541 if (!err && min_io_size)
542 blk_queue_io_min(q, blk_size * min_io_size);
543
544 err = virtio_config_val(vdev, VIRTIO_BLK_F_TOPOLOGY,
545 offsetof(struct virtio_blk_config, opt_io_size),
546 &opt_io_size);
547 if (!err && opt_io_size)
548 blk_queue_io_opt(q, blk_size * opt_io_size);
549
Christian Borntraeger066f4d82008-05-29 11:08:26 +0200550
Rusty Russelle467cde2007-10-22 11:03:38 +1000551 add_disk(vblk->disk);
Ryan Harpera5eb9e42010-06-23 22:19:57 -0500552 err = device_create_file(disk_to_dev(vblk->disk), &dev_attr_serial);
553 if (err)
554 goto out_del_disk;
555
Rusty Russelle467cde2007-10-22 11:03:38 +1000556 return 0;
557
Ryan Harpera5eb9e42010-06-23 22:19:57 -0500558out_del_disk:
559 del_gendisk(vblk->disk);
560 blk_cleanup_queue(vblk->disk->queue);
Rusty Russelle467cde2007-10-22 11:03:38 +1000561out_put_disk:
562 put_disk(vblk->disk);
Rusty Russelle467cde2007-10-22 11:03:38 +1000563out_mempool:
564 mempool_destroy(vblk->pool);
565out_free_vq:
Michael S. Tsirkind2a7ddd2009-06-12 22:16:36 -0600566 vdev->config->del_vqs(vdev);
Rusty Russelle467cde2007-10-22 11:03:38 +1000567out_free_vblk:
568 kfree(vblk);
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200569out_free_index:
570 ida_simple_remove(&vd_index_ida, index);
Rusty Russelle467cde2007-10-22 11:03:38 +1000571out:
572 return err;
573}
574
Mike Frysinger98e94442009-05-18 03:39:09 -0400575static void __devexit virtblk_remove(struct virtio_device *vdev)
Rusty Russelle467cde2007-10-22 11:03:38 +1000576{
577 struct virtio_blk *vblk = vdev->priv;
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200578 int index = vblk->index;
Asias Heb79d8662012-05-04 20:22:04 +0800579 struct virtblk_req *vbr;
580 unsigned long flags;
Rusty Russelle467cde2007-10-22 11:03:38 +1000581
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +1030582 /* Prevent config work handler from accessing the device. */
583 mutex_lock(&vblk->config_lock);
584 vblk->config_enable = false;
585 mutex_unlock(&vblk->config_lock);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100586
Rusty Russell6e5aa7e2008-02-04 23:50:03 -0500587 /* Stop all the virtqueues. */
588 vdev->config->reset(vdev);
589
Michael S. Tsirkin4678d6f2012-01-12 15:44:44 +1030590 flush_work(&vblk->config_work);
591
Chris Lalancetteac9d4632008-05-30 15:09:41 -0500592 del_gendisk(vblk->disk);
Asias Heb79d8662012-05-04 20:22:04 +0800593
594 /* Abort requests dispatched to driver. */
595 spin_lock_irqsave(&vblk->lock, flags);
596 while ((vbr = virtqueue_detach_unused_buf(vblk->vq))) {
597 __blk_end_request_all(vbr->req, -EIO);
598 mempool_free(vbr, vblk->pool);
599 }
600 spin_unlock_irqrestore(&vblk->lock, flags);
601
Rusty Russelle467cde2007-10-22 11:03:38 +1000602 blk_cleanup_queue(vblk->disk->queue);
603 put_disk(vblk->disk);
Rusty Russelle467cde2007-10-22 11:03:38 +1000604 mempool_destroy(vblk->pool);
Michael S. Tsirkind2a7ddd2009-06-12 22:16:36 -0600605 vdev->config->del_vqs(vdev);
Rusty Russelle467cde2007-10-22 11:03:38 +1000606 kfree(vblk);
Michael S. Tsirkin5087a502011-10-30 21:29:59 +0200607 ida_simple_remove(&vd_index_ida, index);
Rusty Russelle467cde2007-10-22 11:03:38 +1000608}
609
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530610#ifdef CONFIG_PM
611static int virtblk_freeze(struct virtio_device *vdev)
612{
613 struct virtio_blk *vblk = vdev->priv;
614
615 /* Ensure we don't receive any more interrupts */
616 vdev->config->reset(vdev);
617
618 /* Prevent config work handler from accessing the device. */
619 mutex_lock(&vblk->config_lock);
620 vblk->config_enable = false;
621 mutex_unlock(&vblk->config_lock);
622
623 flush_work(&vblk->config_work);
624
625 spin_lock_irq(vblk->disk->queue->queue_lock);
626 blk_stop_queue(vblk->disk->queue);
627 spin_unlock_irq(vblk->disk->queue->queue_lock);
628 blk_sync_queue(vblk->disk->queue);
629
630 vdev->config->del_vqs(vdev);
631 return 0;
632}
633
634static int virtblk_restore(struct virtio_device *vdev)
635{
636 struct virtio_blk *vblk = vdev->priv;
637 int ret;
638
639 vblk->config_enable = true;
640 ret = init_vq(vdev->priv);
641 if (!ret) {
642 spin_lock_irq(vblk->disk->queue->queue_lock);
643 blk_start_queue(vblk->disk->queue);
644 spin_unlock_irq(vblk->disk->queue->queue_lock);
645 }
646 return ret;
647}
648#endif
649
Márton Németh47483e22010-01-10 13:40:02 +0100650static const struct virtio_device_id id_table[] = {
Rusty Russelle467cde2007-10-22 11:03:38 +1000651 { VIRTIO_ID_BLOCK, VIRTIO_DEV_ANY_ID },
652 { 0 },
653};
654
Rusty Russellc45a6812008-05-02 21:50:50 -0500655static unsigned int features[] = {
Tejun Heo02c42b72010-09-03 11:56:18 +0200656 VIRTIO_BLK_F_SEG_MAX, VIRTIO_BLK_F_SIZE_MAX, VIRTIO_BLK_F_GEOMETRY,
657 VIRTIO_BLK_F_RO, VIRTIO_BLK_F_BLK_SIZE, VIRTIO_BLK_F_SCSI,
658 VIRTIO_BLK_F_FLUSH, VIRTIO_BLK_F_TOPOLOGY
Rusty Russellc45a6812008-05-02 21:50:50 -0500659};
660
Rakib Mullick4fbfff762009-07-17 20:13:22 +0600661/*
662 * virtio_blk causes spurious section mismatch warning by
663 * simultaneously referring to a __devinit and a __devexit function.
664 * Use __refdata to avoid this warning.
665 */
666static struct virtio_driver __refdata virtio_blk = {
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100667 .feature_table = features,
668 .feature_table_size = ARRAY_SIZE(features),
669 .driver.name = KBUILD_MODNAME,
670 .driver.owner = THIS_MODULE,
671 .id_table = id_table,
672 .probe = virtblk_probe,
673 .remove = __devexit_p(virtblk_remove),
674 .config_changed = virtblk_config_changed,
Amit Shahf8fb5bc2011-12-22 16:58:30 +0530675#ifdef CONFIG_PM
676 .freeze = virtblk_freeze,
677 .restore = virtblk_restore,
678#endif
Rusty Russelle467cde2007-10-22 11:03:38 +1000679};
680
681static int __init init(void)
682{
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100683 int error;
684
685 virtblk_wq = alloc_workqueue("virtio-blk", 0, 0);
686 if (!virtblk_wq)
687 return -ENOMEM;
688
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100689 major = register_blkdev(0, "virtblk");
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100690 if (major < 0) {
691 error = major;
692 goto out_destroy_workqueue;
693 }
694
695 error = register_virtio_driver(&virtio_blk);
696 if (error)
697 goto out_unregister_blkdev;
698 return 0;
699
700out_unregister_blkdev:
701 unregister_blkdev(major, "virtblk");
702out_destroy_workqueue:
703 destroy_workqueue(virtblk_wq);
704 return error;
Rusty Russelle467cde2007-10-22 11:03:38 +1000705}
706
707static void __exit fini(void)
708{
Christian Borntraeger4f3bf192008-01-31 15:53:53 +0100709 unregister_blkdev(major, "virtblk");
Rusty Russelle467cde2007-10-22 11:03:38 +1000710 unregister_virtio_driver(&virtio_blk);
Christoph Hellwig7a7c9242011-02-01 21:43:48 +0100711 destroy_workqueue(virtblk_wq);
Rusty Russelle467cde2007-10-22 11:03:38 +1000712}
713module_init(init);
714module_exit(fini);
715
716MODULE_DEVICE_TABLE(virtio, id_table);
717MODULE_DESCRIPTION("Virtio block driver");
718MODULE_LICENSE("GPL");