blob: 60103e2517ba28ac5c946f32e1bd9e0e6eb7f668 [file] [log] [blame]
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -04001/*
2 * This program is free software; you can redistribute it and/or
3 * modify it under the terms of the GNU General Public License version 2
4 * as published by the Free Software Foundation; or, when distributed
5 * separately from the Linux kernel or incorporated into other
6 * software packages, subject to the following license:
7 *
8 * Permission is hereby granted, free of charge, to any person obtaining a copy
9 * of this source file (the "Software"), to deal in the Software without
10 * restriction, including without limitation the rights to use, copy, modify,
11 * merge, publish, distribute, sublicense, and/or sell copies of the Software,
12 * and to permit persons to whom the Software is furnished to do so, subject to
13 * the following conditions:
14 *
15 * The above copyright notice and this permission notice shall be included in
16 * all copies or substantial portions of the Software.
17 *
18 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
19 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
20 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
21 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
22 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
23 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
24 * IN THE SOFTWARE.
25 */
26
Konrad Rzeszutek Wilk5a577e32011-05-12 16:58:21 -040027#ifndef __XEN_BLKIF__BACKEND__COMMON_H__
28#define __XEN_BLKIF__BACKEND__COMMON_H__
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040029
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040030#include <linux/module.h>
31#include <linux/interrupt.h>
32#include <linux/slab.h>
33#include <linux/blkdev.h>
34#include <linux/vmalloc.h>
35#include <linux/wait.h>
Konrad Rzeszutek Wilk54893772011-04-14 17:21:50 -040036#include <linux/io.h>
Roger Pau Monne0a8704a2012-10-24 18:58:45 +020037#include <linux/rbtree.h>
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040038#include <asm/setup.h>
39#include <asm/pgalloc.h>
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040040#include <asm/hypervisor.h>
Jeremy Fitzhardinge88122932009-02-09 12:05:51 -080041#include <xen/grant_table.h>
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040042#include <xen/xenbus.h>
Konrad Rzeszutek Wilk452a6b22011-05-12 16:31:51 -040043#include <xen/interface/io/ring.h>
44#include <xen/interface/io/blkif.h>
45#include <xen/interface/io/protocols.h>
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040046
/* Prefix placed in front of every message printed by this driver. */
#define DRV_PFX "xen-blkback:"

/*
 * Debug print helper built on pr_debug().  The message is tagged with the
 * driver prefix, the calling function and the source line, and ".\n" is
 * appended to the caller's format string.
 */
#define DPRINTK(fmt, ...)					\
	pr_debug(DRV_PFX "(%s:%d) " fmt ".\n",			\
		 __func__, __LINE__, ##__VA_ARGS__)
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -040051
Konrad Rzeszutek Wilk452a6b22011-05-12 16:31:51 -040052
/*
 * Placeholder "protocol".  It is never spoken on the wire; it only exists
 * so that ring structs can be generated which expose just the elements
 * shared by every real protocol.  Code touching only those common elements
 * can then be checked by the compiler and does not need a
 * switch (protocol) at each use.
 */
struct blkif_common_request {
	char dummy;
};

struct blkif_common_response {
	char dummy;
};
63
Li Dongyangb3cb0d62011-09-01 18:39:10 +080064struct blkif_x86_32_request_rw {
Konrad Rzeszutek Wilk452a6b22011-05-12 16:31:51 -040065 uint8_t nr_segments; /* number of segments */
66 blkif_vdev_t handle; /* only for read/write requests */
67 uint64_t id; /* private guest value, echoed in resp */
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -040068 blkif_sector_t sector_number;/* start sector idx on disk (r/w only) */
69 struct blkif_request_segment seg[BLKIF_MAX_SEGMENTS_PER_REQUEST];
70} __attribute__((__packed__));
71
72struct blkif_x86_32_request_discard {
Konrad Rzeszutek Wilk5ea42982011-10-12 16:23:30 -040073 uint8_t flag; /* BLKIF_DISCARD_SECURE or zero */
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -040074 blkif_vdev_t _pad1; /* was "handle" for read/write requests */
75 uint64_t id; /* private guest value, echoed in resp */
76 blkif_sector_t sector_number;/* start sector idx on disk (r/w only) */
77 uint64_t nr_sectors;
78} __attribute__((__packed__));
79
David Vrabel0e367ae2013-03-07 17:32:01 +000080struct blkif_x86_32_request_other {
81 uint8_t _pad1;
82 blkif_vdev_t _pad2;
83 uint64_t id; /* private guest value, echoed in resp */
84} __attribute__((__packed__));
85
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -040086struct blkif_x86_32_request {
87 uint8_t operation; /* BLKIF_OP_??? */
Li Dongyangb3cb0d62011-09-01 18:39:10 +080088 union {
89 struct blkif_x86_32_request_rw rw;
90 struct blkif_x86_32_request_discard discard;
David Vrabel0e367ae2013-03-07 17:32:01 +000091 struct blkif_x86_32_request_other other;
Li Dongyangb3cb0d62011-09-01 18:39:10 +080092 } u;
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -040093} __attribute__((__packed__));
94
/*
 * i386 protocol version of the response.  Member alignment is capped at
 * 4 bytes for the duration of this definition, so the 64-bit id does not
 * raise the struct's alignment to 8.
 */
#pragma pack(push, 4)
struct blkif_x86_32_response {
	/* Copied from the request. */
	uint64_t id;
	/* Copied from the request. */
	uint8_t  operation;
	/* BLKIF_RSP_??? */
	int16_t  status;
};
#pragma pack(pop)
Konrad Rzeszutek Wilk452a6b22011-05-12 16:31:51 -0400103/* x86_64 protocol version */
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800104
105struct blkif_x86_64_request_rw {
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400106 uint8_t nr_segments; /* number of segments */
107 blkif_vdev_t handle; /* only for read/write requests */
108 uint32_t _pad1; /* offsetof(blkif_reqest..,u.rw.id)==8 */
109 uint64_t id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800110 blkif_sector_t sector_number;/* start sector idx on disk (r/w only) */
111 struct blkif_request_segment seg[BLKIF_MAX_SEGMENTS_PER_REQUEST];
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400112} __attribute__((__packed__));
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800113
114struct blkif_x86_64_request_discard {
Konrad Rzeszutek Wilk5ea42982011-10-12 16:23:30 -0400115 uint8_t flag; /* BLKIF_DISCARD_SECURE or zero */
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400116 blkif_vdev_t _pad1; /* was "handle" for read/write requests */
117 uint32_t _pad2; /* offsetof(blkif_..,u.discard.id)==8 */
118 uint64_t id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800119 blkif_sector_t sector_number;/* start sector idx on disk (r/w only) */
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400120 uint64_t nr_sectors;
121} __attribute__((__packed__));
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800122
David Vrabel0e367ae2013-03-07 17:32:01 +0000123struct blkif_x86_64_request_other {
124 uint8_t _pad1;
125 blkif_vdev_t _pad2;
126 uint32_t _pad3; /* offsetof(blkif_..,u.discard.id)==8 */
127 uint64_t id; /* private guest value, echoed in resp */
128} __attribute__((__packed__));
129
Konrad Rzeszutek Wilk452a6b22011-05-12 16:31:51 -0400130struct blkif_x86_64_request {
131 uint8_t operation; /* BLKIF_OP_??? */
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800132 union {
133 struct blkif_x86_64_request_rw rw;
134 struct blkif_x86_64_request_discard discard;
David Vrabel0e367ae2013-03-07 17:32:01 +0000135 struct blkif_x86_64_request_other other;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800136 } u;
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400137} __attribute__((__packed__));
138
/*
 * x86_64 protocol version of the response.  The id is explicitly aligned
 * to 8 bytes, independent of the compiling architecture's default.
 */
struct blkif_x86_64_response {
	uint64_t __attribute__((__aligned__(8))) id;
	/* Copied from the request. */
	uint8_t  operation;
	/* BLKIF_RSP_??? */
	int16_t  status;
};
Konrad Rzeszutek Wilk452a6b22011-05-12 16:31:51 -0400144
145DEFINE_RING_TYPES(blkif_common, struct blkif_common_request,
146 struct blkif_common_response);
147DEFINE_RING_TYPES(blkif_x86_32, struct blkif_x86_32_request,
148 struct blkif_x86_32_response);
149DEFINE_RING_TYPES(blkif_x86_64, struct blkif_x86_64_request,
150 struct blkif_x86_64_response);
151
152union blkif_back_rings {
153 struct blkif_back_ring native;
154 struct blkif_common_back_ring common;
155 struct blkif_x86_32_back_ring x86_32;
156 struct blkif_x86_64_back_ring x86_64;
157};
158
/*
 * Identifies which request/response layout an interface uses.  Numbering
 * starts at 1, so a zero value matches none of the enumerators.
 */
enum blkif_protocol {
	BLKIF_PROTOCOL_NATIVE = 1,
	BLKIF_PROTOCOL_X86_32 = 2,
	BLKIF_PROTOCOL_X86_64 = 3,
};
164
Konrad Rzeszutek Wilk3d814732011-05-12 16:53:56 -0400165struct xen_vbd {
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400166 /* What the domain refers to this vbd as. */
167 blkif_vdev_t handle;
168 /* Non-zero -> read-only */
169 unsigned char readonly;
170 /* VDISK_xxx */
171 unsigned char type;
172 /* phys device that this vbd maps to. */
173 u32 pdevice;
174 struct block_device *bdev;
175 /* Cached size parameter. */
176 sector_t size;
Oliver Chick1f999572012-09-21 10:04:18 +0100177 unsigned int flush_support:1;
178 unsigned int discard_secure:1;
Roger Pau Monne0a8704a2012-10-24 18:58:45 +0200179 unsigned int feature_gnt_persistent:1;
180 unsigned int overflow_max_grants:1;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400181};
182
183struct backend_info;
184
Roger Pau Monne0a8704a2012-10-24 18:58:45 +0200185
186struct persistent_gnt {
187 struct page *page;
188 grant_ref_t gnt;
189 grant_handle_t handle;
Roger Pau Monne0a8704a2012-10-24 18:58:45 +0200190 struct rb_node node;
191};
192
Konrad Rzeszutek Wilk30fd1502011-05-12 16:47:48 -0400193struct xen_blkif {
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400194 /* Unique identifier for this interface. */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400195 domid_t domid;
196 unsigned int handle;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400197 /* Physical parameters of the comms window. */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400198 unsigned int irq;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400199 /* Comms information. */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400200 enum blkif_protocol blk_protocol;
201 union blkif_back_rings blk_rings;
David Vrabel2d073842011-09-29 16:53:30 +0100202 void *blk_ring;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400203 /* The VBD attached to this interface. */
Konrad Rzeszutek Wilk3d814732011-05-12 16:53:56 -0400204 struct xen_vbd vbd;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400205 /* Back pointer to the backend_info. */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400206 struct backend_info *be;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400207 /* Private fields. */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400208 spinlock_t blk_ring_lock;
209 atomic_t refcnt;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400210
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400211 wait_queue_head_t wq;
Konrad Rzeszutek Wilk29bde092011-10-10 00:42:22 -0400212 /* for barrier (drain) requests */
213 struct completion drain_complete;
214 atomic_t drain;
Konrad Rzeszutek Wilka1397fa2011-04-14 17:05:23 -0400215 /* One thread per one blkif. */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400216 struct task_struct *xenblkd;
217 unsigned int waiting_reqs;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400218
Roger Pau Monne0a8704a2012-10-24 18:58:45 +0200219 /* tree to store persistent grants */
220 struct rb_root persistent_gnts;
221 unsigned int persistent_gnt_c;
222
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400223 /* statistics */
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400224 unsigned long st_print;
Zoltan Kiss986cacb2013-03-11 16:15:50 +0000225 unsigned long long st_rd_req;
226 unsigned long long st_wr_req;
227 unsigned long long st_oo_req;
228 unsigned long long st_f_req;
229 unsigned long long st_ds_req;
230 unsigned long long st_rd_sect;
231 unsigned long long st_wr_sect;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400232
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400233 wait_queue_head_t waiting_to_free;
Konrad Rzeszutek Wilk54893772011-04-14 17:21:50 -0400234};
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400235
Konrad Rzeszutek Wilk42c78412011-04-20 11:21:43 -0400236
/*
 * Size of the device behind a vbd, in sectors: the partition's nr_sects
 * when the block device has a bd_part, otherwise the capacity of the whole
 * disk.  Note that _v is evaluated more than once.
 */
#define vbd_sz(_v)						\
	(!(_v)->bdev->bd_part ?					\
		get_capacity((_v)->bdev->bd_disk) :		\
		(_v)->bdev->bd_part->nr_sects)
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400240
/* Take a reference on a struct xen_blkif. */
#define xen_blkif_get(_b) (atomic_inc(&(_b)->refcnt))

/*
 * Drop a reference on a struct xen_blkif.  The caller that brings refcnt
 * to zero wakes up anyone sleeping on waiting_to_free.
 */
#define xen_blkif_put(_b)					\
	do {							\
		if (!atomic_dec_and_test(&(_b)->refcnt))	\
			break;					\
		wake_up(&(_b)->waiting_to_free);		\
	} while (0)
247
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400248struct phys_req {
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400249 unsigned short dev;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800250 blkif_sector_t nr_sects;
Konrad Rzeszutek Wilk01f37f22011-05-11 15:57:09 -0400251 struct block_device *bdev;
252 blkif_sector_t sector_number;
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400253};
Konrad Rzeszutek Wilk8b6bf742011-04-20 11:50:43 -0400254int xen_blkif_interface_init(void);
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400255
Konrad Rzeszutek Wilk8b6bf742011-04-20 11:50:43 -0400256int xen_blkif_xenbus_init(void);
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400257
Konrad Rzeszutek Wilk8b6bf742011-04-20 11:50:43 -0400258irqreturn_t xen_blkif_be_int(int irq, void *dev_id);
259int xen_blkif_schedule(void *arg);
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400260
Konrad Rzeszutek Wilk24f567f2011-05-04 17:07:27 -0400261int xen_blkbk_flush_diskcache(struct xenbus_transaction xbt,
262 struct backend_info *be, int state);
Konrad Rzeszutek Wilk4d05a282011-04-14 18:25:47 -0400263
Konrad Rzeszutek Wilk29bde092011-10-10 00:42:22 -0400264int xen_blkbk_barrier(struct xenbus_transaction xbt,
265 struct backend_info *be, int state);
Konrad Rzeszutek Wilk8b6bf742011-04-20 11:50:43 -0400266struct xenbus_device *xen_blkbk_xenbus(struct backend_info *be);
Jeremy Fitzhardinge98e036a2010-03-18 15:35:05 -0700267
Konrad Rzeszutek Wilkb0f80122011-05-12 16:23:06 -0400268static inline void blkif_get_x86_32_req(struct blkif_request *dst,
Konrad Rzeszutek Wilk68c88dd2011-05-11 16:23:39 -0400269 struct blkif_x86_32_request *src)
270{
271 int i, n = BLKIF_MAX_SEGMENTS_PER_REQUEST;
272 dst->operation = src->operation;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800273 switch (src->operation) {
274 case BLKIF_OP_READ:
275 case BLKIF_OP_WRITE:
276 case BLKIF_OP_WRITE_BARRIER:
277 case BLKIF_OP_FLUSH_DISKCACHE:
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400278 dst->u.rw.nr_segments = src->u.rw.nr_segments;
279 dst->u.rw.handle = src->u.rw.handle;
280 dst->u.rw.id = src->u.rw.id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800281 dst->u.rw.sector_number = src->u.rw.sector_number;
282 barrier();
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400283 if (n > dst->u.rw.nr_segments)
284 n = dst->u.rw.nr_segments;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800285 for (i = 0; i < n; i++)
286 dst->u.rw.seg[i] = src->u.rw.seg[i];
287 break;
288 case BLKIF_OP_DISCARD:
Konrad Rzeszutek Wilk5ea42982011-10-12 16:23:30 -0400289 dst->u.discard.flag = src->u.discard.flag;
Konrad Rzeszutek Wilk8c9ce602012-05-25 16:11:09 -0400290 dst->u.discard.id = src->u.discard.id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800291 dst->u.discard.sector_number = src->u.discard.sector_number;
292 dst->u.discard.nr_sectors = src->u.discard.nr_sectors;
293 break;
294 default:
David Vrabel0e367ae2013-03-07 17:32:01 +0000295 /*
296 * Don't know how to translate this op. Only get the
297 * ID so failure can be reported to the frontend.
298 */
299 dst->u.other.id = src->u.other.id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800300 break;
301 }
Konrad Rzeszutek Wilk68c88dd2011-05-11 16:23:39 -0400302}
303
Konrad Rzeszutek Wilkb0f80122011-05-12 16:23:06 -0400304static inline void blkif_get_x86_64_req(struct blkif_request *dst,
Konrad Rzeszutek Wilk68c88dd2011-05-11 16:23:39 -0400305 struct blkif_x86_64_request *src)
306{
307 int i, n = BLKIF_MAX_SEGMENTS_PER_REQUEST;
308 dst->operation = src->operation;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800309 switch (src->operation) {
310 case BLKIF_OP_READ:
311 case BLKIF_OP_WRITE:
312 case BLKIF_OP_WRITE_BARRIER:
313 case BLKIF_OP_FLUSH_DISKCACHE:
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400314 dst->u.rw.nr_segments = src->u.rw.nr_segments;
315 dst->u.rw.handle = src->u.rw.handle;
316 dst->u.rw.id = src->u.rw.id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800317 dst->u.rw.sector_number = src->u.rw.sector_number;
318 barrier();
Konrad Rzeszutek Wilk97e36832011-10-12 12:12:36 -0400319 if (n > dst->u.rw.nr_segments)
320 n = dst->u.rw.nr_segments;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800321 for (i = 0; i < n; i++)
322 dst->u.rw.seg[i] = src->u.rw.seg[i];
323 break;
324 case BLKIF_OP_DISCARD:
Konrad Rzeszutek Wilk5ea42982011-10-12 16:23:30 -0400325 dst->u.discard.flag = src->u.discard.flag;
Konrad Rzeszutek Wilk8c9ce602012-05-25 16:11:09 -0400326 dst->u.discard.id = src->u.discard.id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800327 dst->u.discard.sector_number = src->u.discard.sector_number;
328 dst->u.discard.nr_sectors = src->u.discard.nr_sectors;
329 break;
330 default:
David Vrabel0e367ae2013-03-07 17:32:01 +0000331 /*
332 * Don't know how to translate this op. Only get the
333 * ID so failure can be reported to the frontend.
334 */
335 dst->u.other.id = src->u.other.id;
Li Dongyangb3cb0d62011-09-01 18:39:10 +0800336 break;
337 }
Konrad Rzeszutek Wilk68c88dd2011-05-11 16:23:39 -0400338}
339
Konrad Rzeszutek Wilk5a577e32011-05-12 16:58:21 -0400340#endif /* __XEN_BLKIF__BACKEND__COMMON_H__ */