/*
 *  linux/fs/nfs/blocklayout/blocklayout.c
 *
 *  Module for the NFSv4.1 pNFS block layout driver.
 *
 *  Copyright (c) 2006 The Regents of the University of Michigan.
 *  All rights reserved.
 *
 *  Andy Adamson <andros@citi.umich.edu>
 *  Fred Isaman <iisaman@umich.edu>
 *
 * permission is granted to use, copy, create derivative works and
 * redistribute this software and such derivative works for any purpose,
 * so long as the name of the university of michigan is not used in
 * any advertising or publicity pertaining to the use or distribution
 * of this software without specific, written prior authorization.  if
 * the above copyright notice or any other identification of the
 * university of michigan is included in any copy of any portion of
 * this software, then the disclaimer below must also be included.
 *
 * this software is provided as is, without representation from the
 * university of michigan as to its fitness for any purpose, and without
 * warranty by the university of michigan of any kind, either express
 * or implied, including without limitation the implied warranties of
 * merchantability and fitness for a particular purpose.  the regents
 * of the university of michigan shall not be liable for any damages,
 * including special, indirect, incidental, or consequential damages,
 * with respect to any claim arising out or in connection with the use
 * of the software, even if it has been or is hereafter advised of the
 * possibility of such damages.
 */
32#include <linux/module.h>
33#include <linux/init.h>
Jim Reesfe0a9b72011-07-30 20:52:42 -040034#include <linux/mount.h>
35#include <linux/namei.h>
Fred Isaman155e7522011-07-30 20:52:39 -040036
37#include "blocklayout.h"
38
39#define NFSDBG_FACILITY NFSDBG_PNFS_LD
40
41MODULE_LICENSE("GPL");
42MODULE_AUTHOR("Andy Adamson <andros@citi.umich.edu>");
43MODULE_DESCRIPTION("The NFSv4.1 pNFS Block layout driver");
44
Jim Reesfe0a9b72011-07-30 20:52:42 -040045struct dentry *bl_device_pipe;
46wait_queue_head_t bl_wq;
47
Fred Isaman155e7522011-07-30 20:52:39 -040048static enum pnfs_try_status
49bl_read_pagelist(struct nfs_read_data *rdata)
50{
51 return PNFS_NOT_ATTEMPTED;
52}
53
54static enum pnfs_try_status
55bl_write_pagelist(struct nfs_write_data *wdata,
56 int sync)
57{
58 return PNFS_NOT_ATTEMPTED;
59}
60
Fred Isaman9e692962011-07-30 20:52:41 -040061/* FIXME - range ignored */
Fred Isaman155e7522011-07-30 20:52:39 -040062static void
Fred Isaman9e692962011-07-30 20:52:41 -040063release_extents(struct pnfs_block_layout *bl, struct pnfs_layout_range *range)
Fred Isaman155e7522011-07-30 20:52:39 -040064{
Fred Isaman9e692962011-07-30 20:52:41 -040065 int i;
66 struct pnfs_block_extent *be;
67
68 spin_lock(&bl->bl_ext_lock);
69 for (i = 0; i < EXTENT_LISTS; i++) {
70 while (!list_empty(&bl->bl_extents[i])) {
71 be = list_first_entry(&bl->bl_extents[i],
72 struct pnfs_block_extent,
73 be_node);
74 list_del(&be->be_node);
75 bl_put_extent(be);
76 }
77 }
78 spin_unlock(&bl->bl_ext_lock);
Fred Isaman155e7522011-07-30 20:52:39 -040079}
80
Fred Isaman155e7522011-07-30 20:52:39 -040081static void
82release_inval_marks(struct pnfs_inval_markings *marks)
83{
Fred Isamanc1c2a4c2011-07-30 20:52:49 -040084 struct pnfs_inval_tracking *pos, *temp;
85
86 list_for_each_entry_safe(pos, temp, &marks->im_tree.mtt_stub, it_link) {
87 list_del(&pos->it_link);
88 kfree(pos);
89 }
Fred Isaman155e7522011-07-30 20:52:39 -040090 return;
91}
92
93static void bl_free_layout_hdr(struct pnfs_layout_hdr *lo)
94{
95 struct pnfs_block_layout *bl = BLK_LO2EXT(lo);
96
97 dprintk("%s enter\n", __func__);
98 release_extents(bl, NULL);
99 release_inval_marks(&bl->bl_inval);
100 kfree(bl);
101}
102
103static struct pnfs_layout_hdr *bl_alloc_layout_hdr(struct inode *inode,
104 gfp_t gfp_flags)
105{
106 struct pnfs_block_layout *bl;
107
108 dprintk("%s enter\n", __func__);
109 bl = kzalloc(sizeof(*bl), gfp_flags);
110 if (!bl)
111 return NULL;
112 spin_lock_init(&bl->bl_ext_lock);
113 INIT_LIST_HEAD(&bl->bl_extents[0]);
114 INIT_LIST_HEAD(&bl->bl_extents[1]);
115 INIT_LIST_HEAD(&bl->bl_commit);
116 INIT_LIST_HEAD(&bl->bl_committing);
117 bl->bl_count = 0;
118 bl->bl_blocksize = NFS_SERVER(inode)->pnfs_blksize >> SECTOR_SHIFT;
119 BL_INIT_INVAL_MARKS(&bl->bl_inval, bl->bl_blocksize);
120 return &bl->bl_layout;
121}
122
/*
 * ->free_lseg hook: the segment carries no driver-private data here, so
 * freeing it is a plain kfree().
 */
static void bl_free_lseg(struct pnfs_layout_segment *lseg)
{
	dprintk("%s enter\n", __func__);

	kfree(lseg);
}
128
Fred Isamana60d2eb2011-07-30 20:52:44 -0400129/* We pretty much ignore lseg, and store all data layout wide, so we
130 * can correctly merge.
131 */
132static struct pnfs_layout_segment *bl_alloc_lseg(struct pnfs_layout_hdr *lo,
133 struct nfs4_layoutget_res *lgr,
134 gfp_t gfp_flags)
Fred Isaman155e7522011-07-30 20:52:39 -0400135{
Fred Isamana60d2eb2011-07-30 20:52:44 -0400136 struct pnfs_layout_segment *lseg;
137 int status;
138
139 dprintk("%s enter\n", __func__);
140 lseg = kzalloc(sizeof(*lseg), gfp_flags);
141 if (!lseg)
142 return ERR_PTR(-ENOMEM);
143 status = nfs4_blk_process_layoutget(lo, lgr, gfp_flags);
144 if (status) {
145 /* We don't want to call the full-blown bl_free_lseg,
146 * since on error extents were not touched.
147 */
148 kfree(lseg);
149 return ERR_PTR(status);
150 }
151 return lseg;
Fred Isaman155e7522011-07-30 20:52:39 -0400152}
153
/*
 * ->encode_layoutcommit hook: hand the block layout behind @lo, together
 * with @xdr and @arg, to encode_pnfs_block_layoutupdate().
 */
static void bl_encode_layoutcommit(struct pnfs_layout_hdr *lo,
				   struct xdr_stream *xdr,
				   const struct nfs4_layoutcommit_args *arg)
{
	dprintk("%s enter\n", __func__);

	encode_pnfs_block_layoutupdate(BLK_LO2EXT(lo), xdr, arg);
}
161
/* ->cleanup_layoutcommit hook: intentionally empty, @lcdata is untouched. */
static void bl_cleanup_layoutcommit(struct nfs4_layoutcommit_data *lcdata)
{
}
166
Fred Isaman2f9fd182011-07-30 20:52:46 -0400167static void free_blk_mountid(struct block_mount_id *mid)
168{
169 if (mid) {
170 struct pnfs_block_dev *dev;
171 spin_lock(&mid->bm_lock);
172 while (!list_empty(&mid->bm_devlist)) {
173 dev = list_first_entry(&mid->bm_devlist,
174 struct pnfs_block_dev,
175 bm_node);
176 list_del(&dev->bm_node);
177 bl_free_block_dev(dev);
178 }
179 spin_unlock(&mid->bm_lock);
180 kfree(mid);
181 }
182}
183
184/* This is mostly copied from the filelayout's get_device_info function.
185 * It seems much of this should be at the generic pnfs level.
186 */
187static struct pnfs_block_dev *
188nfs4_blk_get_deviceinfo(struct nfs_server *server, const struct nfs_fh *fh,
189 struct nfs4_deviceid *d_id)
190{
191 struct pnfs_device *dev;
192 struct pnfs_block_dev *rv = NULL;
193 u32 max_resp_sz;
194 int max_pages;
195 struct page **pages = NULL;
196 int i, rc;
197
198 /*
199 * Use the session max response size as the basis for setting
200 * GETDEVICEINFO's maxcount
201 */
202 max_resp_sz = server->nfs_client->cl_session->fc_attrs.max_resp_sz;
203 max_pages = max_resp_sz >> PAGE_SHIFT;
204 dprintk("%s max_resp_sz %u max_pages %d\n",
205 __func__, max_resp_sz, max_pages);
206
207 dev = kmalloc(sizeof(*dev), GFP_NOFS);
208 if (!dev) {
209 dprintk("%s kmalloc failed\n", __func__);
210 return NULL;
211 }
212
213 pages = kzalloc(max_pages * sizeof(struct page *), GFP_NOFS);
214 if (pages == NULL) {
215 kfree(dev);
216 return NULL;
217 }
218 for (i = 0; i < max_pages; i++) {
219 pages[i] = alloc_page(GFP_NOFS);
220 if (!pages[i])
221 goto out_free;
222 }
223
224 memcpy(&dev->dev_id, d_id, sizeof(*d_id));
225 dev->layout_type = LAYOUT_BLOCK_VOLUME;
226 dev->pages = pages;
227 dev->pgbase = 0;
228 dev->pglen = PAGE_SIZE * max_pages;
229 dev->mincount = 0;
230
231 dprintk("%s: dev_id: %s\n", __func__, dev->dev_id.data);
232 rc = nfs4_proc_getdeviceinfo(server, dev);
233 dprintk("%s getdevice info returns %d\n", __func__, rc);
234 if (rc)
235 goto out_free;
236
237 rv = nfs4_blk_decode_device(server, dev);
238 out_free:
239 for (i = 0; i < max_pages; i++)
240 __free_page(pages[i]);
241 kfree(pages);
242 kfree(dev);
243 return rv;
244}
245
Fred Isaman155e7522011-07-30 20:52:39 -0400246static int
247bl_set_layoutdriver(struct nfs_server *server, const struct nfs_fh *fh)
248{
Fred Isaman2f9fd182011-07-30 20:52:46 -0400249 struct block_mount_id *b_mt_id = NULL;
250 struct pnfs_devicelist *dlist = NULL;
251 struct pnfs_block_dev *bdev;
252 LIST_HEAD(block_disklist);
253 int status = 0, i;
254
Fred Isaman155e7522011-07-30 20:52:39 -0400255 dprintk("%s enter\n", __func__);
Fred Isaman2f9fd182011-07-30 20:52:46 -0400256
257 if (server->pnfs_blksize == 0) {
258 dprintk("%s Server did not return blksize\n", __func__);
259 return -EINVAL;
260 }
261 b_mt_id = kzalloc(sizeof(struct block_mount_id), GFP_NOFS);
262 if (!b_mt_id) {
263 status = -ENOMEM;
264 goto out_error;
265 }
266 /* Initialize nfs4 block layout mount id */
267 spin_lock_init(&b_mt_id->bm_lock);
268 INIT_LIST_HEAD(&b_mt_id->bm_devlist);
269
270 dlist = kmalloc(sizeof(struct pnfs_devicelist), GFP_NOFS);
271 if (!dlist) {
272 status = -ENOMEM;
273 goto out_error;
274 }
275 dlist->eof = 0;
276 while (!dlist->eof) {
277 status = nfs4_proc_getdevicelist(server, fh, dlist);
278 if (status)
279 goto out_error;
280 dprintk("%s GETDEVICELIST numdevs=%i, eof=%i\n",
281 __func__, dlist->num_devs, dlist->eof);
282 for (i = 0; i < dlist->num_devs; i++) {
283 bdev = nfs4_blk_get_deviceinfo(server, fh,
284 &dlist->dev_id[i]);
285 if (!bdev) {
286 status = -ENODEV;
287 goto out_error;
288 }
289 spin_lock(&b_mt_id->bm_lock);
290 list_add(&bdev->bm_node, &b_mt_id->bm_devlist);
291 spin_unlock(&b_mt_id->bm_lock);
292 }
293 }
294 dprintk("%s SUCCESS\n", __func__);
295 server->pnfs_ld_data = b_mt_id;
296
297 out_return:
298 kfree(dlist);
299 return status;
300
301 out_error:
302 free_blk_mountid(b_mt_id);
303 goto out_return;
Fred Isaman155e7522011-07-30 20:52:39 -0400304}
305
306static int
307bl_clear_layoutdriver(struct nfs_server *server)
308{
Fred Isaman2f9fd182011-07-30 20:52:46 -0400309 struct block_mount_id *b_mt_id = server->pnfs_ld_data;
310
Fred Isaman155e7522011-07-30 20:52:39 -0400311 dprintk("%s enter\n", __func__);
Fred Isaman2f9fd182011-07-30 20:52:46 -0400312 free_blk_mountid(b_mt_id);
313 dprintk("%s RETURNS\n", __func__);
Fred Isaman155e7522011-07-30 20:52:39 -0400314 return 0;
315}
316
Benny Halevye9643fe2011-07-30 20:52:40 -0400317static const struct nfs_pageio_ops bl_pg_read_ops = {
318 .pg_init = pnfs_generic_pg_init_read,
319 .pg_test = pnfs_generic_pg_test,
320 .pg_doio = pnfs_generic_pg_readpages,
321};
322
323static const struct nfs_pageio_ops bl_pg_write_ops = {
324 .pg_init = pnfs_generic_pg_init_write,
325 .pg_test = pnfs_generic_pg_test,
326 .pg_doio = pnfs_generic_pg_writepages,
327};
328
Fred Isaman155e7522011-07-30 20:52:39 -0400329static struct pnfs_layoutdriver_type blocklayout_type = {
330 .id = LAYOUT_BLOCK_VOLUME,
331 .name = "LAYOUT_BLOCK_VOLUME",
332 .read_pagelist = bl_read_pagelist,
333 .write_pagelist = bl_write_pagelist,
334 .alloc_layout_hdr = bl_alloc_layout_hdr,
335 .free_layout_hdr = bl_free_layout_hdr,
336 .alloc_lseg = bl_alloc_lseg,
337 .free_lseg = bl_free_lseg,
338 .encode_layoutcommit = bl_encode_layoutcommit,
339 .cleanup_layoutcommit = bl_cleanup_layoutcommit,
340 .set_layoutdriver = bl_set_layoutdriver,
341 .clear_layoutdriver = bl_clear_layoutdriver,
Benny Halevye9643fe2011-07-30 20:52:40 -0400342 .pg_read_ops = &bl_pg_read_ops,
343 .pg_write_ops = &bl_pg_write_ops,
Fred Isaman155e7522011-07-30 20:52:39 -0400344};
345
Jim Reesfe0a9b72011-07-30 20:52:42 -0400346static const struct rpc_pipe_ops bl_upcall_ops = {
347 .upcall = bl_pipe_upcall,
348 .downcall = bl_pipe_downcall,
349 .destroy_msg = bl_pipe_destroy_msg,
350};
351
Fred Isaman155e7522011-07-30 20:52:39 -0400352static int __init nfs4blocklayout_init(void)
353{
Jim Reesfe0a9b72011-07-30 20:52:42 -0400354 struct vfsmount *mnt;
355 struct path path;
Fred Isaman155e7522011-07-30 20:52:39 -0400356 int ret;
357
358 dprintk("%s: NFSv4 Block Layout Driver Registering...\n", __func__);
359
360 ret = pnfs_register_layoutdriver(&blocklayout_type);
Jim Reesfe0a9b72011-07-30 20:52:42 -0400361 if (ret)
362 goto out;
363
364 init_waitqueue_head(&bl_wq);
365
366 mnt = rpc_get_mount();
367 if (IS_ERR(mnt)) {
368 ret = PTR_ERR(mnt);
369 goto out_remove;
370 }
371
372 ret = vfs_path_lookup(mnt->mnt_root,
373 mnt,
374 NFS_PIPE_DIRNAME, 0, &path);
375 if (ret)
376 goto out_remove;
377
378 bl_device_pipe = rpc_mkpipe(path.dentry, "blocklayout", NULL,
379 &bl_upcall_ops, 0);
380 if (IS_ERR(bl_device_pipe)) {
381 ret = PTR_ERR(bl_device_pipe);
382 goto out_remove;
383 }
384out:
385 return ret;
386
387out_remove:
388 pnfs_unregister_layoutdriver(&blocklayout_type);
Fred Isaman155e7522011-07-30 20:52:39 -0400389 return ret;
390}
391
392static void __exit nfs4blocklayout_exit(void)
393{
394 dprintk("%s: NFSv4 Block Layout Driver Unregistering...\n",
395 __func__);
396
397 pnfs_unregister_layoutdriver(&blocklayout_type);
Jim Reesfe0a9b72011-07-30 20:52:42 -0400398 rpc_unlink(bl_device_pipe);
Fred Isaman155e7522011-07-30 20:52:39 -0400399}
400
401MODULE_ALIAS("nfs-layouttype4-3");
402
403module_init(nfs4blocklayout_init);
404module_exit(nfs4blocklayout_exit);