blob: 142bfd0b16635a37c5c292515b41d77d5c2911c2 [file] [log] [blame]
/*
 * Device operations for the pnfs nfs4 file layout driver.
 *
 * Copyright (c) 2014, Primary Data, Inc. All rights reserved.
 *
 * Tao Peng <bergwolf@primarydata.com>
 */
8
9#include <linux/nfs_fs.h>
10#include <linux/vmalloc.h>
11#include <linux/module.h>
12#include <linux/sunrpc/addr.h>
13
14#include "../internal.h"
15#include "../nfs4session.h"
16#include "flexfilelayout.h"
17
18#define NFSDBG_FACILITY NFSDBG_PNFS_LD
19
Trond Myklebust15d03052016-08-16 11:08:22 -040020static unsigned int dataserver_timeo = NFS_DEF_TCP_RETRANS;
21static unsigned int dataserver_retrans;
Tom Haynesd67ae822014-12-11 17:02:04 -050022
23void nfs4_ff_layout_put_deviceid(struct nfs4_ff_layout_ds *mirror_ds)
24{
25 if (mirror_ds)
26 nfs4_put_deviceid_node(&mirror_ds->id_node);
27}
28
29void nfs4_ff_layout_free_deviceid(struct nfs4_ff_layout_ds *mirror_ds)
30{
31 nfs4_print_deviceid(&mirror_ds->id_node.deviceid);
32 nfs4_pnfs_ds_put(mirror_ds->ds);
Trond Myklebust84a80f62015-03-09 15:23:35 -040033 kfree_rcu(mirror_ds, id_node.rcu);
Tom Haynesd67ae822014-12-11 17:02:04 -050034}
35
36/* Decode opaque device data and construct new_ds using it */
37struct nfs4_ff_layout_ds *
38nfs4_ff_alloc_deviceid_node(struct nfs_server *server, struct pnfs_device *pdev,
39 gfp_t gfp_flags)
40{
41 struct xdr_stream stream;
42 struct xdr_buf buf;
43 struct page *scratch;
44 struct list_head dsaddrs;
45 struct nfs4_pnfs_ds_addr *da;
46 struct nfs4_ff_layout_ds *new_ds = NULL;
47 struct nfs4_ff_ds_version *ds_versions = NULL;
48 u32 mp_count;
49 u32 version_count;
50 __be32 *p;
51 int i, ret = -ENOMEM;
52
53 /* set up xdr stream */
54 scratch = alloc_page(gfp_flags);
55 if (!scratch)
56 goto out_err;
57
58 new_ds = kzalloc(sizeof(struct nfs4_ff_layout_ds), gfp_flags);
59 if (!new_ds)
60 goto out_scratch;
61
62 nfs4_init_deviceid_node(&new_ds->id_node,
63 server,
64 &pdev->dev_id);
65 INIT_LIST_HEAD(&dsaddrs);
66
67 xdr_init_decode_pages(&stream, &buf, pdev->pages, pdev->pglen);
68 xdr_set_scratch_buffer(&stream, page_address(scratch), PAGE_SIZE);
69
70 /* multipath count */
71 p = xdr_inline_decode(&stream, 4);
72 if (unlikely(!p))
73 goto out_err_drain_dsaddrs;
74 mp_count = be32_to_cpup(p);
75 dprintk("%s: multipath ds count %d\n", __func__, mp_count);
76
77 for (i = 0; i < mp_count; i++) {
78 /* multipath ds */
79 da = nfs4_decode_mp_ds_addr(server->nfs_client->cl_net,
80 &stream, gfp_flags);
81 if (da)
82 list_add_tail(&da->da_node, &dsaddrs);
83 }
84 if (list_empty(&dsaddrs)) {
85 dprintk("%s: no suitable DS addresses found\n",
86 __func__);
87 ret = -ENOMEDIUM;
88 goto out_err_drain_dsaddrs;
89 }
90
91 /* version count */
92 p = xdr_inline_decode(&stream, 4);
93 if (unlikely(!p))
94 goto out_err_drain_dsaddrs;
95 version_count = be32_to_cpup(p);
96 dprintk("%s: version count %d\n", __func__, version_count);
97
98 ds_versions = kzalloc(version_count * sizeof(struct nfs4_ff_ds_version),
99 gfp_flags);
100 if (!ds_versions)
101 goto out_scratch;
102
103 for (i = 0; i < version_count; i++) {
104 /* 20 = version(4) + minor_version(4) + rsize(4) + wsize(4) +
105 * tightly_coupled(4) */
106 p = xdr_inline_decode(&stream, 20);
107 if (unlikely(!p))
108 goto out_err_drain_dsaddrs;
109 ds_versions[i].version = be32_to_cpup(p++);
110 ds_versions[i].minor_version = be32_to_cpup(p++);
111 ds_versions[i].rsize = nfs_block_size(be32_to_cpup(p++), NULL);
112 ds_versions[i].wsize = nfs_block_size(be32_to_cpup(p++), NULL);
113 ds_versions[i].tightly_coupled = be32_to_cpup(p);
114
115 if (ds_versions[i].rsize > NFS_MAX_FILE_IO_SIZE)
116 ds_versions[i].rsize = NFS_MAX_FILE_IO_SIZE;
117 if (ds_versions[i].wsize > NFS_MAX_FILE_IO_SIZE)
118 ds_versions[i].wsize = NFS_MAX_FILE_IO_SIZE;
119
120 if (ds_versions[i].version != 3 || ds_versions[i].minor_version != 0) {
121 dprintk("%s: [%d] unsupported ds version %d-%d\n", __func__,
122 i, ds_versions[i].version,
123 ds_versions[i].minor_version);
124 ret = -EPROTONOSUPPORT;
125 goto out_err_drain_dsaddrs;
126 }
127
128 dprintk("%s: [%d] vers %u minor_ver %u rsize %u wsize %u coupled %d\n",
129 __func__, i, ds_versions[i].version,
130 ds_versions[i].minor_version,
131 ds_versions[i].rsize,
132 ds_versions[i].wsize,
133 ds_versions[i].tightly_coupled);
134 }
135
136 new_ds->ds_versions = ds_versions;
137 new_ds->ds_versions_cnt = version_count;
138
139 new_ds->ds = nfs4_pnfs_ds_add(&dsaddrs, gfp_flags);
140 if (!new_ds->ds)
141 goto out_err_drain_dsaddrs;
142
143 /* If DS was already in cache, free ds addrs */
144 while (!list_empty(&dsaddrs)) {
145 da = list_first_entry(&dsaddrs,
146 struct nfs4_pnfs_ds_addr,
147 da_node);
148 list_del_init(&da->da_node);
149 kfree(da->da_remotestr);
150 kfree(da);
151 }
152
153 __free_page(scratch);
154 return new_ds;
155
156out_err_drain_dsaddrs:
157 while (!list_empty(&dsaddrs)) {
158 da = list_first_entry(&dsaddrs, struct nfs4_pnfs_ds_addr,
159 da_node);
160 list_del_init(&da->da_node);
161 kfree(da->da_remotestr);
162 kfree(da);
163 }
164
165 kfree(ds_versions);
166out_scratch:
167 __free_page(scratch);
168out_err:
169 kfree(new_ds);
170
171 dprintk("%s ERROR: returning %d\n", __func__, ret);
172 return NULL;
173}
174
Trond Myklebust889d94d2015-09-01 00:58:24 -0700175static void ff_layout_mark_devid_invalid(struct pnfs_layout_segment *lseg,
176 struct nfs4_deviceid_node *devid)
177{
178 nfs4_mark_deviceid_unavailable(devid);
179 if (!ff_layout_has_available_ds(lseg))
180 pnfs_error_mark_layout_for_return(lseg->pls_layout->plh_inode,
181 lseg);
182}
183
184static bool ff_layout_mirror_valid(struct pnfs_layout_segment *lseg,
185 struct nfs4_ff_layout_mirror *mirror)
186{
187 if (mirror == NULL || mirror->mirror_ds == NULL) {
188 pnfs_error_mark_layout_for_return(lseg->pls_layout->plh_inode,
189 lseg);
190 return false;
191 }
192 if (mirror->mirror_ds->ds == NULL) {
193 struct nfs4_deviceid_node *devid;
194 devid = &mirror->mirror_ds->id_node;
195 ff_layout_mark_devid_invalid(lseg, devid);
196 return false;
197 }
198 return true;
199}
200
Tom Haynesd67ae822014-12-11 17:02:04 -0500201static void extend_ds_error(struct nfs4_ff_layout_ds_err *err,
202 u64 offset, u64 length)
203{
204 u64 end;
205
Trond Myklebust17822b22016-10-25 12:24:25 -0400206 end = max_t(u64, pnfs_end_offset(err->offset, err->length),
207 pnfs_end_offset(offset, length));
Tom Haynesd67ae822014-12-11 17:02:04 -0500208 err->offset = min_t(u64, err->offset, offset);
209 err->length = end - err->offset;
210}
211
Trond Myklebustb819ed42016-01-21 14:48:49 -0500212static int
213ff_ds_error_match(const struct nfs4_ff_layout_ds_err *e1,
214 const struct nfs4_ff_layout_ds_err *e2)
Tom Haynesd67ae822014-12-11 17:02:04 -0500215{
Trond Myklebustb819ed42016-01-21 14:48:49 -0500216 int ret;
217
218 if (e1->opnum != e2->opnum)
219 return e1->opnum < e2->opnum ? -1 : 1;
220 if (e1->status != e2->status)
221 return e1->status < e2->status ? -1 : 1;
Trond Myklebust93b717f2016-05-16 17:42:43 -0400222 ret = memcmp(e1->stateid.data, e2->stateid.data,
223 sizeof(e1->stateid.data));
Trond Myklebustb819ed42016-01-21 14:48:49 -0500224 if (ret != 0)
225 return ret;
226 ret = memcmp(&e1->deviceid, &e2->deviceid, sizeof(e1->deviceid));
227 if (ret != 0)
228 return ret;
Trond Myklebust17822b22016-10-25 12:24:25 -0400229 if (pnfs_end_offset(e1->offset, e1->length) < e2->offset)
Trond Myklebustb819ed42016-01-21 14:48:49 -0500230 return -1;
Trond Myklebust17822b22016-10-25 12:24:25 -0400231 if (e1->offset > pnfs_end_offset(e2->offset, e2->length))
Trond Myklebustb819ed42016-01-21 14:48:49 -0500232 return 1;
233 /* If ranges overlap or are contiguous, they are the same */
234 return 0;
Tom Haynesd67ae822014-12-11 17:02:04 -0500235}
236
Trond Myklebustb819ed42016-01-21 14:48:49 -0500237static void
Tom Haynesd67ae822014-12-11 17:02:04 -0500238ff_layout_add_ds_error_locked(struct nfs4_flexfile_layout *flo,
239 struct nfs4_ff_layout_ds_err *dserr)
240{
Trond Myklebustb819ed42016-01-21 14:48:49 -0500241 struct nfs4_ff_layout_ds_err *err, *tmp;
242 struct list_head *head = &flo->error_list;
243 int match;
Tom Haynesd67ae822014-12-11 17:02:04 -0500244
Trond Myklebustb819ed42016-01-21 14:48:49 -0500245 /* Do insertion sort w/ merges */
246 list_for_each_entry_safe(err, tmp, &flo->error_list, list) {
247 match = ff_ds_error_match(err, dserr);
248 if (match < 0)
249 continue;
250 if (match > 0) {
251 /* Add entry "dserr" _before_ entry "err" */
252 head = &err->list;
Tom Haynesd67ae822014-12-11 17:02:04 -0500253 break;
254 }
Trond Myklebustb819ed42016-01-21 14:48:49 -0500255 /* Entries match, so merge "err" into "dserr" */
256 extend_ds_error(dserr, err->offset, err->length);
Trond Myklebustcb067932016-12-06 12:00:51 -0500257 list_replace(&err->list, &dserr->list);
Trond Myklebustb819ed42016-01-21 14:48:49 -0500258 kfree(err);
Trond Myklebustcb067932016-12-06 12:00:51 -0500259 return;
Tom Haynesd67ae822014-12-11 17:02:04 -0500260 }
261
Trond Myklebustb819ed42016-01-21 14:48:49 -0500262 list_add_tail(&dserr->list, head);
Tom Haynesd67ae822014-12-11 17:02:04 -0500263}
264
265int ff_layout_track_ds_error(struct nfs4_flexfile_layout *flo,
266 struct nfs4_ff_layout_mirror *mirror, u64 offset,
267 u64 length, int status, enum nfs_opnum4 opnum,
268 gfp_t gfp_flags)
269{
270 struct nfs4_ff_layout_ds_err *dserr;
Tom Haynesd67ae822014-12-11 17:02:04 -0500271
272 if (status == 0)
273 return 0;
274
275 if (mirror->mirror_ds == NULL)
276 return -EINVAL;
277
Tom Haynesd67ae822014-12-11 17:02:04 -0500278 dserr = kmalloc(sizeof(*dserr), gfp_flags);
279 if (!dserr)
280 return -ENOMEM;
281
282 INIT_LIST_HEAD(&dserr->list);
283 dserr->offset = offset;
284 dserr->length = length;
285 dserr->status = status;
286 dserr->opnum = opnum;
287 nfs4_stateid_copy(&dserr->stateid, &mirror->stateid);
288 memcpy(&dserr->deviceid, &mirror->mirror_ds->id_node.deviceid,
289 NFS4_DEVICEID4_SIZE);
290
291 spin_lock(&flo->generic_hdr.plh_inode->i_lock);
Trond Myklebustb819ed42016-01-21 14:48:49 -0500292 ff_layout_add_ds_error_locked(flo, dserr);
Tom Haynesd67ae822014-12-11 17:02:04 -0500293 spin_unlock(&flo->generic_hdr.plh_inode->i_lock);
Tom Haynesd67ae822014-12-11 17:02:04 -0500294
295 return 0;
296}
297
Jeff Layton57f3f4c2016-04-21 20:51:58 -0400298static struct rpc_cred *
299ff_layout_get_mirror_cred(struct nfs4_ff_layout_mirror *mirror, u32 iomode)
300{
Jeff Layton3064b682016-04-21 20:52:00 -0400301 struct rpc_cred *cred, __rcu **pcred;
Jeff Layton57f3f4c2016-04-21 20:51:58 -0400302
Jeff Layton3064b682016-04-21 20:52:00 -0400303 if (iomode == IOMODE_READ)
304 pcred = &mirror->ro_cred;
305 else
306 pcred = &mirror->rw_cred;
Jeff Layton57f3f4c2016-04-21 20:51:58 -0400307
308 rcu_read_lock();
309 do {
310 cred = rcu_dereference(*pcred);
311 if (!cred)
312 break;
313
314 cred = get_rpccred_rcu(cred);
315 } while(!cred);
316 rcu_read_unlock();
317 return cred;
318}
319
Tom Haynesd67ae822014-12-11 17:02:04 -0500320struct nfs_fh *
321nfs4_ff_layout_select_ds_fh(struct pnfs_layout_segment *lseg, u32 mirror_idx)
322{
323 struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, mirror_idx);
324 struct nfs_fh *fh = NULL;
Tom Haynesd67ae822014-12-11 17:02:04 -0500325
Trond Myklebust889d94d2015-09-01 00:58:24 -0700326 if (!ff_layout_mirror_valid(lseg, mirror)) {
327 pr_err_ratelimited("NFS: %s: No data server for mirror offset index %d\n",
Tom Haynesd67ae822014-12-11 17:02:04 -0500328 __func__, mirror_idx);
Tom Haynesd67ae822014-12-11 17:02:04 -0500329 goto out;
330 }
331
332 /* FIXME: For now assume there is only 1 version available for the DS */
333 fh = &mirror->fh_versions[0];
334out:
335 return fh;
336}
337
Jeff Layton95e2b7e2016-05-17 12:28:44 -0400338/**
339 * nfs4_ff_layout_prepare_ds - prepare a DS connection for an RPC call
340 * @lseg: the layout segment we're operating on
341 * @ds_idx: index of the DS to use
342 * @fail_return: return layout on connect failure?
343 *
344 * Try to prepare a DS connection to accept an RPC call. This involves
345 * selecting a mirror to use and connecting the client to it if it's not
346 * already connected.
347 *
348 * Since we only need a single functioning mirror to satisfy a read, we don't
349 * want to return the layout if there is one. For writes though, any down
350 * mirror should result in a LAYOUTRETURN. @fail_return is how we distinguish
351 * between the two cases.
352 *
353 * Returns a pointer to a connected DS object on success or NULL on failure.
354 */
Tom Haynesd67ae822014-12-11 17:02:04 -0500355struct nfs4_pnfs_ds *
356nfs4_ff_layout_prepare_ds(struct pnfs_layout_segment *lseg, u32 ds_idx,
357 bool fail_return)
358{
359 struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, ds_idx);
360 struct nfs4_pnfs_ds *ds = NULL;
361 struct nfs4_deviceid_node *devid;
362 struct inode *ino = lseg->pls_layout->plh_inode;
363 struct nfs_server *s = NFS_SERVER(ino);
364 unsigned int max_payload;
Tom Haynesd67ae822014-12-11 17:02:04 -0500365
Trond Myklebust889d94d2015-09-01 00:58:24 -0700366 if (!ff_layout_mirror_valid(lseg, mirror)) {
367 pr_err_ratelimited("NFS: %s: No data server for offset index %d\n",
Tom Haynesd67ae822014-12-11 17:02:04 -0500368 __func__, ds_idx);
Tom Haynesd67ae822014-12-11 17:02:04 -0500369 goto out;
370 }
371
372 devid = &mirror->mirror_ds->id_node;
373 if (ff_layout_test_devid_unavailable(devid))
Trond Myklebust3dc14732016-08-29 15:12:54 -0400374 goto out_fail;
Tom Haynesd67ae822014-12-11 17:02:04 -0500375
376 ds = mirror->mirror_ds->ds;
377 /* matching smp_wmb() in _nfs4_pnfs_v3/4_ds_connect */
378 smp_rmb();
379 if (ds->ds_clp)
Jeff Layton90a0be02016-04-21 20:51:59 -0400380 goto out;
Tom Haynesd67ae822014-12-11 17:02:04 -0500381
382 /* FIXME: For now we assume the server sent only one version of NFS
383 * to use for the DS.
384 */
385 nfs4_pnfs_ds_connect(s, ds, devid, dataserver_timeo,
386 dataserver_retrans,
387 mirror->mirror_ds->ds_versions[0].version,
Anna Schumaker7d38de32016-11-17 15:15:55 -0500388 mirror->mirror_ds->ds_versions[0].minor_version);
Tom Haynesd67ae822014-12-11 17:02:04 -0500389
390 /* connect success, check rsize/wsize limit */
391 if (ds->ds_clp) {
392 max_payload =
393 nfs_block_size(rpc_max_payload(ds->ds_clp->cl_rpcclient),
394 NULL);
395 if (mirror->mirror_ds->ds_versions[0].rsize > max_payload)
396 mirror->mirror_ds->ds_versions[0].rsize = max_payload;
397 if (mirror->mirror_ds->ds_versions[0].wsize > max_payload)
398 mirror->mirror_ds->ds_versions[0].wsize = max_payload;
Trond Myklebust3dc14732016-08-29 15:12:54 -0400399 goto out;
Tom Haynesd67ae822014-12-11 17:02:04 -0500400 }
Trond Myklebust3dc14732016-08-29 15:12:54 -0400401 ff_layout_track_ds_error(FF_LAYOUT_FROM_HDR(lseg->pls_layout),
402 mirror, lseg->pls_range.offset,
403 lseg->pls_range.length, NFS4ERR_NXIO,
404 OP_ILLEGAL, GFP_NOIO);
405out_fail:
406 if (fail_return || !ff_layout_has_available_ds(lseg))
407 pnfs_error_mark_layout_for_return(ino, lseg);
408 ds = NULL;
Tom Haynesd67ae822014-12-11 17:02:04 -0500409out:
410 return ds;
411}
412
413struct rpc_cred *
414ff_layout_get_ds_cred(struct pnfs_layout_segment *lseg, u32 ds_idx,
415 struct rpc_cred *mdscred)
416{
417 struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, ds_idx);
Jeff Layton547a6372016-04-21 20:51:57 -0400418 struct rpc_cred *cred;
Tom Haynesd67ae822014-12-11 17:02:04 -0500419
Jeff Layton57f3f4c2016-04-21 20:51:58 -0400420 if (mirror) {
421 cred = ff_layout_get_mirror_cred(mirror, lseg->pls_range.iomode);
422 if (!cred)
423 cred = get_rpccred(mdscred);
424 } else {
425 cred = get_rpccred(mdscred);
426 }
Tom Haynesd67ae822014-12-11 17:02:04 -0500427 return cred;
428}
429
430/**
431* Find or create a DS rpc client with th MDS server rpc client auth flavor
432* in the nfs_client cl_ds_clients list.
433*/
434struct rpc_clnt *
435nfs4_ff_find_or_create_ds_client(struct pnfs_layout_segment *lseg, u32 ds_idx,
436 struct nfs_client *ds_clp, struct inode *inode)
437{
438 struct nfs4_ff_layout_mirror *mirror = FF_LAYOUT_COMP(lseg, ds_idx);
439
440 switch (mirror->mirror_ds->ds_versions[0].version) {
441 case 3:
442 /* For NFSv3 DS, flavor is set when creating DS connections */
443 return ds_clp->cl_rpcclient;
444 case 4:
445 return nfs4_find_or_create_ds_client(ds_clp, inode);
446 default:
447 BUG();
448 }
449}
450
Trond Myklebust5b9b3c82016-12-02 16:15:05 -0500451void ff_layout_free_ds_ioerr(struct list_head *head)
Tom Haynesd67ae822014-12-11 17:02:04 -0500452{
Trond Myklebust5b9b3c82016-12-02 16:15:05 -0500453 struct nfs4_ff_layout_ds_err *err;
454
455 while (!list_empty(head)) {
456 err = list_first_entry(head,
457 struct nfs4_ff_layout_ds_err,
458 list);
459 list_del(&err->list);
460 kfree(err);
461 }
462}
463
464/* called with inode i_lock held */
465int ff_layout_encode_ds_ioerr(struct xdr_stream *xdr, const struct list_head *head)
466{
467 struct nfs4_ff_layout_ds_err *err;
Tom Haynesd67ae822014-12-11 17:02:04 -0500468 __be32 *p;
469
Trond Myklebust5b9b3c82016-12-02 16:15:05 -0500470 list_for_each_entry(err, head, list) {
Tom Haynesd67ae822014-12-11 17:02:04 -0500471 /* offset(8) + length(8) + stateid(NFS4_STATEID_SIZE)
Trond Myklebustd1354902015-08-27 20:37:39 -0400472 * + array length + deviceid(NFS4_DEVICEID4_SIZE)
473 * + status(4) + opnum(4)
Tom Haynesd67ae822014-12-11 17:02:04 -0500474 */
475 p = xdr_reserve_space(xdr,
Trond Myklebustd1354902015-08-27 20:37:39 -0400476 28 + NFS4_STATEID_SIZE + NFS4_DEVICEID4_SIZE);
Tom Haynesd67ae822014-12-11 17:02:04 -0500477 if (unlikely(!p))
478 return -ENOBUFS;
479 p = xdr_encode_hyper(p, err->offset);
480 p = xdr_encode_hyper(p, err->length);
481 p = xdr_encode_opaque_fixed(p, &err->stateid,
482 NFS4_STATEID_SIZE);
Trond Myklebustd1354902015-08-27 20:37:39 -0400483 /* Encode 1 error */
484 *p++ = cpu_to_be32(1);
Tom Haynesd67ae822014-12-11 17:02:04 -0500485 p = xdr_encode_opaque_fixed(p, &err->deviceid,
486 NFS4_DEVICEID4_SIZE);
487 *p++ = cpu_to_be32(err->status);
488 *p++ = cpu_to_be32(err->opnum);
Trond Myklebust5b9b3c82016-12-02 16:15:05 -0500489 dprintk("%s: offset %llu length %llu status %d op %d\n",
Tom Haynesd67ae822014-12-11 17:02:04 -0500490 __func__, err->offset, err->length, err->status,
Trond Myklebust5b9b3c82016-12-02 16:15:05 -0500491 err->opnum);
Tom Haynesd67ae822014-12-11 17:02:04 -0500492 }
493
494 return 0;
495}
496
Trond Myklebust5b9b3c82016-12-02 16:15:05 -0500497static
498unsigned int do_layout_fetch_ds_ioerr(struct pnfs_layout_hdr *lo,
499 const struct pnfs_layout_range *range,
500 struct list_head *head,
501 unsigned int maxnum)
502{
503 struct nfs4_flexfile_layout *flo = FF_LAYOUT_FROM_HDR(lo);
504 struct inode *inode = lo->plh_inode;
505 struct nfs4_ff_layout_ds_err *err, *n;
506 unsigned int ret = 0;
507
508 spin_lock(&inode->i_lock);
509 list_for_each_entry_safe(err, n, &flo->error_list, list) {
510 if (!pnfs_is_range_intersecting(err->offset,
511 pnfs_end_offset(err->offset, err->length),
512 range->offset,
513 pnfs_end_offset(range->offset, range->length)))
514 continue;
515 if (!maxnum)
516 break;
517 list_move(&err->list, head);
518 maxnum--;
519 ret++;
520 }
521 spin_unlock(&inode->i_lock);
522 return ret;
523}
524
525unsigned int ff_layout_fetch_ds_ioerr(struct pnfs_layout_hdr *lo,
526 const struct pnfs_layout_range *range,
527 struct list_head *head,
528 unsigned int maxnum)
529{
530 unsigned int ret;
531
532 ret = do_layout_fetch_ds_ioerr(lo, range, head, maxnum);
533 /* If we're over the max, discard all remaining entries */
534 if (ret == maxnum) {
535 LIST_HEAD(discard);
536 do_layout_fetch_ds_ioerr(lo, range, &discard, -1);
537 ff_layout_free_ds_ioerr(&discard);
538 }
539 return ret;
540}
541
Trond Myklebust81d6dc82015-09-01 02:49:44 -0700542static bool ff_read_layout_has_available_ds(struct pnfs_layout_segment *lseg)
Tom Haynesd67ae822014-12-11 17:02:04 -0500543{
544 struct nfs4_ff_layout_mirror *mirror;
545 struct nfs4_deviceid_node *devid;
Trond Myklebust81d6dc82015-09-01 02:49:44 -0700546 u32 idx;
Tom Haynesd67ae822014-12-11 17:02:04 -0500547
548 for (idx = 0; idx < FF_LAYOUT_MIRROR_COUNT(lseg); idx++) {
549 mirror = FF_LAYOUT_COMP(lseg, idx);
550 if (mirror && mirror->mirror_ds) {
551 devid = &mirror->mirror_ds->id_node;
552 if (!ff_layout_test_devid_unavailable(devid))
553 return true;
554 }
555 }
556
557 return false;
558}
559
Trond Myklebust81d6dc82015-09-01 02:49:44 -0700560static bool ff_rw_layout_has_available_ds(struct pnfs_layout_segment *lseg)
561{
562 struct nfs4_ff_layout_mirror *mirror;
563 struct nfs4_deviceid_node *devid;
564 u32 idx;
565
566 for (idx = 0; idx < FF_LAYOUT_MIRROR_COUNT(lseg); idx++) {
567 mirror = FF_LAYOUT_COMP(lseg, idx);
568 if (!mirror || !mirror->mirror_ds)
569 return false;
570 devid = &mirror->mirror_ds->id_node;
571 if (ff_layout_test_devid_unavailable(devid))
572 return false;
573 }
574
575 return FF_LAYOUT_MIRROR_COUNT(lseg) != 0;
576}
577
578bool ff_layout_has_available_ds(struct pnfs_layout_segment *lseg)
579{
580 if (lseg->pls_range.iomode == IOMODE_READ)
581 return ff_read_layout_has_available_ds(lseg);
582 /* Note: RW layout needs all mirrors available */
583 return ff_rw_layout_has_available_ds(lseg);
584}
585
Tom Haynes3b13b4b2016-05-17 12:28:37 -0400586bool ff_layout_avoid_mds_available_ds(struct pnfs_layout_segment *lseg)
587{
588 return ff_layout_no_fallback_to_mds(lseg) ||
589 ff_layout_has_available_ds(lseg);
590}
591
Tom Haynesfb1084e2016-05-25 07:31:12 -0700592bool ff_layout_avoid_read_on_rw(struct pnfs_layout_segment *lseg)
593{
594 return lseg->pls_range.iomode == IOMODE_RW &&
595 ff_layout_no_read_on_rw(lseg);
596}
597
Tom Haynesd67ae822014-12-11 17:02:04 -0500598module_param(dataserver_retrans, uint, 0644);
599MODULE_PARM_DESC(dataserver_retrans, "The number of times the NFSv4.1 client "
600 "retries a request before it attempts further "
601 " recovery action.");
602module_param(dataserver_timeo, uint, 0644);
603MODULE_PARM_DESC(dataserver_timeo, "The time (in tenths of a second) the "
604 "NFSv4.1 client waits for a response from a "
605 " data server before it retries an NFS request.");