| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1 | /* | 
|  | 2 | * linux/fs/nfs/direct.c | 
|  | 3 | * | 
|  | 4 | * Copyright (C) 2003 by Chuck Lever <cel@netapp.com> | 
|  | 5 | * | 
|  | 6 | * High-performance uncached I/O for the Linux NFS client | 
|  | 7 | * | 
|  | 8 | * There are important applications whose performance or correctness | 
|  | 9 | * depends on uncached access to file data.  Database clusters | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 10 | * (multiple copies of the same instance running on separate hosts) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 11 | * implement their own cache coherency protocol that subsumes file | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 12 | * system cache protocols.  Applications that process datasets | 
|  | 13 | * considerably larger than the client's memory do not always benefit | 
|  | 14 | * from a local cache.  A streaming video server, for instance, has no | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 15 | * need to cache the contents of a file. | 
|  | 16 | * | 
|  | 17 | * When an application requests uncached I/O, all read and write requests | 
|  | 18 | * are made directly to the server; data stored or fetched via these | 
|  | 19 | * requests is not cached in the Linux page cache.  The client does not | 
|  | 20 | * correct unaligned requests from applications.  All requested bytes are | 
|  | 21 | * held on permanent storage before a direct write system call returns to | 
|  | 22 | * an application. | 
|  | 23 | * | 
|  | 24 | * Solaris implements an uncached I/O facility called directio() that | 
|  | 25 | * is used for backups and sequential I/O to very large files.  Solaris | 
|  | 26 | * also supports uncaching whole NFS partitions with "-o forcedirectio," | 
|  | 27 | * an undocumented mount option. | 
|  | 28 | * | 
|  | 29 | * Designed by Jeff Kimmel, Chuck Lever, and Trond Myklebust, with | 
|  | 30 | * help from Andrew Morton. | 
|  | 31 | * | 
|  | 32 | * 18 Dec 2001	Initial implementation for 2.4  --cel | 
|  | 33 | * 08 Jul 2002	Version for 2.4.19, with bug fixes --trondmy | 
|  | 34 | * 08 Jun 2003	Port to 2.5 APIs  --cel | 
|  | 35 | * 31 Mar 2004	Handle direct I/O without VFS support  --cel | 
|  | 36 | * 15 Sep 2004	Parallel async reads  --cel | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 37 | * 04 May 2005	support O_DIRECT with aio  --cel | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 38 | * | 
|  | 39 | */ | 
|  | 40 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 41 | #include <linux/errno.h> | 
|  | 42 | #include <linux/sched.h> | 
|  | 43 | #include <linux/kernel.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 44 | #include <linux/file.h> | 
|  | 45 | #include <linux/pagemap.h> | 
|  | 46 | #include <linux/kref.h> | 
| Tejun Heo | 5a0e3ad | 2010-03-24 17:04:11 +0900 | [diff] [blame] | 47 | #include <linux/slab.h> | 
| Konstantin Khlebnikov | 7ec10f2 | 2011-02-22 00:28:34 +0300 | [diff] [blame] | 48 | #include <linux/task_io_accounting_ops.h> | 
| Peng Tao | 6296556 | 2012-09-25 14:55:57 +0800 | [diff] [blame] | 49 | #include <linux/module.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 50 |  | 
|  | 51 | #include <linux/nfs_fs.h> | 
|  | 52 | #include <linux/nfs_page.h> | 
|  | 53 | #include <linux/sunrpc/clnt.h> | 
|  | 54 |  | 
| Linus Torvalds | 7c0f6ba | 2016-12-24 11:46:01 -0800 | [diff] [blame] | 55 | #include <linux/uaccess.h> | 
| Arun Sharma | 60063497 | 2011-07-26 16:09:06 -0700 | [diff] [blame] | 56 | #include <linux/atomic.h> | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 57 |  | 
| Trond Myklebust | 8d5658c | 2007-04-10 09:26:35 -0400 | [diff] [blame] | 58 | #include "internal.h" | 
| Chuck Lever | 91d5b47 | 2006-03-20 13:44:14 -0500 | [diff] [blame] | 59 | #include "iostat.h" | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 60 | #include "pnfs.h" | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 61 |  | 
/* Debug facility used by this file's debugging output. */
#define NFSDBG_FACILITY		NFSDBG_VFS

/* Slab cache from which struct nfs_direct_req objects are allocated. */
static struct kmem_cache *nfs_direct_cachep;
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 65 |  | 
/*
 * struct nfs_direct_req (defined below) represents a set of asynchronous
 * requests that we're waiting on.  struct nfs_direct_mirror holds the
 * byte count accumulated for one mirror of such a request.
 */
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 69 | struct nfs_direct_mirror { | 
|  | 70 | ssize_t count; | 
|  | 71 | }; | 
|  | 72 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 73 | struct nfs_direct_req { | 
|  | 74 | struct kref		kref;		/* release manager */ | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 75 |  | 
|  | 76 | /* I/O parameters */ | 
| Trond Myklebust | a8881f5 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 77 | struct nfs_open_context	*ctx;		/* file open context info */ | 
| Trond Myklebust | f11ac8d | 2010-06-25 16:35:53 -0400 | [diff] [blame] | 78 | struct nfs_lock_context *l_ctx;		/* Lock context info */ | 
| Chuck Lever | 99514f8 | 2006-03-20 13:44:30 -0500 | [diff] [blame] | 79 | struct kiocb *		iocb;		/* controlling i/o request */ | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 80 | struct inode *		inode;		/* target file of i/o */ | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 81 |  | 
|  | 82 | /* completion state */ | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 83 | atomic_t		io_count;	/* i/os we're waiting for */ | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 84 | spinlock_t		lock;		/* protect completion state */ | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 85 |  | 
|  | 86 | struct nfs_direct_mirror mirrors[NFS_PAGEIO_DESCRIPTOR_MIRROR_MAX]; | 
|  | 87 | int			mirror_count; | 
|  | 88 |  | 
| Trond Myklebust | d9ee655 | 2018-03-06 12:47:08 -0500 | [diff] [blame] | 89 | loff_t			io_start;	/* Start offset for I/O */ | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 90 | ssize_t			count,		/* bytes actually processed */ | 
| Weston Andros Adamson | ed3743a | 2016-04-01 11:42:29 -0400 | [diff] [blame] | 91 | max_count,	/* max expected count */ | 
| Peng Tao | 35754bc | 2012-09-25 14:55:57 +0800 | [diff] [blame] | 92 | bytes_left,	/* bytes left to be sent */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 93 | error;		/* any reported error */ | 
| Trond Myklebust | d72b7a6 | 2006-03-20 13:44:43 -0500 | [diff] [blame] | 94 | struct completion	completion;	/* wait for i/o completion */ | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 95 |  | 
|  | 96 | /* commit state */ | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 97 | struct nfs_mds_commit_info mds_cinfo;	/* Storage for cinfo */ | 
|  | 98 | struct pnfs_ds_commit_info ds_cinfo;	/* Storage for cinfo */ | 
|  | 99 | struct work_struct	work; | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 100 | int			flags; | 
|  | 101 | #define NFS_ODIRECT_DO_COMMIT		(1)	/* an unstable reply was received */ | 
|  | 102 | #define NFS_ODIRECT_RESCHED_WRITES	(2)	/* write verification failed */ | 
|  | 103 | struct nfs_writeverf	verf;		/* unstable write verifier */ | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 104 | }; | 
|  | 105 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 106 | static const struct nfs_pgio_completion_ops nfs_direct_write_completion_ops; | 
|  | 107 | static const struct nfs_commit_completion_ops nfs_direct_commit_completion_ops; | 
| Anna Schumaker | 4d3b55d | 2016-11-23 13:49:38 -0500 | [diff] [blame] | 108 | static void nfs_direct_write_complete(struct nfs_direct_req *dreq); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 109 | static void nfs_direct_write_schedule_work(struct work_struct *work); | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 110 |  | 
|  | 111 | static inline void get_dreq(struct nfs_direct_req *dreq) | 
|  | 112 | { | 
|  | 113 | atomic_inc(&dreq->io_count); | 
|  | 114 | } | 
|  | 115 |  | 
|  | 116 | static inline int put_dreq(struct nfs_direct_req *dreq) | 
|  | 117 | { | 
|  | 118 | return atomic_dec_and_test(&dreq->io_count); | 
|  | 119 | } | 
|  | 120 |  | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 121 | static void | 
|  | 122 | nfs_direct_good_bytes(struct nfs_direct_req *dreq, struct nfs_pgio_header *hdr) | 
|  | 123 | { | 
|  | 124 | int i; | 
|  | 125 | ssize_t count; | 
|  | 126 |  | 
| Weston Andros Adamson | ed3743a | 2016-04-01 11:42:29 -0400 | [diff] [blame] | 127 | WARN_ON_ONCE(dreq->count >= dreq->max_count); | 
|  | 128 |  | 
| Peng Tao | 1ccbad9 | 2015-04-09 23:02:16 +0800 | [diff] [blame] | 129 | if (dreq->mirror_count == 1) { | 
|  | 130 | dreq->mirrors[hdr->pgio_mirror_idx].count += hdr->good_bytes; | 
|  | 131 | dreq->count += hdr->good_bytes; | 
|  | 132 | } else { | 
|  | 133 | /* mirrored writes */ | 
|  | 134 | count = dreq->mirrors[hdr->pgio_mirror_idx].count; | 
|  | 135 | if (count + dreq->io_start < hdr->io_start + hdr->good_bytes) { | 
|  | 136 | count = hdr->io_start + hdr->good_bytes - dreq->io_start; | 
|  | 137 | dreq->mirrors[hdr->pgio_mirror_idx].count = count; | 
|  | 138 | } | 
|  | 139 | /* update the dreq->count by finding the minimum agreed count from all | 
|  | 140 | * mirrors */ | 
|  | 141 | count = dreq->mirrors[0].count; | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 142 |  | 
| Peng Tao | 1ccbad9 | 2015-04-09 23:02:16 +0800 | [diff] [blame] | 143 | for (i = 1; i < dreq->mirror_count; i++) | 
|  | 144 | count = min(count, dreq->mirrors[i].count); | 
|  | 145 |  | 
|  | 146 | dreq->count = count; | 
| Peng Tao | 5fadeb4 | 2015-01-19 12:41:16 +0800 | [diff] [blame] | 147 | } | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 148 | } | 
|  | 149 |  | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 150 | /* | 
|  | 151 | * nfs_direct_select_verf - select the right verifier | 
|  | 152 | * @dreq - direct request possibly spanning multiple servers | 
|  | 153 | * @ds_clp - nfs_client of data server or NULL if MDS / non-pnfs | 
| Weston Andros Adamson | 6cccbb6 | 2014-09-16 17:35:51 -0400 | [diff] [blame] | 154 | * @commit_idx - commit bucket index for the DS | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 155 | * | 
|  | 156 | * returns the correct verifier to use given the role of the server | 
|  | 157 | */ | 
|  | 158 | static struct nfs_writeverf * | 
|  | 159 | nfs_direct_select_verf(struct nfs_direct_req *dreq, | 
|  | 160 | struct nfs_client *ds_clp, | 
| Weston Andros Adamson | 6cccbb6 | 2014-09-16 17:35:51 -0400 | [diff] [blame] | 161 | int commit_idx) | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 162 | { | 
|  | 163 | struct nfs_writeverf *verfp = &dreq->verf; | 
|  | 164 |  | 
|  | 165 | #ifdef CONFIG_NFS_V4_1 | 
| Kinglong Mee | 834e465 | 2015-09-22 06:54:47 +0800 | [diff] [blame] | 166 | /* | 
|  | 167 | * pNFS is in use, use the DS verf except commit_through_mds is set | 
|  | 168 | * for layout segment where nbuckets is zero. | 
|  | 169 | */ | 
|  | 170 | if (ds_clp && dreq->ds_cinfo.nbuckets > 0) { | 
| Weston Andros Adamson | 6cccbb6 | 2014-09-16 17:35:51 -0400 | [diff] [blame] | 171 | if (commit_idx >= 0 && commit_idx < dreq->ds_cinfo.nbuckets) | 
|  | 172 | verfp = &dreq->ds_cinfo.buckets[commit_idx].direct_verf; | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 173 | else | 
|  | 174 | WARN_ON_ONCE(1); | 
|  | 175 | } | 
|  | 176 | #endif | 
|  | 177 | return verfp; | 
|  | 178 | } | 
|  | 179 |  | 
|  | 180 |  | 
|  | 181 | /* | 
|  | 182 | * nfs_direct_set_hdr_verf - set the write/commit verifier | 
|  | 183 | * @dreq - direct request possibly spanning multiple servers | 
|  | 184 | * @hdr - pageio header to validate against previously seen verfs | 
|  | 185 | * | 
|  | 186 | * Set the server's (MDS or DS) "seen" verifier | 
|  | 187 | */ | 
|  | 188 | static void nfs_direct_set_hdr_verf(struct nfs_direct_req *dreq, | 
|  | 189 | struct nfs_pgio_header *hdr) | 
|  | 190 | { | 
|  | 191 | struct nfs_writeverf *verfp; | 
|  | 192 |  | 
| Weston Andros Adamson | 6cccbb6 | 2014-09-16 17:35:51 -0400 | [diff] [blame] | 193 | verfp = nfs_direct_select_verf(dreq, hdr->ds_clp, hdr->ds_commit_idx); | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 194 | WARN_ON_ONCE(verfp->committed >= 0); | 
|  | 195 | memcpy(verfp, &hdr->verf, sizeof(struct nfs_writeverf)); | 
|  | 196 | WARN_ON_ONCE(verfp->committed < 0); | 
|  | 197 | } | 
|  | 198 |  | 
| Trond Myklebust | 8fc3c38 | 2016-06-01 21:32:24 -0400 | [diff] [blame] | 199 | static int nfs_direct_cmp_verf(const struct nfs_writeverf *v1, | 
|  | 200 | const struct nfs_writeverf *v2) | 
|  | 201 | { | 
|  | 202 | return nfs_write_verifier_cmp(&v1->verifier, &v2->verifier); | 
|  | 203 | } | 
|  | 204 |  | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 205 | /* | 
|  | 206 | * nfs_direct_cmp_hdr_verf - compare verifier for pgio header | 
|  | 207 | * @dreq - direct request possibly spanning multiple servers | 
|  | 208 | * @hdr - pageio header to validate against previously seen verf | 
|  | 209 | * | 
|  | 210 | * set the server's "seen" verf if not initialized. | 
|  | 211 | * returns result of comparison between @hdr->verf and the "seen" | 
|  | 212 | * verf of the server used by @hdr (DS or MDS) | 
|  | 213 | */ | 
|  | 214 | static int nfs_direct_set_or_cmp_hdr_verf(struct nfs_direct_req *dreq, | 
|  | 215 | struct nfs_pgio_header *hdr) | 
|  | 216 | { | 
|  | 217 | struct nfs_writeverf *verfp; | 
|  | 218 |  | 
| Weston Andros Adamson | 6cccbb6 | 2014-09-16 17:35:51 -0400 | [diff] [blame] | 219 | verfp = nfs_direct_select_verf(dreq, hdr->ds_clp, hdr->ds_commit_idx); | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 220 | if (verfp->committed < 0) { | 
|  | 221 | nfs_direct_set_hdr_verf(dreq, hdr); | 
|  | 222 | return 0; | 
|  | 223 | } | 
| Trond Myklebust | 8fc3c38 | 2016-06-01 21:32:24 -0400 | [diff] [blame] | 224 | return nfs_direct_cmp_verf(verfp, &hdr->verf); | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 225 | } | 
|  | 226 |  | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 227 | /* | 
|  | 228 | * nfs_direct_cmp_commit_data_verf - compare verifier for commit data | 
|  | 229 | * @dreq - direct request possibly spanning multiple servers | 
|  | 230 | * @data - commit data to validate against previously seen verf | 
|  | 231 | * | 
|  | 232 | * returns result of comparison between @data->verf and the verf of | 
|  | 233 | * the server used by @data (DS or MDS) | 
|  | 234 | */ | 
|  | 235 | static int nfs_direct_cmp_commit_data_verf(struct nfs_direct_req *dreq, | 
|  | 236 | struct nfs_commit_data *data) | 
|  | 237 | { | 
|  | 238 | struct nfs_writeverf *verfp; | 
|  | 239 |  | 
|  | 240 | verfp = nfs_direct_select_verf(dreq, data->ds_clp, | 
|  | 241 | data->ds_commit_index); | 
| Weston Andros Adamson | 80c76fe | 2014-10-01 12:58:25 -0400 | [diff] [blame] | 242 |  | 
|  | 243 | /* verifier not set so always fail */ | 
|  | 244 | if (verfp->committed < 0) | 
|  | 245 | return 1; | 
|  | 246 |  | 
| Trond Myklebust | 8fc3c38 | 2016-06-01 21:32:24 -0400 | [diff] [blame] | 247 | return nfs_direct_cmp_verf(verfp, &data->verf); | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 248 | } | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 249 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 250 | /** | 
| Chuck Lever | b8a32e2 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 251 | * nfs_direct_IO - NFS address space operation for direct I/O | 
| Chuck Lever | b8a32e2 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 252 | * @iocb: target I/O control block | 
| Al Viro | 90090ae | 2016-05-29 19:05:03 -0400 | [diff] [blame] | 253 | * @iter: I/O buffer | 
| Chuck Lever | b8a32e2 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 254 | * | 
|  | 255 | * The presence of this routine in the address space ops vector means | 
| Mel Gorman | a564b8f | 2012-07-31 16:45:12 -0700 | [diff] [blame] | 256 | * the NFS client supports direct I/O. However, for most direct IO, we | 
|  | 257 | * shunt off direct read and write requests before the VFS gets them, | 
|  | 258 | * so this method is only ever called for swap. | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 259 | */ | 
| Christoph Hellwig | c8b8e32 | 2016-04-07 08:51:58 -0700 | [diff] [blame] | 260 | ssize_t nfs_direct_IO(struct kiocb *iocb, struct iov_iter *iter) | 
| Chuck Lever | b8a32e2 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 261 | { | 
| Peng Tao | ee8a1a8 | 2015-01-20 07:44:29 +0800 | [diff] [blame] | 262 | struct inode *inode = iocb->ki_filp->f_mapping->host; | 
|  | 263 |  | 
|  | 264 | /* we only support swap file calling nfs_direct_IO */ | 
|  | 265 | if (!IS_SWAPFILE(inode)) | 
|  | 266 | return 0; | 
|  | 267 |  | 
| Christoph Hellwig | 66ee59a | 2015-02-11 19:56:46 +0100 | [diff] [blame] | 268 | VM_BUG_ON(iov_iter_count(iter) != PAGE_SIZE); | 
| Mel Gorman | a564b8f | 2012-07-31 16:45:12 -0700 | [diff] [blame] | 269 |  | 
| Omar Sandoval | 6f67376 | 2015-03-16 04:33:52 -0700 | [diff] [blame] | 270 | if (iov_iter_rw(iter) == READ) | 
| Christoph Hellwig | c8b8e32 | 2016-04-07 08:51:58 -0700 | [diff] [blame] | 271 | return nfs_file_direct_read(iocb, iter); | 
| Al Viro | 65a4a1c | 2015-04-09 14:11:08 -0400 | [diff] [blame] | 272 | return nfs_file_direct_write(iocb, iter); | 
| Chuck Lever | b8a32e2 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 273 | } | 
|  | 274 |  | 
/* Drop one reference on each of the first @npages entries of @pages. */
static void nfs_direct_release_pages(struct page **pages, unsigned int npages)
{
	unsigned int idx = 0;

	while (idx < npages) {
		put_page(pages[idx]);
		idx++;
	}
}
|  | 281 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 282 | void nfs_init_cinfo_from_dreq(struct nfs_commit_info *cinfo, | 
|  | 283 | struct nfs_direct_req *dreq) | 
|  | 284 | { | 
| Dave Wysochanski | fe238e6 | 2016-04-01 13:45:09 -0400 | [diff] [blame] | 285 | cinfo->inode = dreq->inode; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 286 | cinfo->mds = &dreq->mds_cinfo; | 
|  | 287 | cinfo->ds = &dreq->ds_cinfo; | 
|  | 288 | cinfo->dreq = dreq; | 
|  | 289 | cinfo->completion_ops = &nfs_direct_commit_completion_ops; | 
|  | 290 | } | 
|  | 291 |  | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 292 | static inline void nfs_direct_setup_mirroring(struct nfs_direct_req *dreq, | 
|  | 293 | struct nfs_pageio_descriptor *pgio, | 
|  | 294 | struct nfs_page *req) | 
|  | 295 | { | 
|  | 296 | int mirror_count = 1; | 
|  | 297 |  | 
|  | 298 | if (pgio->pg_ops->pg_get_mirror_count) | 
|  | 299 | mirror_count = pgio->pg_ops->pg_get_mirror_count(pgio, req); | 
|  | 300 |  | 
|  | 301 | dreq->mirror_count = mirror_count; | 
|  | 302 | } | 
|  | 303 |  | 
| Chuck Lever | 93619e5 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 304 | static inline struct nfs_direct_req *nfs_direct_req_alloc(void) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 305 | { | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 306 | struct nfs_direct_req *dreq; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 307 |  | 
| Trond Myklebust | 292f3ee | 2012-04-30 18:31:49 -0400 | [diff] [blame] | 308 | dreq = kmem_cache_zalloc(nfs_direct_cachep, GFP_KERNEL); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 309 | if (!dreq) | 
|  | 310 | return NULL; | 
|  | 311 |  | 
|  | 312 | kref_init(&dreq->kref); | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 313 | kref_get(&dreq->kref); | 
| Trond Myklebust | d72b7a6 | 2006-03-20 13:44:43 -0500 | [diff] [blame] | 314 | init_completion(&dreq->completion); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 315 | INIT_LIST_HEAD(&dreq->mds_cinfo.list); | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 316 | dreq->verf.committed = NFS_INVALID_STABLE_HOW;	/* not set yet */ | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 317 | INIT_WORK(&dreq->work, nfs_direct_write_schedule_work); | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 318 | dreq->mirror_count = 1; | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 319 | spin_lock_init(&dreq->lock); | 
| Chuck Lever | 93619e5 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 320 |  | 
|  | 321 | return dreq; | 
|  | 322 | } | 
|  | 323 |  | 
| Trond Myklebust | b4946ff | 2007-05-30 12:58:00 -0400 | [diff] [blame] | 324 | static void nfs_direct_req_free(struct kref *kref) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 325 | { | 
|  | 326 | struct nfs_direct_req *dreq = container_of(kref, struct nfs_direct_req, kref); | 
| Trond Myklebust | a8881f5 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 327 |  | 
| Peng Tao | 8c393f9 | 2014-11-05 22:36:50 +0800 | [diff] [blame] | 328 | nfs_free_pnfs_ds_cinfo(&dreq->ds_cinfo); | 
| Trond Myklebust | f11ac8d | 2010-06-25 16:35:53 -0400 | [diff] [blame] | 329 | if (dreq->l_ctx != NULL) | 
|  | 330 | nfs_put_lock_context(dreq->l_ctx); | 
| Trond Myklebust | a8881f5 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 331 | if (dreq->ctx != NULL) | 
|  | 332 | put_nfs_open_context(dreq->ctx); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 333 | kmem_cache_free(nfs_direct_cachep, dreq); | 
|  | 334 | } | 
|  | 335 |  | 
| Trond Myklebust | b4946ff | 2007-05-30 12:58:00 -0400 | [diff] [blame] | 336 | static void nfs_direct_req_release(struct nfs_direct_req *dreq) | 
|  | 337 | { | 
|  | 338 | kref_put(&dreq->kref, nfs_direct_req_free); | 
|  | 339 | } | 
|  | 340 |  | 
| Peng Tao | 6296556 | 2012-09-25 14:55:57 +0800 | [diff] [blame] | 341 | ssize_t nfs_dreq_bytes_left(struct nfs_direct_req *dreq) | 
|  | 342 | { | 
|  | 343 | return dreq->bytes_left; | 
|  | 344 | } | 
|  | 345 | EXPORT_SYMBOL_GPL(nfs_dreq_bytes_left); | 
|  | 346 |  | 
| Chuck Lever | d4cc948 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 347 | /* | 
| Chuck Lever | bc0fb20 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 348 | * Collects and returns the final error value/byte-count. | 
|  | 349 | */ | 
|  | 350 | static ssize_t nfs_direct_wait(struct nfs_direct_req *dreq) | 
|  | 351 | { | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 352 | ssize_t result = -EIOCBQUEUED; | 
| Chuck Lever | bc0fb20 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 353 |  | 
|  | 354 | /* Async requests don't wait here */ | 
|  | 355 | if (dreq->iocb) | 
|  | 356 | goto out; | 
|  | 357 |  | 
| Matthew Wilcox | 150030b | 2007-12-06 16:24:39 -0500 | [diff] [blame] | 358 | result = wait_for_completion_killable(&dreq->completion); | 
| Chuck Lever | bc0fb20 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 359 |  | 
| Trond Myklebust | d2a7de0 | 2016-06-17 16:48:22 -0400 | [diff] [blame] | 360 | if (!result) { | 
|  | 361 | result = dreq->count; | 
|  | 362 | WARN_ON_ONCE(dreq->count < 0); | 
|  | 363 | } | 
| Chuck Lever | bc0fb20 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 364 | if (!result) | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 365 | result = dreq->error; | 
| Chuck Lever | bc0fb20 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 366 |  | 
|  | 367 | out: | 
| Chuck Lever | bc0fb20 | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 368 | return (ssize_t) result; | 
|  | 369 | } | 
|  | 370 |  | 
|  | 371 | /* | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 372 | * Synchronous I/O uses a stack-allocated iocb.  Thus we can't trust | 
|  | 373 | * the iocb is still valid here if this is a synchronous request. | 
| Chuck Lever | 63ab46a | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 374 | */ | 
| Trond Myklebust | f7b5c34 | 2016-06-23 09:29:47 -0400 | [diff] [blame] | 375 | static void nfs_direct_complete(struct nfs_direct_req *dreq) | 
| Chuck Lever | 63ab46a | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 376 | { | 
| Christoph Hellwig | 9811cd5 | 2013-11-14 08:50:28 -0800 | [diff] [blame] | 377 | struct inode *inode = dreq->inode; | 
|  | 378 |  | 
| Jens Axboe | fe0f07d | 2015-04-15 17:05:48 -0600 | [diff] [blame] | 379 | inode_dio_end(inode); | 
| Christoph Hellwig | 2a009ec | 2013-11-14 08:50:29 -0800 | [diff] [blame] | 380 |  | 
|  | 381 | if (dreq->iocb) { | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 382 | long res = (long) dreq->error; | 
| Trond Myklebust | d2a7de0 | 2016-06-17 16:48:22 -0400 | [diff] [blame] | 383 | if (dreq->count != 0) { | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 384 | res = (long) dreq->count; | 
| Trond Myklebust | d2a7de0 | 2016-06-17 16:48:22 -0400 | [diff] [blame] | 385 | WARN_ON_ONCE(dreq->count < 0); | 
|  | 386 | } | 
| Christoph Hellwig | 04b2fa9 | 2015-02-02 14:49:06 +0100 | [diff] [blame] | 387 | dreq->iocb->ki_complete(dreq->iocb, res, 0); | 
| Trond Myklebust | d72b7a6 | 2006-03-20 13:44:43 -0500 | [diff] [blame] | 388 | } | 
| Christoph Hellwig | 2a009ec | 2013-11-14 08:50:29 -0800 | [diff] [blame] | 389 |  | 
| Daniel Wagner | 024de8f | 2016-09-22 13:54:28 +0200 | [diff] [blame] | 390 | complete(&dreq->completion); | 
| Chuck Lever | 63ab46a | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 391 |  | 
| Trond Myklebust | b4946ff | 2007-05-30 12:58:00 -0400 | [diff] [blame] | 392 | nfs_direct_req_release(dreq); | 
| Chuck Lever | 63ab46a | 2006-03-20 13:44:31 -0500 | [diff] [blame] | 393 | } | 
|  | 394 |  | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 395 | static void nfs_direct_read_completion(struct nfs_pgio_header *hdr) | 
| Trond Myklebust | fdd1e74 | 2008-04-15 16:33:58 -0400 | [diff] [blame] | 396 | { | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 397 | unsigned long bytes = 0; | 
|  | 398 | struct nfs_direct_req *dreq = hdr->dreq; | 
| Trond Myklebust | fdd1e74 | 2008-04-15 16:33:58 -0400 | [diff] [blame] | 399 |  | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 400 | if (test_bit(NFS_IOHDR_REDO, &hdr->flags)) | 
|  | 401 | goto out_put; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 402 |  | 
| Chuck Lever | 15ce4a0 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 403 | spin_lock(&dreq->lock); | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 404 | if (test_bit(NFS_IOHDR_ERROR, &hdr->flags) && (hdr->good_bytes == 0)) | 
|  | 405 | dreq->error = hdr->error; | 
|  | 406 | else | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 407 | nfs_direct_good_bytes(dreq, hdr); | 
|  | 408 |  | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 409 | spin_unlock(&dreq->lock); | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 410 |  | 
| Trond Myklebust | 4bd8b01 | 2012-05-01 12:49:58 -0400 | [diff] [blame] | 411 | while (!list_empty(&hdr->pages)) { | 
|  | 412 | struct nfs_page *req = nfs_list_entry(hdr->pages.next); | 
|  | 413 | struct page *page = req->wb_page; | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 414 |  | 
| Jeff Layton | be7e985 | 2012-12-12 12:36:31 -0500 | [diff] [blame] | 415 | if (!PageCompound(page) && bytes < hdr->good_bytes) | 
|  | 416 | set_page_dirty(page); | 
| Trond Myklebust | 4bd8b01 | 2012-05-01 12:49:58 -0400 | [diff] [blame] | 417 | bytes += req->wb_bytes; | 
|  | 418 | nfs_list_remove_request(req); | 
| Anna Schumaker | beeb533 | 2017-04-07 14:15:07 -0400 | [diff] [blame] | 419 | nfs_release_request(req); | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 420 | } | 
|  | 421 | out_put: | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 422 | if (put_dreq(dreq)) | 
| Trond Myklebust | f7b5c34 | 2016-06-23 09:29:47 -0400 | [diff] [blame] | 423 | nfs_direct_complete(dreq); | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 424 | hdr->release(hdr); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 425 | } | 
|  | 426 |  | 
| Trond Myklebust | 3e9e0ca3 | 2012-04-30 13:40:06 -0400 | [diff] [blame] | 427 | static void nfs_read_sync_pgio_error(struct list_head *head) | 
| Fred Isaman | cd84160 | 2012-04-20 14:47:44 -0400 | [diff] [blame] | 428 | { | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 429 | struct nfs_page *req; | 
| Fred Isaman | cd84160 | 2012-04-20 14:47:44 -0400 | [diff] [blame] | 430 |  | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 431 | while (!list_empty(head)) { | 
|  | 432 | req = nfs_list_entry(head->next); | 
|  | 433 | nfs_list_remove_request(req); | 
|  | 434 | nfs_release_request(req); | 
|  | 435 | } | 
| Fred Isaman | cd84160 | 2012-04-20 14:47:44 -0400 | [diff] [blame] | 436 | } | 
|  | 437 |  | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 438 | static void nfs_direct_pgio_init(struct nfs_pgio_header *hdr) | 
|  | 439 | { | 
|  | 440 | get_dreq(hdr->dreq); | 
|  | 441 | } | 
|  | 442 |  | 
|  | 443 | static const struct nfs_pgio_completion_ops nfs_direct_read_completion_ops = { | 
| Trond Myklebust | 3e9e0ca3 | 2012-04-30 13:40:06 -0400 | [diff] [blame] | 444 | .error_cleanup = nfs_read_sync_pgio_error, | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 445 | .init_hdr = nfs_direct_pgio_init, | 
|  | 446 | .completion = nfs_direct_read_completion, | 
|  | 447 | }; | 
|  | 448 |  | 
| Chuck Lever | d4cc948 | 2006-03-20 13:44:28 -0500 | [diff] [blame] | 449 | /* | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 450 | * For each rsize'd chunk of the user's buffer, dispatch an NFS READ | 
|  | 451 | * operation.  If nfs_readdata_alloc() or get_user_pages() fails, | 
|  | 452 | * bail and stop sending more reads.  Read length accounting is | 
|  | 453 | * handled automatically by nfs_direct_read_result().  Otherwise, if | 
|  | 454 | * no requests have been sent, just return an error. | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 455 | */ | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 456 |  | 
|  | 457 | static ssize_t nfs_direct_read_schedule_iovec(struct nfs_direct_req *dreq, | 
|  | 458 | struct iov_iter *iter, | 
|  | 459 | loff_t pos) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 460 | { | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 461 | struct nfs_pageio_descriptor desc; | 
|  | 462 | struct inode *inode = dreq->inode; | 
|  | 463 | ssize_t result = -EINVAL; | 
|  | 464 | size_t requested_bytes = 0; | 
|  | 465 | size_t rsize = max_t(size_t, NFS_SERVER(inode)->rsize, PAGE_SIZE); | 
| Chuck Lever | 82b145c | 2006-06-20 12:57:03 -0400 | [diff] [blame] | 466 |  | 
| Linus Torvalds | 16b9057 | 2014-06-12 10:30:18 -0700 | [diff] [blame] | 467 | nfs_pageio_init_read(&desc, dreq->inode, false, | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 468 | &nfs_direct_read_completion_ops); | 
|  | 469 | get_dreq(dreq); | 
|  | 470 | desc.pg_dreq = dreq; | 
| Jens Axboe | fe0f07d | 2015-04-15 17:05:48 -0600 | [diff] [blame] | 471 | inode_dio_begin(inode); | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 472 |  | 
|  | 473 | while (iov_iter_count(iter)) { | 
|  | 474 | struct page **pagevec; | 
| Chuck Lever | 5dd602f | 2006-03-20 13:44:29 -0500 | [diff] [blame] | 475 | size_t bytes; | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 476 | size_t pgbase; | 
|  | 477 | unsigned npages, i; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 478 |  | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 479 | result = iov_iter_get_pages_alloc(iter, &pagevec, | 
|  | 480 | rsize, &pgbase); | 
|  | 481 | if (result < 0) | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 482 | break; | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 483 |  | 
|  | 484 | bytes = result; | 
|  | 485 | iov_iter_advance(iter, bytes); | 
|  | 486 | npages = (result + pgbase + PAGE_SIZE - 1) / PAGE_SIZE; | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 487 | for (i = 0; i < npages; i++) { | 
|  | 488 | struct nfs_page *req; | 
| Trond Myklebust | bf5fc40 | 2012-05-04 13:47:16 -0400 | [diff] [blame] | 489 | unsigned int req_len = min_t(size_t, bytes, PAGE_SIZE - pgbase); | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 490 | /* XXX do we need to do the eof zeroing found in async_filler? */ | 
| Weston Andros Adamson | 2bfc6e5 | 2014-05-15 11:56:45 -0400 | [diff] [blame] | 491 | req = nfs_create_request(dreq->ctx, pagevec[i], NULL, | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 492 | pgbase, req_len); | 
|  | 493 | if (IS_ERR(req)) { | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 494 | result = PTR_ERR(req); | 
|  | 495 | break; | 
|  | 496 | } | 
|  | 497 | req->wb_index = pos >> PAGE_SHIFT; | 
|  | 498 | req->wb_offset = pos & ~PAGE_MASK; | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 499 | if (!nfs_pageio_add_request(&desc, req)) { | 
|  | 500 | result = desc.pg_error; | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 501 | nfs_release_request(req); | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 502 | break; | 
|  | 503 | } | 
|  | 504 | pgbase = 0; | 
|  | 505 | bytes -= req_len; | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 506 | requested_bytes += req_len; | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 507 | pos += req_len; | 
| Peng Tao | 35754bc | 2012-09-25 14:55:57 +0800 | [diff] [blame] | 508 | dreq->bytes_left -= req_len; | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 509 | } | 
| Trond Myklebust | 6d74743 | 2012-04-30 13:27:31 -0400 | [diff] [blame] | 510 | nfs_direct_release_pages(pagevec, npages); | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 511 | kvfree(pagevec); | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 512 | if (result < 0) | 
|  | 513 | break; | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 514 | } | 
|  | 515 |  | 
| Fred Isaman | 584aa81 | 2012-04-20 14:47:51 -0400 | [diff] [blame] | 516 | nfs_pageio_complete(&desc); | 
|  | 517 |  | 
| Chuck Lever | 839f7ad | 2011-01-21 15:54:57 +0000 | [diff] [blame] | 518 | /* | 
|  | 519 | * If no bytes were started, return the error, and let the | 
|  | 520 | * generic layer handle the completion. | 
|  | 521 | */ | 
|  | 522 | if (requested_bytes == 0) { | 
| Jens Axboe | fe0f07d | 2015-04-15 17:05:48 -0600 | [diff] [blame] | 523 | inode_dio_end(inode); | 
| Chuck Lever | 839f7ad | 2011-01-21 15:54:57 +0000 | [diff] [blame] | 524 | nfs_direct_req_release(dreq); | 
|  | 525 | return result < 0 ? result : -EIO; | 
|  | 526 | } | 
|  | 527 |  | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 528 | if (put_dreq(dreq)) | 
| Trond Myklebust | f7b5c34 | 2016-06-23 09:29:47 -0400 | [diff] [blame] | 529 | nfs_direct_complete(dreq); | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 530 | return requested_bytes; | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 531 | } | 
|  | 532 |  | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 533 | /** | 
|  | 534 | * nfs_file_direct_read - file direct read operation for NFS files | 
|  | 535 | * @iocb: target I/O control block | 
| Al Viro | 619d30b | 2014-03-04 21:53:33 -0500 | [diff] [blame] | 536 | * @iter: vector of user buffers into which to read data | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 537 | * | 
|  | 538 | * We use this function for direct reads instead of calling | 
|  | 539 | * generic_file_aio_read() in order to avoid gfar's check to see if | 
|  | 540 | * the request starts before the end of the file.  For that check | 
|  | 541 | * to work, we must generate a GETATTR before each direct read, and | 
|  | 542 | * even then there is a window between the GETATTR and the subsequent | 
|  | 543 | * READ where the file size could change.  Our preference is simply | 
|  | 544 | * to do all reads the application wants, and the server will take | 
|  | 545 | * care of managing the end of file boundary. | 
|  | 546 | * | 
|  | 547 | * This function also eliminates unnecessarily updating the file's | 
|  | 548 | * atime locally, as the NFS server sets the file's atime, and this | 
|  | 549 | * client must read the updated atime from the server back into its | 
|  | 550 | * cache. | 
|  | 551 | */ | 
| Christoph Hellwig | c8b8e32 | 2016-04-07 08:51:58 -0700 | [diff] [blame] | 552 | ssize_t nfs_file_direct_read(struct kiocb *iocb, struct iov_iter *iter) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 553 | { | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 554 | struct file *file = iocb->ki_filp; | 
|  | 555 | struct address_space *mapping = file->f_mapping; | 
|  | 556 | struct inode *inode = mapping->host; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 557 | struct nfs_direct_req *dreq; | 
| Trond Myklebust | b3c54de | 2012-08-13 17:15:50 -0400 | [diff] [blame] | 558 | struct nfs_lock_context *l_ctx; | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 559 | ssize_t result = -EINVAL, requested; | 
| Al Viro | a6cbcd4 | 2014-03-04 22:38:00 -0500 | [diff] [blame] | 560 | size_t count = iov_iter_count(iter); | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 561 | nfs_add_stats(mapping->host, NFSIOS_DIRECTREADBYTES, count); | 
|  | 562 |  | 
|  | 563 | dfprintk(FILE, "NFS: direct read(%pD2, %zd@%Ld)\n", | 
| Christoph Hellwig | c8b8e32 | 2016-04-07 08:51:58 -0700 | [diff] [blame] | 564 | file, count, (long long) iocb->ki_pos); | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 565 |  | 
|  | 566 | result = 0; | 
|  | 567 | if (!count) | 
|  | 568 | goto out; | 
|  | 569 |  | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 570 | task_io_account_read(count); | 
|  | 571 |  | 
|  | 572 | result = -ENOMEM; | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 573 | dreq = nfs_direct_req_alloc(); | 
| Trond Myklebust | f11ac8d | 2010-06-25 16:35:53 -0400 | [diff] [blame] | 574 | if (dreq == NULL) | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 575 | goto out; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 576 |  | 
| Chuck Lever | 91d5b47 | 2006-03-20 13:44:14 -0500 | [diff] [blame] | 577 | dreq->inode = inode; | 
| Weston Andros Adamson | ed3743a | 2016-04-01 11:42:29 -0400 | [diff] [blame] | 578 | dreq->bytes_left = dreq->max_count = count; | 
| Christoph Hellwig | c8b8e32 | 2016-04-07 08:51:58 -0700 | [diff] [blame] | 579 | dreq->io_start = iocb->ki_pos; | 
| Trond Myklebust | cd3758e | 2007-08-10 17:44:32 -0400 | [diff] [blame] | 580 | dreq->ctx = get_nfs_open_context(nfs_file_open_context(iocb->ki_filp)); | 
| Trond Myklebust | b3c54de | 2012-08-13 17:15:50 -0400 | [diff] [blame] | 581 | l_ctx = nfs_get_lock_context(dreq->ctx); | 
|  | 582 | if (IS_ERR(l_ctx)) { | 
|  | 583 | result = PTR_ERR(l_ctx); | 
| Trond Myklebust | f11ac8d | 2010-06-25 16:35:53 -0400 | [diff] [blame] | 584 | goto out_release; | 
| Trond Myklebust | b3c54de | 2012-08-13 17:15:50 -0400 | [diff] [blame] | 585 | } | 
|  | 586 | dreq->l_ctx = l_ctx; | 
| Chuck Lever | 487b837 | 2006-03-20 13:44:30 -0500 | [diff] [blame] | 587 | if (!is_sync_kiocb(iocb)) | 
|  | 588 | dreq->iocb = iocb; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 589 |  | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 590 | nfs_start_io_direct(inode); | 
|  | 591 |  | 
| Al Viro | 619d30b | 2014-03-04 21:53:33 -0500 | [diff] [blame] | 592 | NFS_I(inode)->read_io += count; | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 593 | requested = nfs_direct_read_schedule_iovec(dreq, iter, iocb->ki_pos); | 
| Christoph Hellwig | d0b9875 | 2013-11-14 08:50:33 -0800 | [diff] [blame] | 594 |  | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 595 | nfs_end_io_direct(inode); | 
| Christoph Hellwig | d0b9875 | 2013-11-14 08:50:33 -0800 | [diff] [blame] | 596 |  | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 597 | if (requested > 0) { | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 598 | result = nfs_direct_wait(dreq); | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 599 | if (result > 0) { | 
|  | 600 | requested -= result; | 
| Christoph Hellwig | c8b8e32 | 2016-04-07 08:51:58 -0700 | [diff] [blame] | 601 | iocb->ki_pos += result; | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 602 | } | 
|  | 603 | iov_iter_revert(iter, requested); | 
|  | 604 | } else { | 
|  | 605 | result = requested; | 
| Christoph Hellwig | 14a3ec79 | 2013-11-14 08:50:31 -0800 | [diff] [blame] | 606 | } | 
| Christoph Hellwig | d0b9875 | 2013-11-14 08:50:33 -0800 | [diff] [blame] | 607 |  | 
| Trond Myklebust | f11ac8d | 2010-06-25 16:35:53 -0400 | [diff] [blame] | 608 | out_release: | 
| Trond Myklebust | b4946ff | 2007-05-30 12:58:00 -0400 | [diff] [blame] | 609 | nfs_direct_req_release(dreq); | 
| Trond Myklebust | f11ac8d | 2010-06-25 16:35:53 -0400 | [diff] [blame] | 610 | out: | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 611 | return result; | 
|  | 612 | } | 
|  | 613 |  | 
| Tom Haynes | 085d1e3 | 2014-12-11 13:04:55 -0500 | [diff] [blame] | 614 | static void | 
|  | 615 | nfs_direct_write_scan_commit_list(struct inode *inode, | 
|  | 616 | struct list_head *list, | 
|  | 617 | struct nfs_commit_info *cinfo) | 
|  | 618 | { | 
| Trond Myklebust | e824f99 | 2017-08-01 11:53:49 -0400 | [diff] [blame] | 619 | mutex_lock(&NFS_I(cinfo->inode)->commit_mutex); | 
| Tom Haynes | 085d1e3 | 2014-12-11 13:04:55 -0500 | [diff] [blame] | 620 | #ifdef CONFIG_NFS_V4_1 | 
|  | 621 | if (cinfo->ds != NULL && cinfo->ds->nwritten != 0) | 
|  | 622 | NFS_SERVER(inode)->pnfs_curr_ld->recover_commit_reqs(list, cinfo); | 
|  | 623 | #endif | 
|  | 624 | nfs_scan_commit_list(&cinfo->mds->list, list, cinfo, 0); | 
| Trond Myklebust | e824f99 | 2017-08-01 11:53:49 -0400 | [diff] [blame] | 625 | mutex_unlock(&NFS_I(cinfo->inode)->commit_mutex); | 
| Tom Haynes | 085d1e3 | 2014-12-11 13:04:55 -0500 | [diff] [blame] | 626 | } | 
|  | 627 |  | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 628 | static void nfs_direct_write_reschedule(struct nfs_direct_req *dreq) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 629 | { | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 630 | struct nfs_pageio_descriptor desc; | 
|  | 631 | struct nfs_page *req, *tmp; | 
|  | 632 | LIST_HEAD(reqs); | 
|  | 633 | struct nfs_commit_info cinfo; | 
|  | 634 | LIST_HEAD(failed); | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 635 | int i; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 636 |  | 
|  | 637 | nfs_init_cinfo_from_dreq(&cinfo, dreq); | 
| Tom Haynes | 085d1e3 | 2014-12-11 13:04:55 -0500 | [diff] [blame] | 638 | nfs_direct_write_scan_commit_list(dreq->inode, &reqs, &cinfo); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 639 |  | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 640 | dreq->count = 0; | 
| Trond Myklebust | a5314a7 | 2016-06-01 21:42:32 -0400 | [diff] [blame] | 641 | dreq->verf.committed = NFS_INVALID_STABLE_HOW; | 
|  | 642 | nfs_clear_pnfs_ds_commit_verifiers(&dreq->ds_cinfo); | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 643 | for (i = 0; i < dreq->mirror_count; i++) | 
|  | 644 | dreq->mirrors[i].count = 0; | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 645 | get_dreq(dreq); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 646 |  | 
| Christoph Hellwig | a20c93e | 2014-04-16 15:07:21 +0200 | [diff] [blame] | 647 | nfs_pageio_init_write(&desc, dreq->inode, FLUSH_STABLE, false, | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 648 | &nfs_direct_write_completion_ops); | 
|  | 649 | desc.pg_dreq = dreq; | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 650 |  | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 651 | req = nfs_list_entry(reqs.next); | 
|  | 652 | nfs_direct_setup_mirroring(dreq, &desc, req); | 
| Peng Tao | d600ad1 | 2015-12-04 02:57:48 +0800 | [diff] [blame] | 653 | if (desc.pg_error < 0) { | 
|  | 654 | list_splice_init(&reqs, &failed); | 
|  | 655 | goto out_failed; | 
|  | 656 | } | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 657 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 658 | list_for_each_entry_safe(req, tmp, &reqs, wb_list) { | 
|  | 659 | if (!nfs_pageio_add_request(&desc, req)) { | 
| Trond Myklebust | 4035c24 | 2012-07-08 10:24:10 -0400 | [diff] [blame] | 660 | nfs_list_remove_request(req); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 661 | nfs_list_add_request(req, &failed); | 
| Dave Wysochanski | fe238e6 | 2016-04-01 13:45:09 -0400 | [diff] [blame] | 662 | spin_lock(&cinfo.inode->i_lock); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 663 | dreq->flags = 0; | 
| Peng Tao | d600ad1 | 2015-12-04 02:57:48 +0800 | [diff] [blame] | 664 | if (desc.pg_error < 0) | 
|  | 665 | dreq->error = desc.pg_error; | 
|  | 666 | else | 
|  | 667 | dreq->error = -EIO; | 
| Dave Wysochanski | fe238e6 | 2016-04-01 13:45:09 -0400 | [diff] [blame] | 668 | spin_unlock(&cinfo.inode->i_lock); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 669 | } | 
| Trond Myklebust | 5a695da | 2012-06-19 13:39:14 -0400 | [diff] [blame] | 670 | nfs_release_request(req); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 671 | } | 
|  | 672 | nfs_pageio_complete(&desc); | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 673 |  | 
| Peng Tao | d600ad1 | 2015-12-04 02:57:48 +0800 | [diff] [blame] | 674 | out_failed: | 
| Trond Myklebust | 4035c24 | 2012-07-08 10:24:10 -0400 | [diff] [blame] | 675 | while (!list_empty(&failed)) { | 
|  | 676 | req = nfs_list_entry(failed.next); | 
|  | 677 | nfs_list_remove_request(req); | 
| Trond Myklebust | 1d1afcb | 2012-05-09 14:04:55 -0400 | [diff] [blame] | 678 | nfs_unlock_and_release_request(req); | 
| Trond Myklebust | 4035c24 | 2012-07-08 10:24:10 -0400 | [diff] [blame] | 679 | } | 
| Trond Myklebust | 607f31e | 2006-06-28 16:52:45 -0400 | [diff] [blame] | 680 |  | 
|  | 681 | if (put_dreq(dreq)) | 
| Anna Schumaker | 4d3b55d | 2016-11-23 13:49:38 -0500 | [diff] [blame] | 682 | nfs_direct_write_complete(dreq); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 683 | } | 
|  | 684 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 685 | static void nfs_direct_commit_complete(struct nfs_commit_data *data) | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 686 | { | 
| Fred Isaman | 0b7c015 | 2012-04-20 14:47:39 -0400 | [diff] [blame] | 687 | struct nfs_direct_req *dreq = data->dreq; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 688 | struct nfs_commit_info cinfo; | 
|  | 689 | struct nfs_page *req; | 
| Trond Myklebust | c9d8f89 | 2008-04-15 16:56:39 -0400 | [diff] [blame] | 690 | int status = data->task.tk_status; | 
|  | 691 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 692 | nfs_init_cinfo_from_dreq(&cinfo, dreq); | 
| Anna Schumaker | fe4f844 | 2017-04-07 14:15:08 -0400 | [diff] [blame] | 693 | if (status < 0 || nfs_direct_cmp_commit_data_verf(dreq, data)) | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 694 | dreq->flags = NFS_ODIRECT_RESCHED_WRITES; | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 695 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 696 | while (!list_empty(&data->pages)) { | 
|  | 697 | req = nfs_list_entry(data->pages.next); | 
|  | 698 | nfs_list_remove_request(req); | 
|  | 699 | if (dreq->flags == NFS_ODIRECT_RESCHED_WRITES) { | 
|  | 700 | /* Note the rewrite will go through mds */ | 
| Weston Andros Adamson | b57ff13 | 2014-09-05 18:20:21 -0400 | [diff] [blame] | 701 | nfs_mark_request_commit(req, NULL, &cinfo, 0); | 
| Fred Isaman | 906369e | 2012-06-08 16:48:33 -0400 | [diff] [blame] | 702 | } else | 
|  | 703 | nfs_release_request(req); | 
| Trond Myklebust | 1d1afcb | 2012-05-09 14:04:55 -0400 | [diff] [blame] | 704 | nfs_unlock_and_release_request(req); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 705 | } | 
|  | 706 |  | 
|  | 707 | if (atomic_dec_and_test(&cinfo.mds->rpcs_out)) | 
| Anna Schumaker | 4d3b55d | 2016-11-23 13:49:38 -0500 | [diff] [blame] | 708 | nfs_direct_write_complete(dreq); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 709 | } | 
|  | 710 |  | 
| Trond Myklebust | b20135d | 2015-12-31 09:28:06 -0500 | [diff] [blame] | 711 | static void nfs_direct_resched_write(struct nfs_commit_info *cinfo, | 
|  | 712 | struct nfs_page *req) | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 713 | { | 
| Trond Myklebust | b20135d | 2015-12-31 09:28:06 -0500 | [diff] [blame] | 714 | struct nfs_direct_req *dreq = cinfo->dreq; | 
|  | 715 |  | 
|  | 716 | spin_lock(&dreq->lock); | 
|  | 717 | dreq->flags = NFS_ODIRECT_RESCHED_WRITES; | 
|  | 718 | spin_unlock(&dreq->lock); | 
|  | 719 | nfs_mark_request_commit(req, NULL, cinfo, 0); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 720 | } | 
|  | 721 |  | 
|  | 722 | static const struct nfs_commit_completion_ops nfs_direct_commit_completion_ops = { | 
|  | 723 | .completion = nfs_direct_commit_complete, | 
| Trond Myklebust | b20135d | 2015-12-31 09:28:06 -0500 | [diff] [blame] | 724 | .resched_write = nfs_direct_resched_write, | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 725 | }; | 
|  | 726 |  | 
|  | 727 | static void nfs_direct_commit_schedule(struct nfs_direct_req *dreq) | 
|  | 728 | { | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 729 | int res; | 
|  | 730 | struct nfs_commit_info cinfo; | 
|  | 731 | LIST_HEAD(mds_list); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 732 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 733 | nfs_init_cinfo_from_dreq(&cinfo, dreq); | 
|  | 734 | nfs_scan_commit(dreq->inode, &mds_list, &cinfo); | 
|  | 735 | res = nfs_generic_commit_list(dreq->inode, &mds_list, 0, &cinfo); | 
|  | 736 | if (res < 0) /* res == -ENOMEM */ | 
|  | 737 | nfs_direct_write_reschedule(dreq); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 738 | } | 
|  | 739 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 740 | static void nfs_direct_write_schedule_work(struct work_struct *work) | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 741 | { | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 742 | struct nfs_direct_req *dreq = container_of(work, struct nfs_direct_req, work); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 743 | int flags = dreq->flags; | 
|  | 744 |  | 
|  | 745 | dreq->flags = 0; | 
|  | 746 | switch (flags) { | 
|  | 747 | case NFS_ODIRECT_DO_COMMIT: | 
|  | 748 | nfs_direct_commit_schedule(dreq); | 
|  | 749 | break; | 
|  | 750 | case NFS_ODIRECT_RESCHED_WRITES: | 
|  | 751 | nfs_direct_write_reschedule(dreq); | 
|  | 752 | break; | 
|  | 753 | default: | 
| Trond Myklebust | f7b5c34 | 2016-06-23 09:29:47 -0400 | [diff] [blame] | 754 | nfs_zap_mapping(dreq->inode, dreq->inode->i_mapping); | 
|  | 755 | nfs_direct_complete(dreq); | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 756 | } | 
|  | 757 | } | 
|  | 758 |  | 
| Anna Schumaker | 4d3b55d | 2016-11-23 13:49:38 -0500 | [diff] [blame] | 759 | static void nfs_direct_write_complete(struct nfs_direct_req *dreq) | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 760 | { | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 761 | schedule_work(&dreq->work); /* Calls nfs_direct_write_schedule_work */ | 
| Trond Myklebust | fad6149 | 2006-03-20 13:44:36 -0500 | [diff] [blame] | 762 | } | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 763 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 764 | static void nfs_direct_write_completion(struct nfs_pgio_header *hdr) | 
|  | 765 | { | 
|  | 766 | struct nfs_direct_req *dreq = hdr->dreq; | 
|  | 767 | struct nfs_commit_info cinfo; | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 768 | bool request_commit = false; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 769 | struct nfs_page *req = nfs_list_entry(hdr->pages.next); | 
|  | 770 |  | 
|  | 771 | if (test_bit(NFS_IOHDR_REDO, &hdr->flags)) | 
|  | 772 | goto out_put; | 
|  | 773 |  | 
|  | 774 | nfs_init_cinfo_from_dreq(&cinfo, dreq); | 
|  | 775 |  | 
|  | 776 | spin_lock(&dreq->lock); | 
|  | 777 |  | 
| J. Bruce Fields | 1b8d97b | 2018-01-16 10:08:00 -0500 | [diff] [blame] | 778 | if (test_bit(NFS_IOHDR_ERROR, &hdr->flags)) | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 779 | dreq->error = hdr->error; | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 780 | if (dreq->error == 0) { | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 781 | nfs_direct_good_bytes(dreq, hdr); | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 782 | if (nfs_write_need_commit(hdr)) { | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 783 | if (dreq->flags == NFS_ODIRECT_RESCHED_WRITES) | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 784 | request_commit = true; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 785 | else if (dreq->flags == 0) { | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 786 | nfs_direct_set_hdr_verf(dreq, hdr); | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 787 | request_commit = true; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 788 | dreq->flags = NFS_ODIRECT_DO_COMMIT; | 
|  | 789 | } else if (dreq->flags == NFS_ODIRECT_DO_COMMIT) { | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 790 | request_commit = true; | 
|  | 791 | if (nfs_direct_set_or_cmp_hdr_verf(dreq, hdr)) | 
| Weston Andros Adamson | 5002c58 | 2014-05-15 11:56:54 -0400 | [diff] [blame] | 792 | dreq->flags = | 
|  | 793 | NFS_ODIRECT_RESCHED_WRITES; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 794 | } | 
|  | 795 | } | 
|  | 796 | } | 
|  | 797 | spin_unlock(&dreq->lock); | 
|  | 798 |  | 
|  | 799 | while (!list_empty(&hdr->pages)) { | 
| Weston Andros Adamson | 2bfc6e5 | 2014-05-15 11:56:45 -0400 | [diff] [blame] | 800 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 801 | req = nfs_list_entry(hdr->pages.next); | 
|  | 802 | nfs_list_remove_request(req); | 
| Weston Andros Adamson | c65e625 | 2014-06-09 11:48:36 -0400 | [diff] [blame] | 803 | if (request_commit) { | 
| Trond Myklebust | 0427708 | 2012-05-09 13:54:53 -0400 | [diff] [blame] | 804 | kref_get(&req->wb_kref); | 
| Weston Andros Adamson | b57ff13 | 2014-09-05 18:20:21 -0400 | [diff] [blame] | 805 | nfs_mark_request_commit(req, hdr->lseg, &cinfo, | 
|  | 806 | hdr->ds_commit_idx); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 807 | } | 
| Trond Myklebust | 1d1afcb | 2012-05-09 14:04:55 -0400 | [diff] [blame] | 808 | nfs_unlock_and_release_request(req); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 809 | } | 
|  | 810 |  | 
|  | 811 | out_put: | 
|  | 812 | if (put_dreq(dreq)) | 
| Anna Schumaker | 4d3b55d | 2016-11-23 13:49:38 -0500 | [diff] [blame] | 813 | nfs_direct_write_complete(dreq); | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 814 | hdr->release(hdr); | 
|  | 815 | } | 
|  | 816 |  | 
| Trond Myklebust | 3e9e0ca3 | 2012-04-30 13:40:06 -0400 | [diff] [blame] | 817 | static void nfs_write_sync_pgio_error(struct list_head *head) | 
|  | 818 | { | 
|  | 819 | struct nfs_page *req; | 
|  | 820 |  | 
|  | 821 | while (!list_empty(head)) { | 
|  | 822 | req = nfs_list_entry(head->next); | 
|  | 823 | nfs_list_remove_request(req); | 
| Trond Myklebust | 1d1afcb | 2012-05-09 14:04:55 -0400 | [diff] [blame] | 824 | nfs_unlock_and_release_request(req); | 
| Trond Myklebust | 3e9e0ca3 | 2012-04-30 13:40:06 -0400 | [diff] [blame] | 825 | } | 
|  | 826 | } | 
|  | 827 |  | 
| Trond Myklebust | dc602dd | 2015-12-31 11:44:06 -0500 | [diff] [blame] | 828 | static void nfs_direct_write_reschedule_io(struct nfs_pgio_header *hdr) | 
|  | 829 | { | 
|  | 830 | struct nfs_direct_req *dreq = hdr->dreq; | 
|  | 831 |  | 
|  | 832 | spin_lock(&dreq->lock); | 
|  | 833 | if (dreq->error == 0) { | 
|  | 834 | dreq->flags = NFS_ODIRECT_RESCHED_WRITES; | 
|  | 835 | /* fake unstable write to let common nfs resend pages */ | 
|  | 836 | hdr->verf.committed = NFS_UNSTABLE; | 
|  | 837 | hdr->good_bytes = hdr->args.count; | 
|  | 838 | } | 
|  | 839 | spin_unlock(&dreq->lock); | 
|  | 840 | } | 
|  | 841 |  | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 842 | static const struct nfs_pgio_completion_ops nfs_direct_write_completion_ops = { | 
| Trond Myklebust | 3e9e0ca3 | 2012-04-30 13:40:06 -0400 | [diff] [blame] | 843 | .error_cleanup = nfs_write_sync_pgio_error, | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 844 | .init_hdr = nfs_direct_pgio_init, | 
|  | 845 | .completion = nfs_direct_write_completion, | 
| Trond Myklebust | dc602dd | 2015-12-31 11:44:06 -0500 | [diff] [blame] | 846 | .reschedule_io = nfs_direct_write_reschedule_io, | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 847 | }; | 
|  | 848 |  | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 849 |  | 
|  | 850 | /* | 
|  | 851 | * NB: Return the value of the first error return code.  Subsequent | 
|  | 852 | *     errors after the first one are ignored. | 
|  | 853 | */ | 
|  | 854 | /* | 
|  | 855 | * For each wsize'd chunk of the user's buffer, dispatch an NFS WRITE | 
|  | 856 | * operation.  If nfs_writedata_alloc() or get_user_pages() fails, | 
|  | 857 | * bail and stop sending more writes.  Write length accounting is | 
|  | 858 | * handled automatically by nfs_direct_write_result().  Otherwise, if | 
|  | 859 | * no requests have been sent, just return an error. | 
|  | 860 | */ | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 861 | static ssize_t nfs_direct_write_schedule_iovec(struct nfs_direct_req *dreq, | 
| Al Viro | 619d30b | 2014-03-04 21:53:33 -0500 | [diff] [blame] | 862 | struct iov_iter *iter, | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 863 | loff_t pos) | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 864 | { | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 865 | struct nfs_pageio_descriptor desc; | 
| Trond Myklebust | 1d59d61 | 2012-05-31 12:22:33 -0400 | [diff] [blame] | 866 | struct inode *inode = dreq->inode; | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 867 | ssize_t result = 0; | 
|  | 868 | size_t requested_bytes = 0; | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 869 | size_t wsize = max_t(size_t, NFS_SERVER(inode)->wsize, PAGE_SIZE); | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 870 |  | 
| Christoph Hellwig | a20c93e | 2014-04-16 15:07:21 +0200 | [diff] [blame] | 871 | nfs_pageio_init_write(&desc, inode, FLUSH_COND_STABLE, false, | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 872 | &nfs_direct_write_completion_ops); | 
|  | 873 | desc.pg_dreq = dreq; | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 874 | get_dreq(dreq); | 
| Jens Axboe | fe0f07d | 2015-04-15 17:05:48 -0600 | [diff] [blame] | 875 | inode_dio_begin(inode); | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 876 |  | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 877 | NFS_I(inode)->write_io += iov_iter_count(iter); | 
|  | 878 | while (iov_iter_count(iter)) { | 
|  | 879 | struct page **pagevec; | 
|  | 880 | size_t bytes; | 
|  | 881 | size_t pgbase; | 
|  | 882 | unsigned npages, i; | 
|  | 883 |  | 
|  | 884 | result = iov_iter_get_pages_alloc(iter, &pagevec, | 
|  | 885 | wsize, &pgbase); | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 886 | if (result < 0) | 
|  | 887 | break; | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 888 |  | 
|  | 889 | bytes = result; | 
|  | 890 | iov_iter_advance(iter, bytes); | 
|  | 891 | npages = (result + pgbase + PAGE_SIZE - 1) / PAGE_SIZE; | 
|  | 892 | for (i = 0; i < npages; i++) { | 
|  | 893 | struct nfs_page *req; | 
|  | 894 | unsigned int req_len = min_t(size_t, bytes, PAGE_SIZE - pgbase); | 
|  | 895 |  | 
| Linus Torvalds | 16b9057 | 2014-06-12 10:30:18 -0700 | [diff] [blame] | 896 | req = nfs_create_request(dreq->ctx, pagevec[i], NULL, | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 897 | pgbase, req_len); | 
|  | 898 | if (IS_ERR(req)) { | 
|  | 899 | result = PTR_ERR(req); | 
|  | 900 | break; | 
|  | 901 | } | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 902 |  | 
|  | 903 | nfs_direct_setup_mirroring(dreq, &desc, req); | 
| Peng Tao | d600ad1 | 2015-12-04 02:57:48 +0800 | [diff] [blame] | 904 | if (desc.pg_error < 0) { | 
|  | 905 | nfs_free_request(req); | 
|  | 906 | result = desc.pg_error; | 
|  | 907 | break; | 
|  | 908 | } | 
| Weston Andros Adamson | 0a00b77 | 2014-09-19 12:48:33 -0400 | [diff] [blame] | 909 |  | 
| Al Viro | 91f79c4 | 2014-03-21 04:58:33 -0400 | [diff] [blame] | 910 | nfs_lock_request(req); | 
|  | 911 | req->wb_index = pos >> PAGE_SHIFT; | 
|  | 912 | req->wb_offset = pos & ~PAGE_MASK; | 
|  | 913 | if (!nfs_pageio_add_request(&desc, req)) { | 
|  | 914 | result = desc.pg_error; | 
|  | 915 | nfs_unlock_and_release_request(req); | 
|  | 916 | break; | 
|  | 917 | } | 
|  | 918 | pgbase = 0; | 
|  | 919 | bytes -= req_len; | 
|  | 920 | requested_bytes += req_len; | 
|  | 921 | pos += req_len; | 
|  | 922 | dreq->bytes_left -= req_len; | 
|  | 923 | } | 
|  | 924 | nfs_direct_release_pages(pagevec, npages); | 
|  | 925 | kvfree(pagevec); | 
|  | 926 | if (result < 0) | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 927 | break; | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 928 | } | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 929 | nfs_pageio_complete(&desc); | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 930 |  | 
| Chuck Lever | 839f7ad | 2011-01-21 15:54:57 +0000 | [diff] [blame] | 931 | /* | 
|  | 932 | * If no bytes were started, return the error, and let the | 
|  | 933 | * generic layer handle the completion. | 
|  | 934 | */ | 
|  | 935 | if (requested_bytes == 0) { | 
| Jens Axboe | fe0f07d | 2015-04-15 17:05:48 -0600 | [diff] [blame] | 936 | inode_dio_end(inode); | 
| Chuck Lever | 839f7ad | 2011-01-21 15:54:57 +0000 | [diff] [blame] | 937 | nfs_direct_req_release(dreq); | 
|  | 938 | return result < 0 ? result : -EIO; | 
|  | 939 | } | 
|  | 940 |  | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 941 | if (put_dreq(dreq)) | 
| Anna Schumaker | 4d3b55d | 2016-11-23 13:49:38 -0500 | [diff] [blame] | 942 | nfs_direct_write_complete(dreq); | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 943 | return requested_bytes; | 
| Chuck Lever | 19f7378 | 2007-11-12 12:16:47 -0500 | [diff] [blame] | 944 | } | 
|  | 945 |  | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 946 | /** | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 947 | * nfs_file_direct_write - file direct write operation for NFS files | 
|  | 948 | * @iocb: target I/O control block | 
| Al Viro | 619d30b | 2014-03-04 21:53:33 -0500 | [diff] [blame] | 949 | * @iter: vector of user buffers from which to write data | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 950 | * | 
|  | 951 | * We use this function for direct writes instead of calling | 
|  | 952 | * generic_file_aio_write() in order to avoid taking the inode | 
|  | 953 | * semaphore and updating the i_size.  The NFS server will set | 
|  | 954 | * the new i_size and this client must read the updated size | 
|  | 955 | * back into its cache.  We let the server do generic write | 
|  | 956 | * parameter checking and report problems. | 
|  | 957 | * | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 958 | * We eliminate local atime updates, see direct read above. | 
|  | 959 | * | 
|  | 960 | * We avoid unnecessary page cache invalidations for normal cached | 
|  | 961 | * readers of this file. | 
|  | 962 | * | 
|  | 963 | * Note that O_APPEND is not supported for NFS direct writes, as there | 
|  | 964 | * is no atomic O_APPEND write facility in the NFS protocol. | 
|  | 965 | */ | 
| Al Viro | 65a4a1c | 2015-04-09 14:11:08 -0400 | [diff] [blame] | 966 | ssize_t nfs_file_direct_write(struct kiocb *iocb, struct iov_iter *iter) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 967 | { | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 968 | ssize_t result = -EINVAL, requested; | 
| Trond Myklebust | 89698b2 | 2016-06-23 10:35:48 -0400 | [diff] [blame] | 969 | size_t count; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 970 | struct file *file = iocb->ki_filp; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 971 | struct address_space *mapping = file->f_mapping; | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 972 | struct inode *inode = mapping->host; | 
|  | 973 | struct nfs_direct_req *dreq; | 
|  | 974 | struct nfs_lock_context *l_ctx; | 
| Al Viro | 65a4a1c | 2015-04-09 14:11:08 -0400 | [diff] [blame] | 975 | loff_t pos, end; | 
| Chuck Lever | c216fd7 | 2007-11-12 12:16:52 -0500 | [diff] [blame] | 976 |  | 
| Al Viro | 6de1472 | 2013-09-16 10:53:17 -0400 | [diff] [blame] | 977 | dfprintk(FILE, "NFS: direct write(%pD2, %zd@%Ld)\n", | 
| Al Viro | 3309dd0 | 2015-04-09 12:55:47 -0400 | [diff] [blame] | 978 | file, iov_iter_count(iter), (long long) iocb->ki_pos); | 
| Badari Pulavarty | 027445c | 2006-09-30 23:28:46 -0700 | [diff] [blame] | 979 |  | 
| Trond Myklebust | 89698b2 | 2016-06-23 10:35:48 -0400 | [diff] [blame] | 980 | result = generic_write_checks(iocb, iter); | 
|  | 981 | if (result <= 0) | 
|  | 982 | return result; | 
|  | 983 | count = result; | 
|  | 984 | nfs_add_stats(mapping->host, NFSIOS_DIRECTWRITTENBYTES, count); | 
| Al Viro | 3309dd0 | 2015-04-09 12:55:47 -0400 | [diff] [blame] | 985 |  | 
|  | 986 | pos = iocb->ki_pos; | 
| Kirill A. Shutemov | 09cbfea | 2016-04-01 15:29:47 +0300 | [diff] [blame] | 987 | end = (pos + iov_iter_count(iter) - 1) >> PAGE_SHIFT; | 
| Chuck Lever | ce1a8e6 | 2005-11-30 18:08:17 -0500 | [diff] [blame] | 988 |  | 
| Trond Myklebust | 89698b2 | 2016-06-23 10:35:48 -0400 | [diff] [blame] | 989 | task_io_account_write(count); | 
| Konstantin Khlebnikov | 7ec10f2 | 2011-02-22 00:28:34 +0300 | [diff] [blame] | 990 |  | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 991 | result = -ENOMEM; | 
|  | 992 | dreq = nfs_direct_req_alloc(); | 
|  | 993 | if (!dreq) | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 994 | goto out; | 
| Chuck Lever | 9eafa8c | 2006-03-20 13:44:33 -0500 | [diff] [blame] | 995 |  | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 996 | dreq->inode = inode; | 
| Trond Myklebust | 89698b2 | 2016-06-23 10:35:48 -0400 | [diff] [blame] | 997 | dreq->bytes_left = dreq->max_count = count; | 
| Peng Tao | 5fadeb4 | 2015-01-19 12:41:16 +0800 | [diff] [blame] | 998 | dreq->io_start = pos; | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 999 | dreq->ctx = get_nfs_open_context(nfs_file_open_context(iocb->ki_filp)); | 
|  | 1000 | l_ctx = nfs_get_lock_context(dreq->ctx); | 
|  | 1001 | if (IS_ERR(l_ctx)) { | 
|  | 1002 | result = PTR_ERR(l_ctx); | 
|  | 1003 | goto out_release; | 
| Fred Isaman | 1763da1 | 2012-04-20 14:47:57 -0400 | [diff] [blame] | 1004 | } | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 1005 | dreq->l_ctx = l_ctx; | 
|  | 1006 | if (!is_sync_kiocb(iocb)) | 
|  | 1007 | dreq->iocb = iocb; | 
|  | 1008 |  | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 1009 | nfs_start_io_direct(inode); | 
|  | 1010 |  | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 1011 | requested = nfs_direct_write_schedule_iovec(dreq, iter, pos); | 
| Christoph Hellwig | a9ab5e8 | 2013-11-14 08:50:34 -0800 | [diff] [blame] | 1012 |  | 
|  | 1013 | if (mapping->nrpages) { | 
|  | 1014 | invalidate_inode_pages2_range(mapping, | 
| Kirill A. Shutemov | 09cbfea | 2016-04-01 15:29:47 +0300 | [diff] [blame] | 1015 | pos >> PAGE_SHIFT, end); | 
| Christoph Hellwig | a9ab5e8 | 2013-11-14 08:50:34 -0800 | [diff] [blame] | 1016 | } | 
|  | 1017 |  | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 1018 | nfs_end_io_direct(inode); | 
| Christoph Hellwig | a9ab5e8 | 2013-11-14 08:50:34 -0800 | [diff] [blame] | 1019 |  | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 1020 | if (requested > 0) { | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 1021 | result = nfs_direct_wait(dreq); | 
|  | 1022 | if (result > 0) { | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 1023 | requested -= result; | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 1024 | iocb->ki_pos = pos + result; | 
| Christoph Hellwig | e259221 | 2016-04-07 08:52:01 -0700 | [diff] [blame] | 1025 | /* XXX: should check the generic_write_sync retval */ | 
|  | 1026 | generic_write_sync(iocb, result); | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 1027 | } | 
| Al Viro | 85128b2 | 2017-04-13 09:31:51 -0400 | [diff] [blame] | 1028 | iov_iter_revert(iter, requested); | 
|  | 1029 | } else { | 
|  | 1030 | result = requested; | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 1031 | } | 
|  | 1032 | out_release: | 
|  | 1033 | nfs_direct_req_release(dreq); | 
| Trond Myklebust | a5864c9 | 2016-06-03 17:07:19 -0400 | [diff] [blame] | 1034 | out: | 
| Christoph Hellwig | 22cd1bf | 2013-11-14 08:50:32 -0800 | [diff] [blame] | 1035 | return result; | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1036 | } | 
|  | 1037 |  | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 1038 | /** | 
|  | 1039 | * nfs_init_directcache - create a slab cache for nfs_direct_req structures | 
|  | 1040 | * | 
|  | 1041 | */ | 
| David Howells | f7b422b | 2006-06-09 09:34:33 -0400 | [diff] [blame] | 1042 | int __init nfs_init_directcache(void) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1043 | { | 
|  | 1044 | nfs_direct_cachep = kmem_cache_create("nfs_direct_cache", | 
|  | 1045 | sizeof(struct nfs_direct_req), | 
| Paul Jackson | fffb60f | 2006-03-24 03:16:06 -0800 | [diff] [blame] | 1046 | 0, (SLAB_RECLAIM_ACCOUNT| | 
|  | 1047 | SLAB_MEM_SPREAD), | 
| Paul Mundt | 20c2df8 | 2007-07-20 10:11:58 +0900 | [diff] [blame] | 1048 | NULL); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1049 | if (nfs_direct_cachep == NULL) | 
|  | 1050 | return -ENOMEM; | 
|  | 1051 |  | 
|  | 1052 | return 0; | 
|  | 1053 | } | 
|  | 1054 |  | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 1055 | /** | 
| David Howells | f7b422b | 2006-06-09 09:34:33 -0400 | [diff] [blame] | 1056 | * nfs_destroy_directcache - destroy the slab cache for nfs_direct_req structures | 
| Chuck Lever | 8846705 | 2006-03-20 13:44:34 -0500 | [diff] [blame] | 1057 | * | 
|  | 1058 | */ | 
| David Brownell | 266bee8 | 2006-06-27 12:59:15 -0700 | [diff] [blame] | 1059 | void nfs_destroy_directcache(void) | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1060 | { | 
| Alexey Dobriyan | 1a1d92c | 2006-09-27 01:49:40 -0700 | [diff] [blame] | 1061 | kmem_cache_destroy(nfs_direct_cachep); | 
| Linus Torvalds | 1da177e | 2005-04-16 15:20:36 -0700 | [diff] [blame] | 1062 | } |