blob: fed65303eeeb246ae74285d60541d13a814b7cb1 [file] [log] [blame]
Miklos Szeredi334f4852005-09-09 13:10:27 -07001/*
2 FUSE: Filesystem in Userspace
Miklos Szeredi1729a162008-11-26 12:03:54 +01003 Copyright (C) 2001-2008 Miklos Szeredi <miklos@szeredi.hu>
Miklos Szeredi334f4852005-09-09 13:10:27 -07004
5 This program can be distributed under the terms of the GNU GPL.
6 See the file COPYING.
7*/
8
9#include "fuse_i.h"
10
11#include <linux/init.h>
12#include <linux/module.h>
13#include <linux/poll.h>
14#include <linux/uio.h>
15#include <linux/miscdevice.h>
16#include <linux/pagemap.h>
17#include <linux/file.h>
18#include <linux/slab.h>
Miklos Szeredidd3bb142010-05-25 15:06:06 +020019#include <linux/pipe_fs_i.h>
Miklos Szeredice534fb2010-05-25 15:06:07 +020020#include <linux/swap.h>
21#include <linux/splice.h>
Miklos Szeredi334f4852005-09-09 13:10:27 -070022
23MODULE_ALIAS_MISCDEV(FUSE_MINOR);
Kay Sievers578454f2010-05-20 18:07:20 +020024MODULE_ALIAS("devname:fuse");
Miklos Szeredi334f4852005-09-09 13:10:27 -070025
Christoph Lametere18b8902006-12-06 20:33:20 -080026static struct kmem_cache *fuse_req_cachep;
Miklos Szeredi334f4852005-09-09 13:10:27 -070027
Miklos Szeredi8bfc0162006-01-16 22:14:28 -080028static struct fuse_conn *fuse_get_conn(struct file *file)
Miklos Szeredi334f4852005-09-09 13:10:27 -070029{
Miklos Szeredi0720b312006-04-10 22:54:55 -070030 /*
31 * Lockless access is OK, because file->private data is set
32 * once during mount and is valid until the file is released.
33 */
34 return file->private_data;
Miklos Szeredi334f4852005-09-09 13:10:27 -070035}
36
Miklos Szeredi8bfc0162006-01-16 22:14:28 -080037static void fuse_request_init(struct fuse_req *req)
Miklos Szeredi334f4852005-09-09 13:10:27 -070038{
39 memset(req, 0, sizeof(*req));
40 INIT_LIST_HEAD(&req->list);
Miklos Szeredia4d27e72006-06-25 05:48:54 -070041 INIT_LIST_HEAD(&req->intr_entry);
Miklos Szeredi334f4852005-09-09 13:10:27 -070042 init_waitqueue_head(&req->waitq);
43 atomic_set(&req->count, 1);
44}
45
46struct fuse_req *fuse_request_alloc(void)
47{
Christoph Lametere94b1762006-12-06 20:33:17 -080048 struct fuse_req *req = kmem_cache_alloc(fuse_req_cachep, GFP_KERNEL);
Miklos Szeredi334f4852005-09-09 13:10:27 -070049 if (req)
50 fuse_request_init(req);
51 return req;
52}
Tejun Heo08cbf542009-04-14 10:54:53 +090053EXPORT_SYMBOL_GPL(fuse_request_alloc);
Miklos Szeredi334f4852005-09-09 13:10:27 -070054
Miklos Szeredi3be5a522008-04-30 00:54:41 -070055struct fuse_req *fuse_request_alloc_nofs(void)
56{
57 struct fuse_req *req = kmem_cache_alloc(fuse_req_cachep, GFP_NOFS);
58 if (req)
59 fuse_request_init(req);
60 return req;
61}
62
Miklos Szeredi334f4852005-09-09 13:10:27 -070063void fuse_request_free(struct fuse_req *req)
64{
65 kmem_cache_free(fuse_req_cachep, req);
66}
67
Miklos Szeredi8bfc0162006-01-16 22:14:28 -080068static void block_sigs(sigset_t *oldset)
Miklos Szeredi334f4852005-09-09 13:10:27 -070069{
70 sigset_t mask;
71
72 siginitsetinv(&mask, sigmask(SIGKILL));
73 sigprocmask(SIG_BLOCK, &mask, oldset);
74}
75
Miklos Szeredi8bfc0162006-01-16 22:14:28 -080076static void restore_sigs(sigset_t *oldset)
Miklos Szeredi334f4852005-09-09 13:10:27 -070077{
78 sigprocmask(SIG_SETMASK, oldset, NULL);
79}
80
Miklos Szeredi334f4852005-09-09 13:10:27 -070081static void __fuse_get_request(struct fuse_req *req)
82{
83 atomic_inc(&req->count);
84}
85
86/* Must be called with > 1 refcount */
87static void __fuse_put_request(struct fuse_req *req)
88{
89 BUG_ON(atomic_read(&req->count) < 2);
90 atomic_dec(&req->count);
91}
92
Miklos Szeredi33649c92006-06-25 05:48:52 -070093static void fuse_req_init_context(struct fuse_req *req)
94{
David Howells2186a712008-11-14 10:38:53 +110095 req->in.h.uid = current_fsuid();
96 req->in.h.gid = current_fsgid();
Miklos Szeredi33649c92006-06-25 05:48:52 -070097 req->in.h.pid = current->pid;
98}
99
Miklos Szeredice1d5a42006-04-10 22:54:58 -0700100struct fuse_req *fuse_get_req(struct fuse_conn *fc)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700101{
Miklos Szeredi08a53cd2006-04-10 22:54:59 -0700102 struct fuse_req *req;
103 sigset_t oldset;
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200104 int intr;
Miklos Szeredi08a53cd2006-04-10 22:54:59 -0700105 int err;
106
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200107 atomic_inc(&fc->num_waiting);
Miklos Szeredi08a53cd2006-04-10 22:54:59 -0700108 block_sigs(&oldset);
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200109 intr = wait_event_interruptible(fc->blocked_waitq, !fc->blocked);
Miklos Szeredi08a53cd2006-04-10 22:54:59 -0700110 restore_sigs(&oldset);
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200111 err = -EINTR;
112 if (intr)
113 goto out;
Miklos Szeredi08a53cd2006-04-10 22:54:59 -0700114
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700115 err = -ENOTCONN;
116 if (!fc->connected)
117 goto out;
118
Miklos Szeredi08a53cd2006-04-10 22:54:59 -0700119 req = fuse_request_alloc();
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200120 err = -ENOMEM;
Miklos Szeredice1d5a42006-04-10 22:54:58 -0700121 if (!req)
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200122 goto out;
Miklos Szeredi334f4852005-09-09 13:10:27 -0700123
Miklos Szeredi33649c92006-06-25 05:48:52 -0700124 fuse_req_init_context(req);
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200125 req->waiting = 1;
Miklos Szeredi334f4852005-09-09 13:10:27 -0700126 return req;
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200127
128 out:
129 atomic_dec(&fc->num_waiting);
130 return ERR_PTR(err);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700131}
Tejun Heo08cbf542009-04-14 10:54:53 +0900132EXPORT_SYMBOL_GPL(fuse_get_req);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700133
Miklos Szeredi33649c92006-06-25 05:48:52 -0700134/*
135 * Return request in fuse_file->reserved_req. However that may
136 * currently be in use. If that is the case, wait for it to become
137 * available.
138 */
139static struct fuse_req *get_reserved_req(struct fuse_conn *fc,
140 struct file *file)
141{
142 struct fuse_req *req = NULL;
143 struct fuse_file *ff = file->private_data;
144
145 do {
Miklos Szeredide5e3de2007-10-16 23:31:00 -0700146 wait_event(fc->reserved_req_waitq, ff->reserved_req);
Miklos Szeredi33649c92006-06-25 05:48:52 -0700147 spin_lock(&fc->lock);
148 if (ff->reserved_req) {
149 req = ff->reserved_req;
150 ff->reserved_req = NULL;
151 get_file(file);
152 req->stolen_file = file;
153 }
154 spin_unlock(&fc->lock);
155 } while (!req);
156
157 return req;
158}
159
160/*
161 * Put stolen request back into fuse_file->reserved_req
162 */
163static void put_reserved_req(struct fuse_conn *fc, struct fuse_req *req)
164{
165 struct file *file = req->stolen_file;
166 struct fuse_file *ff = file->private_data;
167
168 spin_lock(&fc->lock);
169 fuse_request_init(req);
170 BUG_ON(ff->reserved_req);
171 ff->reserved_req = req;
Miklos Szeredide5e3de2007-10-16 23:31:00 -0700172 wake_up_all(&fc->reserved_req_waitq);
Miklos Szeredi33649c92006-06-25 05:48:52 -0700173 spin_unlock(&fc->lock);
174 fput(file);
175}
176
177/*
178 * Gets a requests for a file operation, always succeeds
179 *
180 * This is used for sending the FLUSH request, which must get to
181 * userspace, due to POSIX locks which may need to be unlocked.
182 *
183 * If allocation fails due to OOM, use the reserved request in
184 * fuse_file.
185 *
186 * This is very unlikely to deadlock accidentally, since the
187 * filesystem should not have it's own file open. If deadlock is
188 * intentional, it can still be broken by "aborting" the filesystem.
189 */
190struct fuse_req *fuse_get_req_nofail(struct fuse_conn *fc, struct file *file)
191{
192 struct fuse_req *req;
193
194 atomic_inc(&fc->num_waiting);
195 wait_event(fc->blocked_waitq, !fc->blocked);
196 req = fuse_request_alloc();
197 if (!req)
198 req = get_reserved_req(fc, file);
199
200 fuse_req_init_context(req);
201 req->waiting = 1;
202 return req;
203}
204
Miklos Szeredi334f4852005-09-09 13:10:27 -0700205void fuse_put_request(struct fuse_conn *fc, struct fuse_req *req)
206{
Miklos Szeredi7128ec22006-02-04 23:27:40 -0800207 if (atomic_dec_and_test(&req->count)) {
Miklos Szeredi9bc5ddd2006-04-11 21:16:09 +0200208 if (req->waiting)
209 atomic_dec(&fc->num_waiting);
Miklos Szeredi33649c92006-06-25 05:48:52 -0700210
211 if (req->stolen_file)
212 put_reserved_req(fc, req);
213 else
214 fuse_request_free(req);
Miklos Szeredi7128ec22006-02-04 23:27:40 -0800215 }
216}
Tejun Heo08cbf542009-04-14 10:54:53 +0900217EXPORT_SYMBOL_GPL(fuse_put_request);
Miklos Szeredi7128ec22006-02-04 23:27:40 -0800218
Miklos Szeredid12def12008-02-06 01:38:39 -0800219static unsigned len_args(unsigned numargs, struct fuse_arg *args)
220{
221 unsigned nbytes = 0;
222 unsigned i;
223
224 for (i = 0; i < numargs; i++)
225 nbytes += args[i].size;
226
227 return nbytes;
228}
229
230static u64 fuse_get_unique(struct fuse_conn *fc)
231{
232 fc->reqctr++;
233 /* zero is special */
234 if (fc->reqctr == 0)
235 fc->reqctr = 1;
236
237 return fc->reqctr;
238}
239
240static void queue_request(struct fuse_conn *fc, struct fuse_req *req)
241{
Miklos Szeredid12def12008-02-06 01:38:39 -0800242 req->in.h.len = sizeof(struct fuse_in_header) +
243 len_args(req->in.numargs, (struct fuse_arg *) req->in.args);
244 list_add_tail(&req->list, &fc->pending);
245 req->state = FUSE_REQ_PENDING;
246 if (!req->waiting) {
247 req->waiting = 1;
248 atomic_inc(&fc->num_waiting);
249 }
250 wake_up(&fc->waitq);
251 kill_fasync(&fc->fasync, SIGIO, POLL_IN);
252}
253
Miklos Szeredi07e77dc2010-12-07 20:16:56 +0100254void fuse_queue_forget(struct fuse_conn *fc, struct fuse_forget_link *forget,
255 u64 nodeid, u64 nlookup)
256{
257 forget->nodeid = nodeid;
258 forget->nlookup = nlookup;
259
260 spin_lock(&fc->lock);
261 fc->forget_list_tail->next = forget;
262 fc->forget_list_tail = forget;
263 wake_up(&fc->waitq);
264 kill_fasync(&fc->fasync, SIGIO, POLL_IN);
265 spin_unlock(&fc->lock);
266}
267
Miklos Szeredid12def12008-02-06 01:38:39 -0800268static void flush_bg_queue(struct fuse_conn *fc)
269{
Csaba Henk7a6d3c82009-07-01 17:28:41 -0700270 while (fc->active_background < fc->max_background &&
Miklos Szeredid12def12008-02-06 01:38:39 -0800271 !list_empty(&fc->bg_queue)) {
272 struct fuse_req *req;
273
274 req = list_entry(fc->bg_queue.next, struct fuse_req, list);
275 list_del(&req->list);
276 fc->active_background++;
Miklos Szeredi2d45ba32010-07-12 14:41:40 +0200277 req->in.h.unique = fuse_get_unique(fc);
Miklos Szeredid12def12008-02-06 01:38:39 -0800278 queue_request(fc, req);
279 }
280}
281
Miklos Szeredi6dbbcb12006-04-26 10:49:06 +0200282/*
Miklos Szeredi334f4852005-09-09 13:10:27 -0700283 * This function is called when a request is finished. Either a reply
Miklos Szeredif9a28422006-06-25 05:48:53 -0700284 * has arrived or it was aborted (and not yet sent) or some error
Miklos Szeredif43b1552006-01-16 22:14:26 -0800285 * occurred during communication with userspace, or the device file
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700286 * was closed. The requester thread is woken up (if still waiting),
287 * the 'end' callback is called if given, else the reference to the
288 * request is released
Miklos Szeredi7128ec22006-02-04 23:27:40 -0800289 *
Miklos Szeredid7133112006-04-10 22:54:55 -0700290 * Called with fc->lock, unlocks it
Miklos Szeredi334f4852005-09-09 13:10:27 -0700291 */
292static void request_end(struct fuse_conn *fc, struct fuse_req *req)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +0200293__releases(fc->lock)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700294{
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700295 void (*end) (struct fuse_conn *, struct fuse_req *) = req->end;
296 req->end = NULL;
Miklos Szeredid77a1d52006-01-16 22:14:31 -0800297 list_del(&req->list);
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700298 list_del(&req->intr_entry);
Miklos Szeredi83cfd492006-01-16 22:14:31 -0800299 req->state = FUSE_REQ_FINISHED;
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700300 if (req->background) {
Csaba Henk7a6d3c82009-07-01 17:28:41 -0700301 if (fc->num_background == fc->max_background) {
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700302 fc->blocked = 0;
303 wake_up_all(&fc->blocked_waitq);
304 }
Csaba Henk7a6d3c82009-07-01 17:28:41 -0700305 if (fc->num_background == fc->congestion_threshold &&
Tejun Heoa325f9b2009-04-14 10:54:52 +0900306 fc->connected && fc->bdi_initialized) {
Jens Axboe8aa7e842009-07-09 14:52:32 +0200307 clear_bdi_congested(&fc->bdi, BLK_RW_SYNC);
308 clear_bdi_congested(&fc->bdi, BLK_RW_ASYNC);
Miklos Szeredif92b99b2007-10-16 23:30:59 -0700309 }
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700310 fc->num_background--;
Miklos Szeredid12def12008-02-06 01:38:39 -0800311 fc->active_background--;
312 flush_bg_queue(fc);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700313 }
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700314 spin_unlock(&fc->lock);
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700315 wake_up(&req->waitq);
316 if (end)
317 end(fc, req);
Tejun Heoe9bb09d2008-11-26 12:03:54 +0100318 fuse_put_request(fc, req);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700319}
320
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700321static void wait_answer_interruptible(struct fuse_conn *fc,
322 struct fuse_req *req)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +0200323__releases(fc->lock)
324__acquires(fc->lock)
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700325{
326 if (signal_pending(current))
327 return;
328
329 spin_unlock(&fc->lock);
330 wait_event_interruptible(req->waitq, req->state == FUSE_REQ_FINISHED);
331 spin_lock(&fc->lock);
332}
333
334static void queue_interrupt(struct fuse_conn *fc, struct fuse_req *req)
335{
336 list_add_tail(&req->intr_entry, &fc->interrupts);
337 wake_up(&fc->waitq);
338 kill_fasync(&fc->fasync, SIGIO, POLL_IN);
339}
340
Miklos Szeredi7c352bd2005-09-09 13:10:39 -0700341static void request_wait_answer(struct fuse_conn *fc, struct fuse_req *req)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +0200342__releases(fc->lock)
343__acquires(fc->lock)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700344{
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700345 if (!fc->no_interrupt) {
346 /* Any signal may interrupt this */
347 wait_answer_interruptible(fc, req);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700348
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700349 if (req->aborted)
350 goto aborted;
351 if (req->state == FUSE_REQ_FINISHED)
352 return;
353
354 req->interrupted = 1;
355 if (req->state == FUSE_REQ_SENT)
356 queue_interrupt(fc, req);
357 }
358
Miklos Szeredia131de02007-10-16 23:31:04 -0700359 if (!req->force) {
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700360 sigset_t oldset;
361
362 /* Only fatal signals may interrupt this */
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700363 block_sigs(&oldset);
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700364 wait_answer_interruptible(fc, req);
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700365 restore_sigs(&oldset);
Miklos Szeredia131de02007-10-16 23:31:04 -0700366
367 if (req->aborted)
368 goto aborted;
369 if (req->state == FUSE_REQ_FINISHED)
370 return;
371
372 /* Request is not yet in userspace, bail out */
373 if (req->state == FUSE_REQ_PENDING) {
374 list_del(&req->list);
375 __fuse_put_request(req);
376 req->out.h.error = -EINTR;
377 return;
378 }
Miklos Szeredi51eb01e2006-06-25 05:48:50 -0700379 }
Miklos Szeredi334f4852005-09-09 13:10:27 -0700380
Miklos Szeredia131de02007-10-16 23:31:04 -0700381 /*
382 * Either request is already in userspace, or it was forced.
383 * Wait it out.
384 */
385 spin_unlock(&fc->lock);
386 wait_event(req->waitq, req->state == FUSE_REQ_FINISHED);
387 spin_lock(&fc->lock);
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700388
Miklos Szeredia131de02007-10-16 23:31:04 -0700389 if (!req->aborted)
390 return;
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700391
392 aborted:
Miklos Szeredia131de02007-10-16 23:31:04 -0700393 BUG_ON(req->state != FUSE_REQ_FINISHED);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700394 if (req->locked) {
395 /* This is uninterruptible sleep, because data is
396 being copied to/from the buffers of req. During
397 locked state, there mustn't be any filesystem
398 operation (e.g. page fault), since that could lead
399 to deadlock */
Miklos Szeredid7133112006-04-10 22:54:55 -0700400 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700401 wait_event(req->waitq, !req->locked);
Miklos Szeredid7133112006-04-10 22:54:55 -0700402 spin_lock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700403 }
Miklos Szeredi334f4852005-09-09 13:10:27 -0700404}
405
/*
 * Send a request and wait for the answer.
 *
 * If the connection is gone or in an error state, the request is not
 * queued and req->out.h.error is set to -ENOTCONN or -ECONNREFUSED
 * respectively.
 */
void fuse_request_send(struct fuse_conn *fc, struct fuse_req *req)
{
	req->isreply = 1;

	spin_lock(&fc->lock);
	if (!fc->connected) {
		req->out.h.error = -ENOTCONN;
	} else if (fc->conn_error) {
		req->out.h.error = -ECONNREFUSED;
	} else {
		req->in.h.unique = fuse_get_unique(fc);
		queue_request(fc, req);
		/*
		 * Take an extra reference: the request is still needed
		 * after request_end() has dropped one.
		 */
		__fuse_get_request(req);

		request_wait_answer(fc, req);
	}
	spin_unlock(&fc->lock);
}
EXPORT_SYMBOL_GPL(fuse_request_send);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700426
Tejun Heob93f8582008-11-26 12:03:55 +0100427static void fuse_request_send_nowait_locked(struct fuse_conn *fc,
428 struct fuse_req *req)
Miklos Szeredid12def12008-02-06 01:38:39 -0800429{
430 req->background = 1;
431 fc->num_background++;
Csaba Henk7a6d3c82009-07-01 17:28:41 -0700432 if (fc->num_background == fc->max_background)
Miklos Szeredid12def12008-02-06 01:38:39 -0800433 fc->blocked = 1;
Csaba Henk7a6d3c82009-07-01 17:28:41 -0700434 if (fc->num_background == fc->congestion_threshold &&
Tejun Heoa325f9b2009-04-14 10:54:52 +0900435 fc->bdi_initialized) {
Jens Axboe8aa7e842009-07-09 14:52:32 +0200436 set_bdi_congested(&fc->bdi, BLK_RW_SYNC);
437 set_bdi_congested(&fc->bdi, BLK_RW_ASYNC);
Miklos Szeredid12def12008-02-06 01:38:39 -0800438 }
439 list_add_tail(&req->list, &fc->bg_queue);
440 flush_bg_queue(fc);
441}
442
Tejun Heob93f8582008-11-26 12:03:55 +0100443static void fuse_request_send_nowait(struct fuse_conn *fc, struct fuse_req *req)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700444{
Miklos Szeredid7133112006-04-10 22:54:55 -0700445 spin_lock(&fc->lock);
Miklos Szeredi1e9a4ed2005-09-09 13:10:31 -0700446 if (fc->connected) {
Tejun Heob93f8582008-11-26 12:03:55 +0100447 fuse_request_send_nowait_locked(fc, req);
Miklos Szeredid7133112006-04-10 22:54:55 -0700448 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700449 } else {
450 req->out.h.error = -ENOTCONN;
451 request_end(fc, req);
452 }
453}
454
Tejun Heob93f8582008-11-26 12:03:55 +0100455void fuse_request_send_background(struct fuse_conn *fc, struct fuse_req *req)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700456{
457 req->isreply = 1;
Tejun Heob93f8582008-11-26 12:03:55 +0100458 fuse_request_send_nowait(fc, req);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700459}
Tejun Heo08cbf542009-04-14 10:54:53 +0900460EXPORT_SYMBOL_GPL(fuse_request_send_background);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700461
Miklos Szeredi2d45ba32010-07-12 14:41:40 +0200462static int fuse_request_send_notify_reply(struct fuse_conn *fc,
463 struct fuse_req *req, u64 unique)
464{
465 int err = -ENODEV;
466
467 req->isreply = 0;
468 req->in.h.unique = unique;
469 spin_lock(&fc->lock);
470 if (fc->connected) {
471 queue_request(fc, req);
472 err = 0;
473 }
474 spin_unlock(&fc->lock);
475
476 return err;
477}
478
Miklos Szeredi334f4852005-09-09 13:10:27 -0700479/*
Miklos Szeredi3be5a522008-04-30 00:54:41 -0700480 * Called under fc->lock
481 *
482 * fc->connected must have been checked previously
483 */
Tejun Heob93f8582008-11-26 12:03:55 +0100484void fuse_request_send_background_locked(struct fuse_conn *fc,
485 struct fuse_req *req)
Miklos Szeredi3be5a522008-04-30 00:54:41 -0700486{
487 req->isreply = 1;
Tejun Heob93f8582008-11-26 12:03:55 +0100488 fuse_request_send_nowait_locked(fc, req);
Miklos Szeredi3be5a522008-04-30 00:54:41 -0700489}
490
491/*
Miklos Szeredi334f4852005-09-09 13:10:27 -0700492 * Lock the request. Up to the next unlock_request() there mustn't be
493 * anything that could cause a page-fault. If the request was already
Miklos Szeredif9a28422006-06-25 05:48:53 -0700494 * aborted bail out.
Miklos Szeredi334f4852005-09-09 13:10:27 -0700495 */
Miklos Szeredid7133112006-04-10 22:54:55 -0700496static int lock_request(struct fuse_conn *fc, struct fuse_req *req)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700497{
498 int err = 0;
499 if (req) {
Miklos Szeredid7133112006-04-10 22:54:55 -0700500 spin_lock(&fc->lock);
Miklos Szeredif9a28422006-06-25 05:48:53 -0700501 if (req->aborted)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700502 err = -ENOENT;
503 else
504 req->locked = 1;
Miklos Szeredid7133112006-04-10 22:54:55 -0700505 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700506 }
507 return err;
508}
509
510/*
Miklos Szeredif9a28422006-06-25 05:48:53 -0700511 * Unlock request. If it was aborted during being locked, the
Miklos Szeredi334f4852005-09-09 13:10:27 -0700512 * requester thread is currently waiting for it to be unlocked, so
513 * wake it up.
514 */
Miklos Szeredid7133112006-04-10 22:54:55 -0700515static void unlock_request(struct fuse_conn *fc, struct fuse_req *req)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700516{
517 if (req) {
Miklos Szeredid7133112006-04-10 22:54:55 -0700518 spin_lock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700519 req->locked = 0;
Miklos Szeredif9a28422006-06-25 05:48:53 -0700520 if (req->aborted)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700521 wake_up(&req->waitq);
Miklos Szeredid7133112006-04-10 22:54:55 -0700522 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700523 }
524}
525
/*
 * State of a copy between a request and either a userspace iovec or a
 * set of pipe buffers.
 */
struct fuse_copy_state {
	/* connection, needed for locking/unlocking the request */
	struct fuse_conn *fc;
	/* non-zero when copying from the request into the buffer */
	int write;
	/* request being copied; may be NULL */
	struct fuse_req *req;
	/* next iovec segment to consume (iovec mode) */
	const struct iovec *iov;
	/* next pipe buffer to use; non-NULL selects pipe mode */
	struct pipe_buffer *pipebufs;
	/* pipe buffer that is currently mapped, if any */
	struct pipe_buffer *currbuf;
	/* pipe the buffers belong to (pipe mode) */
	struct pipe_inode_info *pipe;
	/*
	 * iovec mode and pipe read mode: segments/buffers still
	 * available; pipe write mode: buffers filled so far
	 */
	unsigned long nr_segs;
	/* bytes left in the current iovec segment */
	unsigned long seglen;
	/* user address of the next byte in the current iovec segment */
	unsigned long addr;
	/* user page currently pinned and mapped (iovec mode) */
	struct page *pg;
	/* kernel mapping of the current page */
	void *mapaddr;
	/* current position inside the mapped page */
	void *buf;
	/* bytes left in the currently mapped chunk */
	unsigned len;
	/* try to move whole pages instead of copying them */
	unsigned move_pages:1;
};
543
Miklos Szeredid7133112006-04-10 22:54:55 -0700544static void fuse_copy_init(struct fuse_copy_state *cs, struct fuse_conn *fc,
Miklos Szeredic3021622010-05-25 15:06:07 +0200545 int write,
Miklos Szeredid7133112006-04-10 22:54:55 -0700546 const struct iovec *iov, unsigned long nr_segs)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700547{
548 memset(cs, 0, sizeof(*cs));
Miklos Szeredid7133112006-04-10 22:54:55 -0700549 cs->fc = fc;
Miklos Szeredi334f4852005-09-09 13:10:27 -0700550 cs->write = write;
Miklos Szeredi334f4852005-09-09 13:10:27 -0700551 cs->iov = iov;
552 cs->nr_segs = nr_segs;
553}
554
555/* Unmap and put previous page of userspace buffer */
Miklos Szeredi8bfc0162006-01-16 22:14:28 -0800556static void fuse_copy_finish(struct fuse_copy_state *cs)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700557{
Miklos Szeredidd3bb142010-05-25 15:06:06 +0200558 if (cs->currbuf) {
559 struct pipe_buffer *buf = cs->currbuf;
560
Miklos Szeredic3021622010-05-25 15:06:07 +0200561 if (!cs->write) {
562 buf->ops->unmap(cs->pipe, buf, cs->mapaddr);
563 } else {
Miklos Szeredi7909b1c2010-07-12 14:41:40 +0200564 kunmap(buf->page);
Miklos Szeredic3021622010-05-25 15:06:07 +0200565 buf->len = PAGE_SIZE - cs->len;
566 }
Miklos Szeredidd3bb142010-05-25 15:06:06 +0200567 cs->currbuf = NULL;
568 cs->mapaddr = NULL;
569 } else if (cs->mapaddr) {
Miklos Szeredi7909b1c2010-07-12 14:41:40 +0200570 kunmap(cs->pg);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700571 if (cs->write) {
572 flush_dcache_page(cs->pg);
573 set_page_dirty_lock(cs->pg);
574 }
575 put_page(cs->pg);
576 cs->mapaddr = NULL;
577 }
578}
579
580/*
581 * Get another pagefull of userspace buffer, and map it to kernel
582 * address space, and lock request
583 */
584static int fuse_copy_fill(struct fuse_copy_state *cs)
585{
586 unsigned long offset;
587 int err;
588
Miklos Szeredid7133112006-04-10 22:54:55 -0700589 unlock_request(cs->fc, cs->req);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700590 fuse_copy_finish(cs);
Miklos Szeredidd3bb142010-05-25 15:06:06 +0200591 if (cs->pipebufs) {
592 struct pipe_buffer *buf = cs->pipebufs;
593
Miklos Szeredic3021622010-05-25 15:06:07 +0200594 if (!cs->write) {
595 err = buf->ops->confirm(cs->pipe, buf);
596 if (err)
597 return err;
Miklos Szeredidd3bb142010-05-25 15:06:06 +0200598
Miklos Szeredic3021622010-05-25 15:06:07 +0200599 BUG_ON(!cs->nr_segs);
600 cs->currbuf = buf;
Miklos Szeredi7909b1c2010-07-12 14:41:40 +0200601 cs->mapaddr = buf->ops->map(cs->pipe, buf, 0);
Miklos Szeredic3021622010-05-25 15:06:07 +0200602 cs->len = buf->len;
603 cs->buf = cs->mapaddr + buf->offset;
604 cs->pipebufs++;
605 cs->nr_segs--;
606 } else {
607 struct page *page;
608
609 if (cs->nr_segs == cs->pipe->buffers)
610 return -EIO;
611
612 page = alloc_page(GFP_HIGHUSER);
613 if (!page)
614 return -ENOMEM;
615
616 buf->page = page;
617 buf->offset = 0;
618 buf->len = 0;
619
620 cs->currbuf = buf;
Miklos Szeredi7909b1c2010-07-12 14:41:40 +0200621 cs->mapaddr = kmap(page);
Miklos Szeredic3021622010-05-25 15:06:07 +0200622 cs->buf = cs->mapaddr;
623 cs->len = PAGE_SIZE;
624 cs->pipebufs++;
625 cs->nr_segs++;
626 }
Miklos Szeredidd3bb142010-05-25 15:06:06 +0200627 } else {
628 if (!cs->seglen) {
629 BUG_ON(!cs->nr_segs);
630 cs->seglen = cs->iov[0].iov_len;
631 cs->addr = (unsigned long) cs->iov[0].iov_base;
632 cs->iov++;
633 cs->nr_segs--;
634 }
635 err = get_user_pages_fast(cs->addr, 1, cs->write, &cs->pg);
636 if (err < 0)
637 return err;
638 BUG_ON(err != 1);
639 offset = cs->addr % PAGE_SIZE;
Miklos Szeredi7909b1c2010-07-12 14:41:40 +0200640 cs->mapaddr = kmap(cs->pg);
Miklos Szeredidd3bb142010-05-25 15:06:06 +0200641 cs->buf = cs->mapaddr + offset;
642 cs->len = min(PAGE_SIZE - offset, cs->seglen);
643 cs->seglen -= cs->len;
644 cs->addr += cs->len;
Miklos Szeredi334f4852005-09-09 13:10:27 -0700645 }
Miklos Szeredi334f4852005-09-09 13:10:27 -0700646
Miklos Szeredid7133112006-04-10 22:54:55 -0700647 return lock_request(cs->fc, cs->req);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700648}
649
650/* Do as much copy to/from userspace buffer as we can */
Miklos Szeredi8bfc0162006-01-16 22:14:28 -0800651static int fuse_copy_do(struct fuse_copy_state *cs, void **val, unsigned *size)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700652{
653 unsigned ncpy = min(*size, cs->len);
654 if (val) {
655 if (cs->write)
656 memcpy(cs->buf, *val, ncpy);
657 else
658 memcpy(*val, cs->buf, ncpy);
659 *val += ncpy;
660 }
661 *size -= ncpy;
662 cs->len -= ncpy;
663 cs->buf += ncpy;
664 return ncpy;
665}
666
Miklos Szeredice534fb2010-05-25 15:06:07 +0200667static int fuse_check_page(struct page *page)
668{
669 if (page_mapcount(page) ||
670 page->mapping != NULL ||
671 page_count(page) != 1 ||
672 (page->flags & PAGE_FLAGS_CHECK_AT_PREP &
673 ~(1 << PG_locked |
674 1 << PG_referenced |
675 1 << PG_uptodate |
676 1 << PG_lru |
677 1 << PG_active |
678 1 << PG_reclaim))) {
679 printk(KERN_WARNING "fuse: trying to steal weird page\n");
680 printk(KERN_WARNING " page=%p index=%li flags=%08lx, count=%i, mapcount=%i, mapping=%p\n", page, page->index, page->flags, page_count(page), page_mapcount(page), page->mapping);
681 return 1;
682 }
683 return 0;
684}
685
686static int fuse_try_move_page(struct fuse_copy_state *cs, struct page **pagep)
687{
688 int err;
689 struct page *oldpage = *pagep;
690 struct page *newpage;
691 struct pipe_buffer *buf = cs->pipebufs;
692 struct address_space *mapping;
693 pgoff_t index;
694
695 unlock_request(cs->fc, cs->req);
696 fuse_copy_finish(cs);
697
698 err = buf->ops->confirm(cs->pipe, buf);
699 if (err)
700 return err;
701
702 BUG_ON(!cs->nr_segs);
703 cs->currbuf = buf;
704 cs->len = buf->len;
705 cs->pipebufs++;
706 cs->nr_segs--;
707
708 if (cs->len != PAGE_SIZE)
709 goto out_fallback;
710
711 if (buf->ops->steal(cs->pipe, buf) != 0)
712 goto out_fallback;
713
714 newpage = buf->page;
715
716 if (WARN_ON(!PageUptodate(newpage)))
717 return -EIO;
718
719 ClearPageMappedToDisk(newpage);
720
721 if (fuse_check_page(newpage) != 0)
722 goto out_fallback_unlock;
723
724 mapping = oldpage->mapping;
725 index = oldpage->index;
726
727 /*
728 * This is a new and locked page, it shouldn't be mapped or
729 * have any special flags on it
730 */
731 if (WARN_ON(page_mapped(oldpage)))
732 goto out_fallback_unlock;
733 if (WARN_ON(page_has_private(oldpage)))
734 goto out_fallback_unlock;
735 if (WARN_ON(PageDirty(oldpage) || PageWriteback(oldpage)))
736 goto out_fallback_unlock;
737 if (WARN_ON(PageMlocked(oldpage)))
738 goto out_fallback_unlock;
739
740 remove_from_page_cache(oldpage);
741 page_cache_release(oldpage);
742
743 err = add_to_page_cache_locked(newpage, mapping, index, GFP_KERNEL);
744 if (err) {
745 printk(KERN_WARNING "fuse_try_move_page: failed to add page");
746 goto out_fallback_unlock;
747 }
748 page_cache_get(newpage);
749
750 if (!(buf->flags & PIPE_BUF_FLAG_LRU))
751 lru_cache_add_file(newpage);
752
753 err = 0;
754 spin_lock(&cs->fc->lock);
755 if (cs->req->aborted)
756 err = -ENOENT;
757 else
758 *pagep = newpage;
759 spin_unlock(&cs->fc->lock);
760
761 if (err) {
762 unlock_page(newpage);
763 page_cache_release(newpage);
764 return err;
765 }
766
767 unlock_page(oldpage);
768 page_cache_release(oldpage);
769 cs->len = 0;
770
771 return 0;
772
773out_fallback_unlock:
774 unlock_page(newpage);
775out_fallback:
776 cs->mapaddr = buf->ops->map(cs->pipe, buf, 1);
777 cs->buf = cs->mapaddr + buf->offset;
778
779 err = lock_request(cs->fc, cs->req);
780 if (err)
781 return err;
782
783 return 1;
784}
785
Miklos Szeredic3021622010-05-25 15:06:07 +0200786static int fuse_ref_page(struct fuse_copy_state *cs, struct page *page,
787 unsigned offset, unsigned count)
788{
789 struct pipe_buffer *buf;
790
791 if (cs->nr_segs == cs->pipe->buffers)
792 return -EIO;
793
794 unlock_request(cs->fc, cs->req);
795 fuse_copy_finish(cs);
796
797 buf = cs->pipebufs;
798 page_cache_get(page);
799 buf->page = page;
800 buf->offset = offset;
801 buf->len = count;
802
803 cs->pipebufs++;
804 cs->nr_segs++;
805 cs->len = 0;
806
807 return 0;
808}
809
Miklos Szeredi334f4852005-09-09 13:10:27 -0700810/*
811 * Copy a page in the request to/from the userspace buffer. Must be
812 * done atomically
813 */
Miklos Szeredice534fb2010-05-25 15:06:07 +0200814static int fuse_copy_page(struct fuse_copy_state *cs, struct page **pagep,
Miklos Szeredi8bfc0162006-01-16 22:14:28 -0800815 unsigned offset, unsigned count, int zeroing)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700816{
Miklos Szeredice534fb2010-05-25 15:06:07 +0200817 int err;
818 struct page *page = *pagep;
819
Miklos Szeredib6777c42010-10-26 14:22:27 -0700820 if (page && zeroing && count < PAGE_SIZE)
821 clear_highpage(page);
822
Miklos Szeredi334f4852005-09-09 13:10:27 -0700823 while (count) {
Miklos Szeredic3021622010-05-25 15:06:07 +0200824 if (cs->write && cs->pipebufs && page) {
825 return fuse_ref_page(cs, page, offset, count);
826 } else if (!cs->len) {
Miklos Szeredice534fb2010-05-25 15:06:07 +0200827 if (cs->move_pages && page &&
828 offset == 0 && count == PAGE_SIZE) {
829 err = fuse_try_move_page(cs, pagep);
830 if (err <= 0)
831 return err;
832 } else {
833 err = fuse_copy_fill(cs);
834 if (err)
835 return err;
836 }
Miklos Szeredi1729a162008-11-26 12:03:54 +0100837 }
Miklos Szeredi334f4852005-09-09 13:10:27 -0700838 if (page) {
Miklos Szeredib6777c42010-10-26 14:22:27 -0700839 void *mapaddr = kmap_atomic(page, KM_USER0);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700840 void *buf = mapaddr + offset;
841 offset += fuse_copy_do(cs, &buf, &count);
Miklos Szeredib6777c42010-10-26 14:22:27 -0700842 kunmap_atomic(mapaddr, KM_USER0);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700843 } else
844 offset += fuse_copy_do(cs, NULL, &count);
845 }
846 if (page && !cs->write)
847 flush_dcache_page(page);
848 return 0;
849}
850
851/* Copy pages in the request to/from userspace buffer */
852static int fuse_copy_pages(struct fuse_copy_state *cs, unsigned nbytes,
853 int zeroing)
854{
855 unsigned i;
856 struct fuse_req *req = cs->req;
857 unsigned offset = req->page_offset;
858 unsigned count = min(nbytes, (unsigned) PAGE_SIZE - offset);
859
860 for (i = 0; i < req->num_pages && (nbytes || zeroing); i++) {
Miklos Szeredice534fb2010-05-25 15:06:07 +0200861 int err;
862
863 err = fuse_copy_page(cs, &req->pages[i], offset, count,
864 zeroing);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700865 if (err)
866 return err;
867
868 nbytes -= count;
869 count = min(nbytes, (unsigned) PAGE_SIZE);
870 offset = 0;
871 }
872 return 0;
873}
874
875/* Copy a single argument in the request to/from userspace buffer */
876static int fuse_copy_one(struct fuse_copy_state *cs, void *val, unsigned size)
877{
878 while (size) {
Miklos Szeredi1729a162008-11-26 12:03:54 +0100879 if (!cs->len) {
880 int err = fuse_copy_fill(cs);
881 if (err)
882 return err;
883 }
Miklos Szeredi334f4852005-09-09 13:10:27 -0700884 fuse_copy_do(cs, &val, &size);
885 }
886 return 0;
887}
888
889/* Copy request arguments to/from userspace buffer */
890static int fuse_copy_args(struct fuse_copy_state *cs, unsigned numargs,
891 unsigned argpages, struct fuse_arg *args,
892 int zeroing)
893{
894 int err = 0;
895 unsigned i;
896
897 for (i = 0; !err && i < numargs; i++) {
898 struct fuse_arg *arg = &args[i];
899 if (i == numargs - 1 && argpages)
900 err = fuse_copy_pages(cs, arg->size, zeroing);
901 else
902 err = fuse_copy_one(cs, arg->value, arg->size);
903 }
904 return err;
905}
906
Miklos Szeredi07e77dc2010-12-07 20:16:56 +0100907static int forget_pending(struct fuse_conn *fc)
908{
909 return fc->forget_list_head.next != NULL;
910}
911
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700912static int request_pending(struct fuse_conn *fc)
913{
Miklos Szeredi07e77dc2010-12-07 20:16:56 +0100914 return !list_empty(&fc->pending) || !list_empty(&fc->interrupts) ||
915 forget_pending(fc);
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700916}
917
Miklos Szeredi334f4852005-09-09 13:10:27 -0700918/* Wait until a request is available on the pending list */
919static void request_wait(struct fuse_conn *fc)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +0200920__releases(fc->lock)
921__acquires(fc->lock)
Miklos Szeredi334f4852005-09-09 13:10:27 -0700922{
923 DECLARE_WAITQUEUE(wait, current);
924
925 add_wait_queue_exclusive(&fc->waitq, &wait);
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700926 while (fc->connected && !request_pending(fc)) {
Miklos Szeredi334f4852005-09-09 13:10:27 -0700927 set_current_state(TASK_INTERRUPTIBLE);
928 if (signal_pending(current))
929 break;
930
Miklos Szeredid7133112006-04-10 22:54:55 -0700931 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700932 schedule();
Miklos Szeredid7133112006-04-10 22:54:55 -0700933 spin_lock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -0700934 }
935 set_current_state(TASK_RUNNING);
936 remove_wait_queue(&fc->waitq, &wait);
937}
938
939/*
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700940 * Transfer an interrupt request to userspace
941 *
942 * Unlike other requests this is assembled on demand, without a need
943 * to allocate a separate fuse_req structure.
944 *
945 * Called with fc->lock held, releases it
946 */
Miklos Szeredic3021622010-05-25 15:06:07 +0200947static int fuse_read_interrupt(struct fuse_conn *fc, struct fuse_copy_state *cs,
948 size_t nbytes, struct fuse_req *req)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +0200949__releases(fc->lock)
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700950{
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700951 struct fuse_in_header ih;
952 struct fuse_interrupt_in arg;
953 unsigned reqsize = sizeof(ih) + sizeof(arg);
954 int err;
955
956 list_del_init(&req->intr_entry);
957 req->intr_unique = fuse_get_unique(fc);
958 memset(&ih, 0, sizeof(ih));
959 memset(&arg, 0, sizeof(arg));
960 ih.len = reqsize;
961 ih.opcode = FUSE_INTERRUPT;
962 ih.unique = req->intr_unique;
963 arg.unique = req->in.h.unique;
964
965 spin_unlock(&fc->lock);
Miklos Szeredic3021622010-05-25 15:06:07 +0200966 if (nbytes < reqsize)
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700967 return -EINVAL;
968
Miklos Szeredic3021622010-05-25 15:06:07 +0200969 err = fuse_copy_one(cs, &ih, sizeof(ih));
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700970 if (!err)
Miklos Szeredic3021622010-05-25 15:06:07 +0200971 err = fuse_copy_one(cs, &arg, sizeof(arg));
972 fuse_copy_finish(cs);
Miklos Szeredia4d27e72006-06-25 05:48:54 -0700973
974 return err ? err : reqsize;
975}
976
Miklos Szeredi07e77dc2010-12-07 20:16:56 +0100977static struct fuse_forget_link *dequeue_forget(struct fuse_conn *fc)
978{
979 struct fuse_forget_link *forget = fc->forget_list_head.next;
980
981 fc->forget_list_head.next = forget->next;
982 if (fc->forget_list_head.next == NULL)
983 fc->forget_list_tail = &fc->forget_list_head;
984
985 return forget;
986}
987
988static int fuse_read_single_forget(struct fuse_conn *fc,
989 struct fuse_copy_state *cs,
990 size_t nbytes)
991__releases(fc->lock)
992{
993 int err;
994 struct fuse_forget_link *forget = dequeue_forget(fc);
995 struct fuse_forget_in arg = {
996 .nlookup = forget->nlookup,
997 };
998 struct fuse_in_header ih = {
999 .opcode = FUSE_FORGET,
1000 .nodeid = forget->nodeid,
1001 .unique = fuse_get_unique(fc),
1002 .len = sizeof(ih) + sizeof(arg),
1003 };
1004
1005 spin_unlock(&fc->lock);
1006 kfree(forget);
1007 if (nbytes < ih.len)
1008 return -EINVAL;
1009
1010 err = fuse_copy_one(cs, &ih, sizeof(ih));
1011 if (!err)
1012 err = fuse_copy_one(cs, &arg, sizeof(arg));
1013 fuse_copy_finish(cs);
1014
1015 if (err)
1016 return err;
1017
1018 return ih.len;
1019}
1020
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001021/*
Miklos Szeredi334f4852005-09-09 13:10:27 -07001022 * Read a single request into the userspace filesystem's buffer. This
1023 * function waits until a request is available, then removes it from
1024 * the pending list and copies request data to userspace buffer. If
Miklos Szeredif9a28422006-06-25 05:48:53 -07001025 * no reply is needed (FORGET) or request has been aborted or there
1026 * was an error during the copying then it's finished by calling
Miklos Szeredi334f4852005-09-09 13:10:27 -07001027 * request_end(). Otherwise add it to the processing list, and set
1028 * the 'sent' flag.
1029 */
Miklos Szeredic3021622010-05-25 15:06:07 +02001030static ssize_t fuse_dev_do_read(struct fuse_conn *fc, struct file *file,
1031 struct fuse_copy_state *cs, size_t nbytes)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001032{
1033 int err;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001034 struct fuse_req *req;
1035 struct fuse_in *in;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001036 unsigned reqsize;
1037
Miklos Szeredi1d3d7522006-01-06 00:19:40 -08001038 restart:
Miklos Szeredid7133112006-04-10 22:54:55 -07001039 spin_lock(&fc->lock);
Jeff Dikee5ac1d12006-04-10 22:54:53 -07001040 err = -EAGAIN;
1041 if ((file->f_flags & O_NONBLOCK) && fc->connected &&
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001042 !request_pending(fc))
Jeff Dikee5ac1d12006-04-10 22:54:53 -07001043 goto err_unlock;
1044
Miklos Szeredi334f4852005-09-09 13:10:27 -07001045 request_wait(fc);
1046 err = -ENODEV;
Miklos Szeredi9ba7cbb2006-01-16 22:14:34 -08001047 if (!fc->connected)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001048 goto err_unlock;
1049 err = -ERESTARTSYS;
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001050 if (!request_pending(fc))
Miklos Szeredi334f4852005-09-09 13:10:27 -07001051 goto err_unlock;
1052
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001053 if (!list_empty(&fc->interrupts)) {
1054 req = list_entry(fc->interrupts.next, struct fuse_req,
1055 intr_entry);
Miklos Szeredic3021622010-05-25 15:06:07 +02001056 return fuse_read_interrupt(fc, cs, nbytes, req);
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001057 }
1058
Miklos Szeredi07e77dc2010-12-07 20:16:56 +01001059 if (forget_pending(fc)) {
1060 if (list_empty(&fc->pending) || fc->forget_batch-- > 0)
1061 return fuse_read_single_forget(fc, cs, nbytes);
1062
1063 if (fc->forget_batch <= -8)
1064 fc->forget_batch = 16;
1065 }
1066
Miklos Szeredi334f4852005-09-09 13:10:27 -07001067 req = list_entry(fc->pending.next, struct fuse_req, list);
Miklos Szeredi83cfd492006-01-16 22:14:31 -08001068 req->state = FUSE_REQ_READING;
Miklos Szeredid77a1d52006-01-16 22:14:31 -08001069 list_move(&req->list, &fc->io);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001070
1071 in = &req->in;
Miklos Szeredi1d3d7522006-01-06 00:19:40 -08001072 reqsize = in->h.len;
1073 /* If request is too large, reply with an error and restart the read */
Miklos Szeredic3021622010-05-25 15:06:07 +02001074 if (nbytes < reqsize) {
Miklos Szeredi1d3d7522006-01-06 00:19:40 -08001075 req->out.h.error = -EIO;
1076 /* SETXATTR is special, since it may contain too large data */
1077 if (in->h.opcode == FUSE_SETXATTR)
1078 req->out.h.error = -E2BIG;
1079 request_end(fc, req);
1080 goto restart;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001081 }
Miklos Szeredid7133112006-04-10 22:54:55 -07001082 spin_unlock(&fc->lock);
Miklos Szeredic3021622010-05-25 15:06:07 +02001083 cs->req = req;
1084 err = fuse_copy_one(cs, &in->h, sizeof(in->h));
Miklos Szeredi1d3d7522006-01-06 00:19:40 -08001085 if (!err)
Miklos Szeredic3021622010-05-25 15:06:07 +02001086 err = fuse_copy_args(cs, in->numargs, in->argpages,
Miklos Szeredi1d3d7522006-01-06 00:19:40 -08001087 (struct fuse_arg *) in->args, 0);
Miklos Szeredic3021622010-05-25 15:06:07 +02001088 fuse_copy_finish(cs);
Miklos Szeredid7133112006-04-10 22:54:55 -07001089 spin_lock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001090 req->locked = 0;
Miklos Szeredic9c9d7d2007-10-16 23:31:05 -07001091 if (req->aborted) {
1092 request_end(fc, req);
1093 return -ENODEV;
1094 }
Miklos Szeredi334f4852005-09-09 13:10:27 -07001095 if (err) {
Miklos Szeredic9c9d7d2007-10-16 23:31:05 -07001096 req->out.h.error = -EIO;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001097 request_end(fc, req);
1098 return err;
1099 }
1100 if (!req->isreply)
1101 request_end(fc, req);
1102 else {
Miklos Szeredi83cfd492006-01-16 22:14:31 -08001103 req->state = FUSE_REQ_SENT;
Miklos Szeredid77a1d52006-01-16 22:14:31 -08001104 list_move_tail(&req->list, &fc->processing);
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001105 if (req->interrupted)
1106 queue_interrupt(fc, req);
Miklos Szeredid7133112006-04-10 22:54:55 -07001107 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001108 }
1109 return reqsize;
1110
1111 err_unlock:
Miklos Szeredid7133112006-04-10 22:54:55 -07001112 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001113 return err;
1114}
1115
Miklos Szeredic3021622010-05-25 15:06:07 +02001116static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
1117 unsigned long nr_segs, loff_t pos)
1118{
1119 struct fuse_copy_state cs;
1120 struct file *file = iocb->ki_filp;
1121 struct fuse_conn *fc = fuse_get_conn(file);
1122 if (!fc)
1123 return -EPERM;
1124
1125 fuse_copy_init(&cs, fc, 1, iov, nr_segs);
1126
1127 return fuse_dev_do_read(fc, file, &cs, iov_length(iov, nr_segs));
1128}
1129
/*
 * ->steal() callback for pipe buffers created by the fuse device.
 *
 * Unconditionally returns 1 and touches neither @pipe nor @buf.
 * NOTE(review): a non-zero ->steal() result presumably means the page
 * may not be stolen - confirm against the pipe_buf_operations contract.
 */
static int fuse_dev_pipe_buf_steal(struct pipe_inode_info *pipe,
				   struct pipe_buffer *buf)
{
	return 1;
}
1135
1136static const struct pipe_buf_operations fuse_dev_pipe_buf_ops = {
1137 .can_merge = 0,
1138 .map = generic_pipe_buf_map,
1139 .unmap = generic_pipe_buf_unmap,
1140 .confirm = generic_pipe_buf_confirm,
1141 .release = generic_pipe_buf_release,
1142 .steal = fuse_dev_pipe_buf_steal,
1143 .get = generic_pipe_buf_get,
1144};
1145
1146static ssize_t fuse_dev_splice_read(struct file *in, loff_t *ppos,
1147 struct pipe_inode_info *pipe,
1148 size_t len, unsigned int flags)
1149{
1150 int ret;
1151 int page_nr = 0;
1152 int do_wakeup = 0;
1153 struct pipe_buffer *bufs;
1154 struct fuse_copy_state cs;
1155 struct fuse_conn *fc = fuse_get_conn(in);
1156 if (!fc)
1157 return -EPERM;
1158
Miklos Szeredi07e77dc2010-12-07 20:16:56 +01001159 bufs = kmalloc(pipe->buffers * sizeof(struct pipe_buffer), GFP_KERNEL);
Miklos Szeredic3021622010-05-25 15:06:07 +02001160 if (!bufs)
1161 return -ENOMEM;
1162
1163 fuse_copy_init(&cs, fc, 1, NULL, 0);
1164 cs.pipebufs = bufs;
1165 cs.pipe = pipe;
1166 ret = fuse_dev_do_read(fc, in, &cs, len);
1167 if (ret < 0)
1168 goto out;
1169
1170 ret = 0;
1171 pipe_lock(pipe);
1172
1173 if (!pipe->readers) {
1174 send_sig(SIGPIPE, current, 0);
1175 if (!ret)
1176 ret = -EPIPE;
1177 goto out_unlock;
1178 }
1179
1180 if (pipe->nrbufs + cs.nr_segs > pipe->buffers) {
1181 ret = -EIO;
1182 goto out_unlock;
1183 }
1184
1185 while (page_nr < cs.nr_segs) {
1186 int newbuf = (pipe->curbuf + pipe->nrbufs) & (pipe->buffers - 1);
1187 struct pipe_buffer *buf = pipe->bufs + newbuf;
1188
1189 buf->page = bufs[page_nr].page;
1190 buf->offset = bufs[page_nr].offset;
1191 buf->len = bufs[page_nr].len;
1192 buf->ops = &fuse_dev_pipe_buf_ops;
1193
1194 pipe->nrbufs++;
1195 page_nr++;
1196 ret += buf->len;
1197
1198 if (pipe->inode)
1199 do_wakeup = 1;
1200 }
1201
1202out_unlock:
1203 pipe_unlock(pipe);
1204
1205 if (do_wakeup) {
1206 smp_mb();
1207 if (waitqueue_active(&pipe->wait))
1208 wake_up_interruptible(&pipe->wait);
1209 kill_fasync(&pipe->fasync_readers, SIGIO, POLL_IN);
1210 }
1211
1212out:
1213 for (; page_nr < cs.nr_segs; page_nr++)
1214 page_cache_release(bufs[page_nr].page);
1215
1216 kfree(bufs);
1217 return ret;
1218}
1219
Tejun Heo95668a62008-11-26 12:03:55 +01001220static int fuse_notify_poll(struct fuse_conn *fc, unsigned int size,
1221 struct fuse_copy_state *cs)
1222{
1223 struct fuse_notify_poll_wakeup_out outarg;
Miklos Szeredif6d47a12009-01-26 15:00:59 +01001224 int err = -EINVAL;
Tejun Heo95668a62008-11-26 12:03:55 +01001225
1226 if (size != sizeof(outarg))
Miklos Szeredif6d47a12009-01-26 15:00:59 +01001227 goto err;
Tejun Heo95668a62008-11-26 12:03:55 +01001228
1229 err = fuse_copy_one(cs, &outarg, sizeof(outarg));
1230 if (err)
Miklos Szeredif6d47a12009-01-26 15:00:59 +01001231 goto err;
Tejun Heo95668a62008-11-26 12:03:55 +01001232
Miklos Szeredif6d47a12009-01-26 15:00:59 +01001233 fuse_copy_finish(cs);
Tejun Heo95668a62008-11-26 12:03:55 +01001234 return fuse_notify_poll_wakeup(fc, &outarg);
Miklos Szeredif6d47a12009-01-26 15:00:59 +01001235
1236err:
1237 fuse_copy_finish(cs);
1238 return err;
Tejun Heo95668a62008-11-26 12:03:55 +01001239}
1240
John Muir3b463ae2009-05-31 11:13:57 -04001241static int fuse_notify_inval_inode(struct fuse_conn *fc, unsigned int size,
1242 struct fuse_copy_state *cs)
1243{
1244 struct fuse_notify_inval_inode_out outarg;
1245 int err = -EINVAL;
1246
1247 if (size != sizeof(outarg))
1248 goto err;
1249
1250 err = fuse_copy_one(cs, &outarg, sizeof(outarg));
1251 if (err)
1252 goto err;
1253 fuse_copy_finish(cs);
1254
1255 down_read(&fc->killsb);
1256 err = -ENOENT;
Miklos Szeredib21dda42010-02-05 12:08:31 +01001257 if (fc->sb) {
1258 err = fuse_reverse_inval_inode(fc->sb, outarg.ino,
1259 outarg.off, outarg.len);
1260 }
John Muir3b463ae2009-05-31 11:13:57 -04001261 up_read(&fc->killsb);
1262 return err;
1263
1264err:
1265 fuse_copy_finish(cs);
1266 return err;
1267}
1268
1269static int fuse_notify_inval_entry(struct fuse_conn *fc, unsigned int size,
1270 struct fuse_copy_state *cs)
1271{
1272 struct fuse_notify_inval_entry_out outarg;
Fang Wenqib2d82ee2009-12-30 18:37:13 +08001273 int err = -ENOMEM;
1274 char *buf;
John Muir3b463ae2009-05-31 11:13:57 -04001275 struct qstr name;
1276
Fang Wenqib2d82ee2009-12-30 18:37:13 +08001277 buf = kzalloc(FUSE_NAME_MAX + 1, GFP_KERNEL);
1278 if (!buf)
1279 goto err;
1280
1281 err = -EINVAL;
John Muir3b463ae2009-05-31 11:13:57 -04001282 if (size < sizeof(outarg))
1283 goto err;
1284
1285 err = fuse_copy_one(cs, &outarg, sizeof(outarg));
1286 if (err)
1287 goto err;
1288
1289 err = -ENAMETOOLONG;
1290 if (outarg.namelen > FUSE_NAME_MAX)
1291 goto err;
1292
1293 name.name = buf;
1294 name.len = outarg.namelen;
1295 err = fuse_copy_one(cs, buf, outarg.namelen + 1);
1296 if (err)
1297 goto err;
1298 fuse_copy_finish(cs);
1299 buf[outarg.namelen] = 0;
1300 name.hash = full_name_hash(name.name, name.len);
1301
1302 down_read(&fc->killsb);
1303 err = -ENOENT;
Miklos Szeredib21dda42010-02-05 12:08:31 +01001304 if (fc->sb)
1305 err = fuse_reverse_inval_entry(fc->sb, outarg.parent, &name);
John Muir3b463ae2009-05-31 11:13:57 -04001306 up_read(&fc->killsb);
Fang Wenqib2d82ee2009-12-30 18:37:13 +08001307 kfree(buf);
John Muir3b463ae2009-05-31 11:13:57 -04001308 return err;
1309
1310err:
Fang Wenqib2d82ee2009-12-30 18:37:13 +08001311 kfree(buf);
John Muir3b463ae2009-05-31 11:13:57 -04001312 fuse_copy_finish(cs);
1313 return err;
1314}
1315
Miklos Szeredia1d75f22010-07-12 14:41:40 +02001316static int fuse_notify_store(struct fuse_conn *fc, unsigned int size,
1317 struct fuse_copy_state *cs)
1318{
1319 struct fuse_notify_store_out outarg;
1320 struct inode *inode;
1321 struct address_space *mapping;
1322 u64 nodeid;
1323 int err;
1324 pgoff_t index;
1325 unsigned int offset;
1326 unsigned int num;
1327 loff_t file_size;
1328 loff_t end;
1329
1330 err = -EINVAL;
1331 if (size < sizeof(outarg))
1332 goto out_finish;
1333
1334 err = fuse_copy_one(cs, &outarg, sizeof(outarg));
1335 if (err)
1336 goto out_finish;
1337
1338 err = -EINVAL;
1339 if (size - sizeof(outarg) != outarg.size)
1340 goto out_finish;
1341
1342 nodeid = outarg.nodeid;
1343
1344 down_read(&fc->killsb);
1345
1346 err = -ENOENT;
1347 if (!fc->sb)
1348 goto out_up_killsb;
1349
1350 inode = ilookup5(fc->sb, nodeid, fuse_inode_eq, &nodeid);
1351 if (!inode)
1352 goto out_up_killsb;
1353
1354 mapping = inode->i_mapping;
1355 index = outarg.offset >> PAGE_CACHE_SHIFT;
1356 offset = outarg.offset & ~PAGE_CACHE_MASK;
1357 file_size = i_size_read(inode);
1358 end = outarg.offset + outarg.size;
1359 if (end > file_size) {
1360 file_size = end;
1361 fuse_write_update_size(inode, file_size);
1362 }
1363
1364 num = outarg.size;
1365 while (num) {
1366 struct page *page;
1367 unsigned int this_num;
1368
1369 err = -ENOMEM;
1370 page = find_or_create_page(mapping, index,
1371 mapping_gfp_mask(mapping));
1372 if (!page)
1373 goto out_iput;
1374
1375 this_num = min_t(unsigned, num, PAGE_CACHE_SIZE - offset);
1376 err = fuse_copy_page(cs, &page, offset, this_num, 0);
1377 if (!err && offset == 0 && (num != 0 || file_size == end))
1378 SetPageUptodate(page);
1379 unlock_page(page);
1380 page_cache_release(page);
1381
1382 if (err)
1383 goto out_iput;
1384
1385 num -= this_num;
1386 offset = 0;
1387 index++;
1388 }
1389
1390 err = 0;
1391
1392out_iput:
1393 iput(inode);
1394out_up_killsb:
1395 up_read(&fc->killsb);
1396out_finish:
1397 fuse_copy_finish(cs);
1398 return err;
1399}
1400
Miklos Szeredi2d45ba32010-07-12 14:41:40 +02001401static void fuse_retrieve_end(struct fuse_conn *fc, struct fuse_req *req)
1402{
Miklos Szeredi0be85572010-10-27 15:34:46 -07001403 release_pages(req->pages, req->num_pages, 0);
Miklos Szeredi2d45ba32010-07-12 14:41:40 +02001404}
1405
1406static int fuse_retrieve(struct fuse_conn *fc, struct inode *inode,
1407 struct fuse_notify_retrieve_out *outarg)
1408{
1409 int err;
1410 struct address_space *mapping = inode->i_mapping;
1411 struct fuse_req *req;
1412 pgoff_t index;
1413 loff_t file_size;
1414 unsigned int num;
1415 unsigned int offset;
Geert Uytterhoeven01574432010-09-30 22:06:21 +02001416 size_t total_len = 0;
Miklos Szeredi2d45ba32010-07-12 14:41:40 +02001417
1418 req = fuse_get_req(fc);
1419 if (IS_ERR(req))
1420 return PTR_ERR(req);
1421
1422 offset = outarg->offset & ~PAGE_CACHE_MASK;
1423
1424 req->in.h.opcode = FUSE_NOTIFY_REPLY;
1425 req->in.h.nodeid = outarg->nodeid;
1426 req->in.numargs = 2;
1427 req->in.argpages = 1;
1428 req->page_offset = offset;
1429 req->end = fuse_retrieve_end;
1430
1431 index = outarg->offset >> PAGE_CACHE_SHIFT;
1432 file_size = i_size_read(inode);
1433 num = outarg->size;
1434 if (outarg->offset > file_size)
1435 num = 0;
1436 else if (outarg->offset + num > file_size)
1437 num = file_size - outarg->offset;
1438
1439 while (num) {
1440 struct page *page;
1441 unsigned int this_num;
1442
1443 page = find_get_page(mapping, index);
1444 if (!page)
1445 break;
1446
1447 this_num = min_t(unsigned, num, PAGE_CACHE_SIZE - offset);
1448 req->pages[req->num_pages] = page;
1449 req->num_pages++;
1450
1451 num -= this_num;
1452 total_len += this_num;
1453 }
1454 req->misc.retrieve_in.offset = outarg->offset;
1455 req->misc.retrieve_in.size = total_len;
1456 req->in.args[0].size = sizeof(req->misc.retrieve_in);
1457 req->in.args[0].value = &req->misc.retrieve_in;
1458 req->in.args[1].size = total_len;
1459
1460 err = fuse_request_send_notify_reply(fc, req, outarg->notify_unique);
1461 if (err)
1462 fuse_retrieve_end(fc, req);
1463
1464 return err;
1465}
1466
1467static int fuse_notify_retrieve(struct fuse_conn *fc, unsigned int size,
1468 struct fuse_copy_state *cs)
1469{
1470 struct fuse_notify_retrieve_out outarg;
1471 struct inode *inode;
1472 int err;
1473
1474 err = -EINVAL;
1475 if (size != sizeof(outarg))
1476 goto copy_finish;
1477
1478 err = fuse_copy_one(cs, &outarg, sizeof(outarg));
1479 if (err)
1480 goto copy_finish;
1481
1482 fuse_copy_finish(cs);
1483
1484 down_read(&fc->killsb);
1485 err = -ENOENT;
1486 if (fc->sb) {
1487 u64 nodeid = outarg.nodeid;
1488
1489 inode = ilookup5(fc->sb, nodeid, fuse_inode_eq, &nodeid);
1490 if (inode) {
1491 err = fuse_retrieve(fc, inode, &outarg);
1492 iput(inode);
1493 }
1494 }
1495 up_read(&fc->killsb);
1496
1497 return err;
1498
1499copy_finish:
1500 fuse_copy_finish(cs);
1501 return err;
1502}
1503
Tejun Heo85993962008-11-26 12:03:55 +01001504static int fuse_notify(struct fuse_conn *fc, enum fuse_notify_code code,
1505 unsigned int size, struct fuse_copy_state *cs)
1506{
1507 switch (code) {
Tejun Heo95668a62008-11-26 12:03:55 +01001508 case FUSE_NOTIFY_POLL:
1509 return fuse_notify_poll(fc, size, cs);
1510
John Muir3b463ae2009-05-31 11:13:57 -04001511 case FUSE_NOTIFY_INVAL_INODE:
1512 return fuse_notify_inval_inode(fc, size, cs);
1513
1514 case FUSE_NOTIFY_INVAL_ENTRY:
1515 return fuse_notify_inval_entry(fc, size, cs);
1516
Miklos Szeredia1d75f22010-07-12 14:41:40 +02001517 case FUSE_NOTIFY_STORE:
1518 return fuse_notify_store(fc, size, cs);
1519
Miklos Szeredi2d45ba32010-07-12 14:41:40 +02001520 case FUSE_NOTIFY_RETRIEVE:
1521 return fuse_notify_retrieve(fc, size, cs);
1522
Tejun Heo85993962008-11-26 12:03:55 +01001523 default:
Miklos Szeredif6d47a12009-01-26 15:00:59 +01001524 fuse_copy_finish(cs);
Tejun Heo85993962008-11-26 12:03:55 +01001525 return -EINVAL;
1526 }
1527}
1528
Miklos Szeredi334f4852005-09-09 13:10:27 -07001529/* Look up request on processing list by unique ID */
1530static struct fuse_req *request_find(struct fuse_conn *fc, u64 unique)
1531{
1532 struct list_head *entry;
1533
1534 list_for_each(entry, &fc->processing) {
1535 struct fuse_req *req;
1536 req = list_entry(entry, struct fuse_req, list);
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001537 if (req->in.h.unique == unique || req->intr_unique == unique)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001538 return req;
1539 }
1540 return NULL;
1541}
1542
1543static int copy_out_args(struct fuse_copy_state *cs, struct fuse_out *out,
1544 unsigned nbytes)
1545{
1546 unsigned reqsize = sizeof(struct fuse_out_header);
1547
1548 if (out->h.error)
1549 return nbytes != reqsize ? -EINVAL : 0;
1550
1551 reqsize += len_args(out->numargs, out->args);
1552
1553 if (reqsize < nbytes || (reqsize > nbytes && !out->argvar))
1554 return -EINVAL;
1555 else if (reqsize > nbytes) {
1556 struct fuse_arg *lastarg = &out->args[out->numargs-1];
1557 unsigned diffsize = reqsize - nbytes;
1558 if (diffsize > lastarg->size)
1559 return -EINVAL;
1560 lastarg->size -= diffsize;
1561 }
1562 return fuse_copy_args(cs, out->numargs, out->argpages, out->args,
1563 out->page_zeroing);
1564}
1565
1566/*
1567 * Write a single reply to a request. First the header is copied from
1568 * the write buffer. The request is then searched on the processing
1569 * list by the unique ID found in the header. If found, then remove
1570 * it from the list and copy the rest of the buffer to the request.
1571 * The request is finished by calling request_end()
1572 */
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001573static ssize_t fuse_dev_do_write(struct fuse_conn *fc,
1574 struct fuse_copy_state *cs, size_t nbytes)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001575{
1576 int err;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001577 struct fuse_req *req;
1578 struct fuse_out_header oh;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001579
Miklos Szeredi334f4852005-09-09 13:10:27 -07001580 if (nbytes < sizeof(struct fuse_out_header))
1581 return -EINVAL;
1582
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001583 err = fuse_copy_one(cs, &oh, sizeof(oh));
Miklos Szeredi334f4852005-09-09 13:10:27 -07001584 if (err)
1585 goto err_finish;
Tejun Heo85993962008-11-26 12:03:55 +01001586
Miklos Szeredi334f4852005-09-09 13:10:27 -07001587 err = -EINVAL;
Tejun Heo85993962008-11-26 12:03:55 +01001588 if (oh.len != nbytes)
1589 goto err_finish;
1590
1591 /*
1592 * Zero oh.unique indicates unsolicited notification message
1593 * and error contains notification code.
1594 */
1595 if (!oh.unique) {
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001596 err = fuse_notify(fc, oh.error, nbytes - sizeof(oh), cs);
Tejun Heo85993962008-11-26 12:03:55 +01001597 return err ? err : nbytes;
1598 }
1599
1600 err = -EINVAL;
1601 if (oh.error <= -1000 || oh.error > 0)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001602 goto err_finish;
1603
Miklos Szeredid7133112006-04-10 22:54:55 -07001604 spin_lock(&fc->lock);
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001605 err = -ENOENT;
1606 if (!fc->connected)
1607 goto err_unlock;
1608
Miklos Szeredi334f4852005-09-09 13:10:27 -07001609 req = request_find(fc, oh.unique);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001610 if (!req)
1611 goto err_unlock;
1612
Miklos Szeredif9a28422006-06-25 05:48:53 -07001613 if (req->aborted) {
Miklos Szeredid7133112006-04-10 22:54:55 -07001614 spin_unlock(&fc->lock);
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001615 fuse_copy_finish(cs);
Miklos Szeredid7133112006-04-10 22:54:55 -07001616 spin_lock(&fc->lock);
Miklos Szeredi222f1d62006-01-16 22:14:25 -08001617 request_end(fc, req);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001618 return -ENOENT;
1619 }
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001620 /* Is it an interrupt reply? */
1621 if (req->intr_unique == oh.unique) {
1622 err = -EINVAL;
1623 if (nbytes != sizeof(struct fuse_out_header))
1624 goto err_unlock;
1625
1626 if (oh.error == -ENOSYS)
1627 fc->no_interrupt = 1;
1628 else if (oh.error == -EAGAIN)
1629 queue_interrupt(fc, req);
1630
1631 spin_unlock(&fc->lock);
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001632 fuse_copy_finish(cs);
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001633 return nbytes;
1634 }
1635
1636 req->state = FUSE_REQ_WRITING;
Miklos Szeredid77a1d52006-01-16 22:14:31 -08001637 list_move(&req->list, &fc->io);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001638 req->out.h = oh;
1639 req->locked = 1;
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001640 cs->req = req;
Miklos Szeredice534fb2010-05-25 15:06:07 +02001641 if (!req->out.page_replace)
1642 cs->move_pages = 0;
Miklos Szeredid7133112006-04-10 22:54:55 -07001643 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001644
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001645 err = copy_out_args(cs, &req->out, nbytes);
1646 fuse_copy_finish(cs);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001647
Miklos Szeredid7133112006-04-10 22:54:55 -07001648 spin_lock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001649 req->locked = 0;
1650 if (!err) {
Miklos Szeredif9a28422006-06-25 05:48:53 -07001651 if (req->aborted)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001652 err = -ENOENT;
Miklos Szeredif9a28422006-06-25 05:48:53 -07001653 } else if (!req->aborted)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001654 req->out.h.error = -EIO;
1655 request_end(fc, req);
1656
1657 return err ? err : nbytes;
1658
1659 err_unlock:
Miklos Szeredid7133112006-04-10 22:54:55 -07001660 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001661 err_finish:
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001662 fuse_copy_finish(cs);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001663 return err;
1664}
1665
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001666static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
1667 unsigned long nr_segs, loff_t pos)
1668{
1669 struct fuse_copy_state cs;
1670 struct fuse_conn *fc = fuse_get_conn(iocb->ki_filp);
1671 if (!fc)
1672 return -EPERM;
1673
Miklos Szeredic3021622010-05-25 15:06:07 +02001674 fuse_copy_init(&cs, fc, 0, iov, nr_segs);
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001675
1676 return fuse_dev_do_write(fc, &cs, iov_length(iov, nr_segs));
1677}
1678
1679static ssize_t fuse_dev_splice_write(struct pipe_inode_info *pipe,
1680 struct file *out, loff_t *ppos,
1681 size_t len, unsigned int flags)
1682{
1683 unsigned nbuf;
1684 unsigned idx;
1685 struct pipe_buffer *bufs;
1686 struct fuse_copy_state cs;
1687 struct fuse_conn *fc;
1688 size_t rem;
1689 ssize_t ret;
1690
1691 fc = fuse_get_conn(out);
1692 if (!fc)
1693 return -EPERM;
1694
Miklos Szeredi07e77dc2010-12-07 20:16:56 +01001695 bufs = kmalloc(pipe->buffers * sizeof(struct pipe_buffer), GFP_KERNEL);
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001696 if (!bufs)
1697 return -ENOMEM;
1698
1699 pipe_lock(pipe);
1700 nbuf = 0;
1701 rem = 0;
1702 for (idx = 0; idx < pipe->nrbufs && rem < len; idx++)
1703 rem += pipe->bufs[(pipe->curbuf + idx) & (pipe->buffers - 1)].len;
1704
1705 ret = -EINVAL;
1706 if (rem < len) {
1707 pipe_unlock(pipe);
1708 goto out;
1709 }
1710
1711 rem = len;
1712 while (rem) {
1713 struct pipe_buffer *ibuf;
1714 struct pipe_buffer *obuf;
1715
1716 BUG_ON(nbuf >= pipe->buffers);
1717 BUG_ON(!pipe->nrbufs);
1718 ibuf = &pipe->bufs[pipe->curbuf];
1719 obuf = &bufs[nbuf];
1720
1721 if (rem >= ibuf->len) {
1722 *obuf = *ibuf;
1723 ibuf->ops = NULL;
1724 pipe->curbuf = (pipe->curbuf + 1) & (pipe->buffers - 1);
1725 pipe->nrbufs--;
1726 } else {
1727 ibuf->ops->get(pipe, ibuf);
1728 *obuf = *ibuf;
1729 obuf->flags &= ~PIPE_BUF_FLAG_GIFT;
1730 obuf->len = rem;
1731 ibuf->offset += obuf->len;
1732 ibuf->len -= obuf->len;
1733 }
1734 nbuf++;
1735 rem -= obuf->len;
1736 }
1737 pipe_unlock(pipe);
1738
Miklos Szeredic3021622010-05-25 15:06:07 +02001739 fuse_copy_init(&cs, fc, 0, NULL, nbuf);
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001740 cs.pipebufs = bufs;
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001741 cs.pipe = pipe;
1742
Miklos Szeredice534fb2010-05-25 15:06:07 +02001743 if (flags & SPLICE_F_MOVE)
1744 cs.move_pages = 1;
1745
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001746 ret = fuse_dev_do_write(fc, &cs, len);
1747
1748 for (idx = 0; idx < nbuf; idx++) {
1749 struct pipe_buffer *buf = &bufs[idx];
1750 buf->ops->release(pipe, buf);
1751 }
1752out:
1753 kfree(bufs);
1754 return ret;
1755}
1756
Miklos Szeredi334f4852005-09-09 13:10:27 -07001757static unsigned fuse_dev_poll(struct file *file, poll_table *wait)
1758{
Miklos Szeredi334f4852005-09-09 13:10:27 -07001759 unsigned mask = POLLOUT | POLLWRNORM;
Miklos Szeredi7025d9a2006-04-10 22:54:50 -07001760 struct fuse_conn *fc = fuse_get_conn(file);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001761 if (!fc)
Miklos Szeredi7025d9a2006-04-10 22:54:50 -07001762 return POLLERR;
Miklos Szeredi334f4852005-09-09 13:10:27 -07001763
1764 poll_wait(file, &fc->waitq, wait);
1765
Miklos Szeredid7133112006-04-10 22:54:55 -07001766 spin_lock(&fc->lock);
Miklos Szeredi7025d9a2006-04-10 22:54:50 -07001767 if (!fc->connected)
1768 mask = POLLERR;
Miklos Szeredia4d27e72006-06-25 05:48:54 -07001769 else if (request_pending(fc))
Miklos Szeredi7025d9a2006-04-10 22:54:50 -07001770 mask |= POLLIN | POLLRDNORM;
Miklos Szeredid7133112006-04-10 22:54:55 -07001771 spin_unlock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001772
1773 return mask;
1774}
1775
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001776/*
1777 * Abort all requests on the given list (pending or processing)
1778 *
Miklos Szeredid7133112006-04-10 22:54:55 -07001779 * This function releases and reacquires fc->lock
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001780 */
Miklos Szeredi334f4852005-09-09 13:10:27 -07001781static void end_requests(struct fuse_conn *fc, struct list_head *head)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +02001782__releases(fc->lock)
1783__acquires(fc->lock)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001784{
1785 while (!list_empty(head)) {
1786 struct fuse_req *req;
1787 req = list_entry(head->next, struct fuse_req, list);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001788 req->out.h.error = -ECONNABORTED;
1789 request_end(fc, req);
Miklos Szeredid7133112006-04-10 22:54:55 -07001790 spin_lock(&fc->lock);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001791 }
1792}
1793
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001794/*
1795 * Abort requests under I/O
1796 *
Miklos Szeredif9a28422006-06-25 05:48:53 -07001797 * The requests are set to aborted and finished, and the request
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001798 * waiter is woken up. This will make request_wait_answer() wait
1799 * until the request is unlocked and then return.
Miklos Szeredi64c6d8e2006-01-16 22:14:42 -08001800 *
1801 * If the request is asynchronous, then the end function needs to be
1802 * called after waiting for the request to be unlocked (if it was
1803 * locked).
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001804 */
1805static void end_io_requests(struct fuse_conn *fc)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +02001806__releases(fc->lock)
1807__acquires(fc->lock)
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001808{
1809 while (!list_empty(&fc->io)) {
Miklos Szeredi64c6d8e2006-01-16 22:14:42 -08001810 struct fuse_req *req =
1811 list_entry(fc->io.next, struct fuse_req, list);
1812 void (*end) (struct fuse_conn *, struct fuse_req *) = req->end;
1813
Miklos Szeredif9a28422006-06-25 05:48:53 -07001814 req->aborted = 1;
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001815 req->out.h.error = -ECONNABORTED;
1816 req->state = FUSE_REQ_FINISHED;
1817 list_del_init(&req->list);
1818 wake_up(&req->waitq);
Miklos Szeredi64c6d8e2006-01-16 22:14:42 -08001819 if (end) {
1820 req->end = NULL;
Miklos Szeredi64c6d8e2006-01-16 22:14:42 -08001821 __fuse_get_request(req);
Miklos Szeredid7133112006-04-10 22:54:55 -07001822 spin_unlock(&fc->lock);
Miklos Szeredi64c6d8e2006-01-16 22:14:42 -08001823 wait_event(req->waitq, !req->locked);
1824 end(fc, req);
Tejun Heoe9bb09d2008-11-26 12:03:54 +01001825 fuse_put_request(fc, req);
Miklos Szeredid7133112006-04-10 22:54:55 -07001826 spin_lock(&fc->lock);
Miklos Szeredi64c6d8e2006-01-16 22:14:42 -08001827 }
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001828 }
1829}
1830
Miklos Szeredi595afaf2010-09-07 13:42:41 +02001831static void end_queued_requests(struct fuse_conn *fc)
Miklos Szeredib9ca67b2010-09-07 13:42:41 +02001832__releases(fc->lock)
1833__acquires(fc->lock)
Miklos Szeredi595afaf2010-09-07 13:42:41 +02001834{
1835 fc->max_background = UINT_MAX;
1836 flush_bg_queue(fc);
1837 end_requests(fc, &fc->pending);
1838 end_requests(fc, &fc->processing);
Miklos Szeredi07e77dc2010-12-07 20:16:56 +01001839 while (forget_pending(fc))
1840 kfree(dequeue_forget(fc));
Miklos Szeredi595afaf2010-09-07 13:42:41 +02001841}
1842
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001843/*
1844 * Abort all requests.
1845 *
1846 * Emergency exit in case of a malicious or accidental deadlock, or
1847 * just a hung filesystem.
1848 *
1849 * The same effect is usually achievable through killing the
1850 * filesystem daemon and all users of the filesystem. The exception
1851 * is the combination of an asynchronous request and the tricky
1852 * deadlock (see Documentation/filesystems/fuse.txt).
1853 *
1854 * During the aborting, progression of requests from the pending and
1855 * processing lists onto the io list, and progression of new requests
1856 * onto the pending list is prevented by req->connected being false.
1857 *
1858 * Progression of requests under I/O to the processing list is
Miklos Szeredif9a28422006-06-25 05:48:53 -07001859 * prevented by the req->aborted flag being true for these requests.
1860 * For this reason requests on the io list must be aborted first.
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001861 */
1862void fuse_abort_conn(struct fuse_conn *fc)
1863{
Miklos Szeredid7133112006-04-10 22:54:55 -07001864 spin_lock(&fc->lock);
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001865 if (fc->connected) {
1866 fc->connected = 0;
Miklos Szeredi51eb01e2006-06-25 05:48:50 -07001867 fc->blocked = 0;
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001868 end_io_requests(fc);
Miklos Szeredi595afaf2010-09-07 13:42:41 +02001869 end_queued_requests(fc);
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001870 wake_up_all(&fc->waitq);
Miklos Szeredi51eb01e2006-06-25 05:48:50 -07001871 wake_up_all(&fc->blocked_waitq);
Jeff Dike385a17b2006-04-10 22:54:52 -07001872 kill_fasync(&fc->fasync, SIGIO, POLL_IN);
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001873 }
Miklos Szeredid7133112006-04-10 22:54:55 -07001874 spin_unlock(&fc->lock);
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001875}
Tejun Heo08cbf542009-04-14 10:54:53 +09001876EXPORT_SYMBOL_GPL(fuse_abort_conn);
Miklos Szeredi69a53bf2006-01-16 22:14:41 -08001877
Tejun Heo08cbf542009-04-14 10:54:53 +09001878int fuse_dev_release(struct inode *inode, struct file *file)
Miklos Szeredi334f4852005-09-09 13:10:27 -07001879{
Miklos Szeredi0720b312006-04-10 22:54:55 -07001880 struct fuse_conn *fc = fuse_get_conn(file);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001881 if (fc) {
Miklos Szeredid7133112006-04-10 22:54:55 -07001882 spin_lock(&fc->lock);
Miklos Szeredi1e9a4ed2005-09-09 13:10:31 -07001883 fc->connected = 0;
Miklos Szeredi595afaf2010-09-07 13:42:41 +02001884 fc->blocked = 0;
1885 end_queued_requests(fc);
1886 wake_up_all(&fc->blocked_waitq);
Miklos Szeredid7133112006-04-10 22:54:55 -07001887 spin_unlock(&fc->lock);
Miklos Szeredibafa9652006-06-25 05:48:51 -07001888 fuse_conn_put(fc);
Jeff Dike385a17b2006-04-10 22:54:52 -07001889 }
Miklos Szeredif543f252006-01-16 22:14:35 -08001890
Miklos Szeredi334f4852005-09-09 13:10:27 -07001891 return 0;
1892}
Tejun Heo08cbf542009-04-14 10:54:53 +09001893EXPORT_SYMBOL_GPL(fuse_dev_release);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001894
Jeff Dike385a17b2006-04-10 22:54:52 -07001895static int fuse_dev_fasync(int fd, struct file *file, int on)
1896{
1897 struct fuse_conn *fc = fuse_get_conn(file);
1898 if (!fc)
Miklos Szeredia87046d2006-04-10 22:54:56 -07001899 return -EPERM;
Jeff Dike385a17b2006-04-10 22:54:52 -07001900
1901 /* No locking - fasync_helper does its own locking */
1902 return fasync_helper(fd, file, on, &fc->fasync);
1903}
1904
Arjan van de Ven4b6f5d22006-03-28 01:56:42 -08001905const struct file_operations fuse_dev_operations = {
Miklos Szeredi334f4852005-09-09 13:10:27 -07001906 .owner = THIS_MODULE,
1907 .llseek = no_llseek,
Badari Pulavartyee0b3e62006-09-30 23:28:47 -07001908 .read = do_sync_read,
1909 .aio_read = fuse_dev_read,
Miklos Szeredic3021622010-05-25 15:06:07 +02001910 .splice_read = fuse_dev_splice_read,
Badari Pulavartyee0b3e62006-09-30 23:28:47 -07001911 .write = do_sync_write,
1912 .aio_write = fuse_dev_write,
Miklos Szeredidd3bb142010-05-25 15:06:06 +02001913 .splice_write = fuse_dev_splice_write,
Miklos Szeredi334f4852005-09-09 13:10:27 -07001914 .poll = fuse_dev_poll,
1915 .release = fuse_dev_release,
Jeff Dike385a17b2006-04-10 22:54:52 -07001916 .fasync = fuse_dev_fasync,
Miklos Szeredi334f4852005-09-09 13:10:27 -07001917};
Tejun Heo08cbf542009-04-14 10:54:53 +09001918EXPORT_SYMBOL_GPL(fuse_dev_operations);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001919
1920static struct miscdevice fuse_miscdevice = {
1921 .minor = FUSE_MINOR,
1922 .name = "fuse",
1923 .fops = &fuse_dev_operations,
1924};
1925
1926int __init fuse_dev_init(void)
1927{
1928 int err = -ENOMEM;
1929 fuse_req_cachep = kmem_cache_create("fuse_request",
1930 sizeof(struct fuse_req),
Paul Mundt20c2df82007-07-20 10:11:58 +09001931 0, 0, NULL);
Miklos Szeredi334f4852005-09-09 13:10:27 -07001932 if (!fuse_req_cachep)
1933 goto out;
1934
1935 err = misc_register(&fuse_miscdevice);
1936 if (err)
1937 goto out_cache_clean;
1938
1939 return 0;
1940
1941 out_cache_clean:
1942 kmem_cache_destroy(fuse_req_cachep);
1943 out:
1944 return err;
1945}
1946
1947void fuse_dev_cleanup(void)
1948{
1949 misc_deregister(&fuse_miscdevice);
1950 kmem_cache_destroy(fuse_req_cachep);
1951}