Blame - fs/nfsd/vfs.c - kernel/msm-4.19

blob: f83ab4cf426503d4b6714035e8b5601817e960c7 [file] [log] [blame]

Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1	#define MSNFS /* HACK HACK */
				2	/*
				3	* linux/fs/nfsd/vfs.c
				4	*
				5	* File operations used by nfsd. Some of these have been ripped from
				6	* other parts of the kernel because they weren't exported, others
				7	* are partial duplicates with added or changed functionality.
				8	*
				9	* Note that several functions dget() the dentry upon which they want
				10	* to act, most notably those that create directory entries. Response
				11	* dentry's are dput()'d if necessary in the release callback.
				12	* So if you notice code paths that apparently fail to dput() the
				13	* dentry, don't worry--they have been taken care of.
				14	*
				15	* Copyright (C) 1995-1999 Olaf Kirch <okir@monad.swb.de>
				16	* Zerocpy NFS support (C) 2002 Hirokazu Takahashi <taka@valinux.co.jp>
				17	*/
				18
				19	#include <linux/config.h>
				20	#include <linux/string.h>
				21	#include <linux/time.h>
				22	#include <linux/errno.h>
				23	#include <linux/fs.h>
				24	#include <linux/file.h>
				25	#include <linux/mount.h>
				26	#include <linux/major.h>
				27	#include <linux/ext2_fs.h>
				28	#include <linux/proc_fs.h>
				29	#include <linux/stat.h>
				30	#include <linux/fcntl.h>
				31	#include <linux/net.h>
				32	#include <linux/unistd.h>
				33	#include <linux/slab.h>
				34	#include <linux/pagemap.h>
				35	#include <linux/in.h>
				36	#include <linux/module.h>
				37	#include <linux/namei.h>
				38	#include <linux/vfs.h>
				39	#include <linux/delay.h>
				40	#include <linux/sunrpc/svc.h>
				41	#include <linux/nfsd/nfsd.h>
				42	#ifdef CONFIG_NFSD_V3
				43	#include <linux/nfs3.h>
				44	#include <linux/nfsd/xdr3.h>
				45	#endif /* CONFIG_NFSD_V3 */
				46	#include <linux/nfsd/nfsfh.h>
				47	#include <linux/quotaops.h>
Robert Love	0eeca28	2005-07-12 17:06:03 -0400	[diff] [blame]	48	#include <linux/fsnotify.h>
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	49	#include <linux/posix_acl.h>
				50	#include <linux/posix_acl_xattr.h>
Christoph Hellwig	334a13e	2005-06-28 20:44:58 -0700	[diff] [blame]	51	#ifdef CONFIG_NFSD_V4
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	52	#include <linux/xattr.h>
				53	#include <linux/nfs4.h>
				54	#include <linux/nfs4_acl.h>
				55	#include <linux/nfsd_idmap.h>
				56	#include <linux/security.h>
				57	#endif /* CONFIG_NFSD_V4 */
				58
				59	#include <asm/uaccess.h>
				60
				61	#define NFSDDBG_FACILITY NFSDDBG_FILEOP
				62	#define NFSD_PARANOIA
				63
				64
				65	/* We must ignore files (but only files) which might have mandatory
				66	* locks on them because there is no way to know if the accesser has
				67	* the lock.
				68	*/
				69	#define IS_ISMNDLK(i) (S_ISREG((i)->i_mode) && MANDATORY_LOCK(i))
				70
				71	/*
				72	* This is a cache of readahead params that help us choose the proper
				73	* readahead strategy. Initially, we set all readahead parameters to 0
				74	* and let the VFS handle things.
				75	* If you increase the number of cached files very much, you'll need to
				76	* add a hash table here.
				77	*/
				78	struct raparms {
				79	struct raparms *p_next;
				80	unsigned int p_count;
				81	ino_t p_ino;
				82	dev_t p_dev;
				83	int p_set;
				84	struct file_ra_state p_ra;
				85	};
				86
				87	static struct raparms * raparml;
				88	static struct raparms * raparm_cache;
				89
				90	/*
				91	* Called from nfsd_lookup and encode_dirent. Check if we have crossed
				92	* a mount point.
				93	* Returns -EAGAIN leaving dpp and expp unchanged,
				94	* or nfs_ok having possibly changed dpp and expp
				95	*/
				96	int
				97	nfsd_cross_mnt(struct svc_rqst rqstp, struct dentry *dpp,
				98	struct svc_export **expp)
				99	{
				100	struct svc_export exp = expp, *exp2 = NULL;
				101	struct dentry dentry = dpp;
				102	struct vfsmount *mnt = mntget(exp->ex_mnt);
				103	struct dentry *mounts = dget(dentry);
				104	int err = nfs_ok;
				105
				106	while (follow_down(&mnt,&mounts)&&d_mountpoint(mounts));
				107
				108	exp2 = exp_get_by_name(exp->ex_client, mnt, mounts, &rqstp->rq_chandle);
				109	if (IS_ERR(exp2)) {
				110	err = PTR_ERR(exp2);
				111	dput(mounts);
				112	mntput(mnt);
				113	goto out;
				114	}
				115	if (exp2 && ((exp->ex_flags & NFSEXP_CROSSMOUNT) \|\| EX_NOHIDE(exp2))) {
				116	/* successfully crossed mount point */
				117	exp_put(exp);
				118	*expp = exp2;
				119	dput(dentry);
				120	*dpp = mounts;
				121	} else {
				122	if (exp2) exp_put(exp2);
				123	dput(mounts);
				124	}
				125	mntput(mnt);
				126	out:
				127	return err;
				128	}
				129
				130	/*
				131	* Look up one component of a pathname.
				132	* N.B. After this call _both_ fhp and resfh need an fh_put
				133	*
				134	* If the lookup would cross a mountpoint, and the mounted filesystem
				135	* is exported to the client with NFSEXP_NOHIDE, then the lookup is
				136	* accepted as it stands and the mounted directory is
				137	* returned. Otherwise the covered directory is returned.
				138	* NOTE: this mountpoint crossing is not supported properly by all
				139	* clients and is explicitly disallowed for NFSv3
				140	* NeilBrown <neilb@cse.unsw.edu.au>
				141	*/
				142	int
				143	nfsd_lookup(struct svc_rqst rqstp, struct svc_fh fhp, const char *name,
				144	int len, struct svc_fh *resfh)
				145	{
				146	struct svc_export *exp;
				147	struct dentry *dparent;
				148	struct dentry *dentry;
				149	int err;
				150
				151	dprintk("nfsd: nfsd_lookup(fh %s, %.*s)\n", SVCFH_fmt(fhp), len,name);
				152
				153	/* Obtain dentry and export. */
				154	err = fh_verify(rqstp, fhp, S_IFDIR, MAY_EXEC);
				155	if (err)
				156	return err;
				157
				158	dparent = fhp->fh_dentry;
				159	exp = fhp->fh_export;
				160	exp_get(exp);
				161
				162	err = nfserr_acces;
				163
				164	/* Lookup the name, but don't follow links */
				165	if (isdotent(name, len)) {
				166	if (len==1)
				167	dentry = dget(dparent);
				168	else if (dparent != exp->ex_dentry) {
				169	dentry = dget_parent(dparent);
				170	} else if (!EX_NOHIDE(exp))
				171	dentry = dget(dparent); /* .. == . just like at / */
				172	else {
				173	/* checking mountpoint crossing is very different when stepping up */
				174	struct svc_export *exp2 = NULL;
				175	struct dentry *dp;
				176	struct vfsmount *mnt = mntget(exp->ex_mnt);
				177	dentry = dget(dparent);
				178	while(dentry == mnt->mnt_root && follow_up(&mnt, &dentry))
				179	;
				180	dp = dget_parent(dentry);
				181	dput(dentry);
				182	dentry = dp;
				183
				184	exp2 = exp_parent(exp->ex_client, mnt, dentry,
				185	&rqstp->rq_chandle);
				186	if (IS_ERR(exp2)) {
				187	err = PTR_ERR(exp2);
				188	dput(dentry);
				189	mntput(mnt);
				190	goto out_nfserr;
				191	}
				192	if (!exp2) {
				193	dput(dentry);
				194	dentry = dget(dparent);
				195	} else {
				196	exp_put(exp);
				197	exp = exp2;
				198	}
				199	mntput(mnt);
				200	}
				201	} else {
				202	fh_lock(fhp);
				203	dentry = lookup_one_len(name, dparent, len);
				204	err = PTR_ERR(dentry);
				205	if (IS_ERR(dentry))
				206	goto out_nfserr;
				207	/*
				208	* check if we have crossed a mount point ...
				209	*/
				210	if (d_mountpoint(dentry)) {
				211	if ((err = nfsd_cross_mnt(rqstp, &dentry, &exp))) {
				212	dput(dentry);
				213	goto out_nfserr;
				214	}
				215	}
				216	}
				217	/*
				218	* Note: we compose the file handle now, but as the
				219	* dentry may be negative, it may need to be updated.
				220	*/
				221	err = fh_compose(resfh, exp, dentry, fhp);
				222	if (!err && !dentry->d_inode)
				223	err = nfserr_noent;
				224	dput(dentry);
				225	out:
				226	exp_put(exp);
				227	return err;
				228
				229	out_nfserr:
				230	err = nfserrno(err);
				231	goto out;
				232	}
				233
				234	/*
				235	* Set various file attributes.
				236	* N.B. After this call fhp needs an fh_put
				237	*/
				238	int
				239	nfsd_setattr(struct svc_rqst rqstp, struct svc_fh fhp, struct iattr *iap,
				240	int check_guard, time_t guardtime)
				241	{
				242	struct dentry *dentry;
				243	struct inode *inode;
				244	int accmode = MAY_SATTR;
				245	int ftype = 0;
				246	int imode;
				247	int err;
				248	int size_change = 0;
				249
				250	if (iap->ia_valid & (ATTR_ATIME \| ATTR_MTIME \| ATTR_SIZE))
				251	accmode \|= MAY_WRITE\|MAY_OWNER_OVERRIDE;
				252	if (iap->ia_valid & ATTR_SIZE)
				253	ftype = S_IFREG;
				254
				255	/* Get inode */
				256	err = fh_verify(rqstp, fhp, ftype, accmode);
NeilBrown	15b7a1b	2005-11-07 01:00:23 -0800	[diff] [blame]	257	if (err)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	258	goto out;
				259
				260	dentry = fhp->fh_dentry;
				261	inode = dentry->d_inode;
				262
NeilBrown	15b7a1b	2005-11-07 01:00:23 -0800	[diff] [blame]	263	/* Ignore any mode updates on symlinks */
				264	if (S_ISLNK(inode->i_mode))
				265	iap->ia_valid &= ~ATTR_MODE;
				266
				267	if (!iap->ia_valid)
				268	goto out;
				269
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	270	/* NFSv2 does not differentiate between "set-[ac]time-to-now"
				271	* which only requires access, and "set-[ac]time-to-X" which
				272	* requires ownership.
				273	* So if it looks like it might be "set both to the same time which
				274	* is close to now", and if inode_change_ok fails, then we
				275	* convert to "set to now" instead of "set to explicit time"
				276	*
				277	* We only call inode_change_ok as the last test as technically
				278	* it is not an interface that we should be using. It is only
				279	* valid if the filesystem does not define it's own i_op->setattr.
				280	*/
				281	#define BOTH_TIME_SET (ATTR_ATIME_SET \| ATTR_MTIME_SET)
				282	#define MAX_TOUCH_TIME_ERROR (30*60)
				283	if ((iap->ia_valid & BOTH_TIME_SET) == BOTH_TIME_SET
				284	&& iap->ia_mtime.tv_sec == iap->ia_atime.tv_sec
				285	) {
				286	/* Looks probable. Now just make sure time is in the right ballpark.
				287	* Solaris, at least, doesn't seem to care what the time request is.
				288	* We require it be within 30 minutes of now.
				289	*/
				290	time_t delta = iap->ia_atime.tv_sec - get_seconds();
				291	if (delta<0) delta = -delta;
				292	if (delta < MAX_TOUCH_TIME_ERROR &&
				293	inode_change_ok(inode, iap) != 0) {
				294	/* turn off ATTR_[AM]TIME_SET but leave ATTR_[AM]TIME
				295	* this will cause notify_change to set these times to "now"
				296	*/
				297	iap->ia_valid &= ~BOTH_TIME_SET;
				298	}
				299	}
				300
				301	/* The size case is special. It changes the file as well as the attributes. */
				302	if (iap->ia_valid & ATTR_SIZE) {
				303	if (iap->ia_size < inode->i_size) {
				304	err = nfsd_permission(fhp->fh_export, dentry, MAY_TRUNC\|MAY_OWNER_OVERRIDE);
				305	if (err)
				306	goto out;
				307	}
				308
				309	/*
				310	* If we are changing the size of the file, then
				311	* we need to break all leases.
				312	*/
				313	err = break_lease(inode, FMODE_WRITE \| O_NONBLOCK);
				314	if (err == -EWOULDBLOCK)
				315	err = -ETIMEDOUT;
				316	if (err) /* ENOMEM or EWOULDBLOCK */
				317	goto out_nfserr;
				318
				319	err = get_write_access(inode);
				320	if (err)
				321	goto out_nfserr;
				322
				323	size_change = 1;
				324	err = locks_verify_truncate(inode, NULL, iap->ia_size);
				325	if (err) {
				326	put_write_access(inode);
				327	goto out_nfserr;
				328	}
				329	DQUOT_INIT(inode);
				330	}
				331
				332	imode = inode->i_mode;
				333	if (iap->ia_valid & ATTR_MODE) {
				334	iap->ia_mode &= S_IALLUGO;
				335	imode = iap->ia_mode \|= (imode & ~S_IALLUGO);
				336	}
				337
				338	/* Revoke setuid/setgid bit on chown/chgrp */
				339	if ((iap->ia_valid & ATTR_UID) && iap->ia_uid != inode->i_uid)
				340	iap->ia_valid \|= ATTR_KILL_SUID;
				341	if ((iap->ia_valid & ATTR_GID) && iap->ia_gid != inode->i_gid)
				342	iap->ia_valid \|= ATTR_KILL_SGID;
				343
				344	/* Change the attributes. */
				345
				346	iap->ia_valid \|= ATTR_CTIME;
				347
				348	err = nfserr_notsync;
				349	if (!check_guard \|\| guardtime == inode->i_ctime.tv_sec) {
				350	fh_lock(fhp);
				351	err = notify_change(dentry, iap);
				352	err = nfserrno(err);
				353	fh_unlock(fhp);
				354	}
				355	if (size_change)
				356	put_write_access(inode);
				357	if (!err)
				358	if (EX_ISSYNC(fhp->fh_export))
				359	write_inode_now(inode, 1);
				360	out:
				361	return err;
				362
				363	out_nfserr:
				364	err = nfserrno(err);
				365	goto out;
				366	}
				367
				368	#if defined(CONFIG_NFSD_V4)
				369
				370	static int
				371	set_nfsv4_acl_one(struct dentry dentry, struct posix_acl pacl, char *key)
				372	{
				373	int len;
				374	size_t buflen;
				375	char *buf = NULL;
				376	int error = 0;
				377	struct inode *inode = dentry->d_inode;
				378
				379	buflen = posix_acl_xattr_size(pacl->a_count);
				380	buf = kmalloc(buflen, GFP_KERNEL);
				381	error = -ENOMEM;
				382	if (buf == NULL)
				383	goto out;
				384
				385	len = posix_acl_to_xattr(pacl, buf, buflen);
				386	if (len < 0) {
				387	error = len;
				388	goto out;
				389	}
				390
				391	error = -EOPNOTSUPP;
				392	if (inode->i_op && inode->i_op->setxattr) {
				393	down(&inode->i_sem);
				394	security_inode_setxattr(dentry, key, buf, len, 0);
				395	error = inode->i_op->setxattr(dentry, key, buf, len, 0);
				396	if (!error)
				397	security_inode_post_setxattr(dentry, key, buf, len, 0);
				398	up(&inode->i_sem);
				399	}
				400	out:
				401	kfree(buf);
				402	return error;
				403	}
				404
				405	int
				406	nfsd4_set_nfs4_acl(struct svc_rqst rqstp, struct svc_fh fhp,
				407	struct nfs4_acl *acl)
				408	{
				409	int error;
				410	struct dentry *dentry;
				411	struct inode *inode;
				412	struct posix_acl pacl = NULL, dpacl = NULL;
				413	unsigned int flags = 0;
				414
				415	/* Get inode */
				416	error = fh_verify(rqstp, fhp, 0 /* S_IFREG */, MAY_SATTR);
				417	if (error)
				418	goto out;
				419
				420	dentry = fhp->fh_dentry;
				421	inode = dentry->d_inode;
				422	if (S_ISDIR(inode->i_mode))
				423	flags = NFS4_ACL_DIR;
				424
				425	error = nfs4_acl_nfsv4_to_posix(acl, &pacl, &dpacl, flags);
				426	if (error == -EINVAL) {
				427	error = nfserr_attrnotsupp;
				428	goto out;
				429	} else if (error < 0)
				430	goto out_nfserr;
				431
				432	if (pacl) {
Christoph Hellwig	9a59f45	2005-06-23 00:10:19 -0700	[diff] [blame]	433	error = set_nfsv4_acl_one(dentry, pacl, POSIX_ACL_XATTR_ACCESS);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	434	if (error < 0)
				435	goto out_nfserr;
				436	}
				437
				438	if (dpacl) {
Christoph Hellwig	9a59f45	2005-06-23 00:10:19 -0700	[diff] [blame]	439	error = set_nfsv4_acl_one(dentry, dpacl, POSIX_ACL_XATTR_DEFAULT);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	440	if (error < 0)
				441	goto out_nfserr;
				442	}
				443
				444	error = nfs_ok;
				445
				446	out:
				447	posix_acl_release(pacl);
				448	posix_acl_release(dpacl);
				449	return (error);
				450	out_nfserr:
				451	error = nfserrno(error);
				452	goto out;
				453	}
				454
				455	static struct posix_acl *
				456	_get_posix_acl(struct dentry dentry, char key)
				457	{
				458	struct inode *inode = dentry->d_inode;
				459	char *buf = NULL;
				460	int buflen, error = 0;
				461	struct posix_acl *pacl = NULL;
				462
				463	error = -EOPNOTSUPP;
				464	if (inode->i_op == NULL)
				465	goto out_err;
				466	if (inode->i_op->getxattr == NULL)
				467	goto out_err;
				468
				469	error = security_inode_getxattr(dentry, key);
				470	if (error)
				471	goto out_err;
				472
				473	buflen = inode->i_op->getxattr(dentry, key, NULL, 0);
				474	if (buflen <= 0) {
				475	error = buflen < 0 ? buflen : -ENODATA;
				476	goto out_err;
				477	}
				478
				479	buf = kmalloc(buflen, GFP_KERNEL);
				480	if (buf == NULL) {
				481	error = -ENOMEM;
				482	goto out_err;
				483	}
				484
				485	error = inode->i_op->getxattr(dentry, key, buf, buflen);
				486	if (error < 0)
				487	goto out_err;
				488
				489	pacl = posix_acl_from_xattr(buf, buflen);
				490	out:
				491	kfree(buf);
				492	return pacl;
				493	out_err:
				494	pacl = ERR_PTR(error);
				495	goto out;
				496	}
				497
				498	int
				499	nfsd4_get_nfs4_acl(struct svc_rqst rqstp, struct dentry dentry, struct nfs4_acl **acl)
				500	{
				501	struct inode *inode = dentry->d_inode;
				502	int error = 0;
				503	struct posix_acl pacl = NULL, dpacl = NULL;
				504	unsigned int flags = 0;
				505
Christoph Hellwig	9a59f45	2005-06-23 00:10:19 -0700	[diff] [blame]	506	pacl = _get_posix_acl(dentry, POSIX_ACL_XATTR_ACCESS);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	507	if (IS_ERR(pacl) && PTR_ERR(pacl) == -ENODATA)
				508	pacl = posix_acl_from_mode(inode->i_mode, GFP_KERNEL);
				509	if (IS_ERR(pacl)) {
				510	error = PTR_ERR(pacl);
				511	pacl = NULL;
				512	goto out;
				513	}
				514
				515	if (S_ISDIR(inode->i_mode)) {
Christoph Hellwig	9a59f45	2005-06-23 00:10:19 -0700	[diff] [blame]	516	dpacl = _get_posix_acl(dentry, POSIX_ACL_XATTR_DEFAULT);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	517	if (IS_ERR(dpacl) && PTR_ERR(dpacl) == -ENODATA)
				518	dpacl = NULL;
				519	else if (IS_ERR(dpacl)) {
				520	error = PTR_ERR(dpacl);
				521	dpacl = NULL;
				522	goto out;
				523	}
				524	flags = NFS4_ACL_DIR;
				525	}
				526
				527	*acl = nfs4_acl_posix_to_nfsv4(pacl, dpacl, flags);
				528	if (IS_ERR(*acl)) {
				529	error = PTR_ERR(*acl);
				530	*acl = NULL;
				531	}
				532	out:
				533	posix_acl_release(pacl);
				534	posix_acl_release(dpacl);
				535	return error;
				536	}
				537
				538	#endif /* defined(CONFIG_NFS_V4) */
				539
				540	#ifdef CONFIG_NFSD_V3
				541	/*
				542	* Check server access rights to a file system object
				543	*/
				544	struct accessmap {
				545	u32 access;
				546	int how;
				547	};
				548	static struct accessmap nfs3_regaccess[] = {
				549	{ NFS3_ACCESS_READ, MAY_READ },
				550	{ NFS3_ACCESS_EXECUTE, MAY_EXEC },
				551	{ NFS3_ACCESS_MODIFY, MAY_WRITE\|MAY_TRUNC },
				552	{ NFS3_ACCESS_EXTEND, MAY_WRITE },
				553
				554	{ 0, 0 }
				555	};
				556
				557	static struct accessmap nfs3_diraccess[] = {
				558	{ NFS3_ACCESS_READ, MAY_READ },
				559	{ NFS3_ACCESS_LOOKUP, MAY_EXEC },
				560	{ NFS3_ACCESS_MODIFY, MAY_EXEC\|MAY_WRITE\|MAY_TRUNC },
				561	{ NFS3_ACCESS_EXTEND, MAY_EXEC\|MAY_WRITE },
				562	{ NFS3_ACCESS_DELETE, MAY_REMOVE },
				563
				564	{ 0, 0 }
				565	};
				566
				567	static struct accessmap nfs3_anyaccess[] = {
				568	/* Some clients - Solaris 2.6 at least, make an access call
				569	* to the server to check for access for things like /dev/null
				570	* (which really, the server doesn't care about). So
				571	* We provide simple access checking for them, looking
				572	* mainly at mode bits, and we make sure to ignore read-only
				573	* filesystem checks
				574	*/
				575	{ NFS3_ACCESS_READ, MAY_READ },
				576	{ NFS3_ACCESS_EXECUTE, MAY_EXEC },
				577	{ NFS3_ACCESS_MODIFY, MAY_WRITE\|MAY_LOCAL_ACCESS },
				578	{ NFS3_ACCESS_EXTEND, MAY_WRITE\|MAY_LOCAL_ACCESS },
				579
				580	{ 0, 0 }
				581	};
				582
				583	int
				584	nfsd_access(struct svc_rqst rqstp, struct svc_fh fhp, u32 access, u32 supported)
				585	{
				586	struct accessmap *map;
				587	struct svc_export *export;
				588	struct dentry *dentry;
				589	u32 query, result = 0, sresult = 0;
				590	unsigned int error;
				591
				592	error = fh_verify(rqstp, fhp, 0, MAY_NOP);
				593	if (error)
				594	goto out;
				595
				596	export = fhp->fh_export;
				597	dentry = fhp->fh_dentry;
				598
				599	if (S_ISREG(dentry->d_inode->i_mode))
				600	map = nfs3_regaccess;
				601	else if (S_ISDIR(dentry->d_inode->i_mode))
				602	map = nfs3_diraccess;
				603	else
				604	map = nfs3_anyaccess;
				605
				606
				607	query = *access;
				608	for (; map->access; map++) {
				609	if (map->access & query) {
				610	unsigned int err2;
				611
				612	sresult \|= map->access;
				613
				614	err2 = nfsd_permission(export, dentry, map->how);
				615	switch (err2) {
				616	case nfs_ok:
				617	result \|= map->access;
				618	break;
				619
				620	/* the following error codes just mean the access was not allowed,
				621	* rather than an error occurred */
				622	case nfserr_rofs:
				623	case nfserr_acces:
				624	case nfserr_perm:
				625	/* simply don't "or" in the access bit. */
				626	break;
				627	default:
				628	error = err2;
				629	goto out;
				630	}
				631	}
				632	}
				633	*access = result;
				634	if (supported)
				635	*supported = sresult;
				636
				637	out:
				638	return error;
				639	}
				640	#endif /* CONFIG_NFSD_V3 */
				641
				642
				643
				644	/*
				645	* Open an existing file or directory.
				646	* The access argument indicates the type of open (read/write/lock)
				647	* N.B. After this call fhp needs an fh_put
				648	*/
				649	int
				650	nfsd_open(struct svc_rqst rqstp, struct svc_fh fhp, int type,
				651	int access, struct file **filp)
				652	{
				653	struct dentry *dentry;
				654	struct inode *inode;
				655	int flags = O_RDONLY\|O_LARGEFILE, err;
				656
				657	/*
				658	* If we get here, then the client has already done an "open",
				659	* and (hopefully) checked permission - so allow OWNER_OVERRIDE
				660	* in case a chmod has now revoked permission.
				661	*/
				662	err = fh_verify(rqstp, fhp, type, access \| MAY_OWNER_OVERRIDE);
				663	if (err)
				664	goto out;
				665
				666	dentry = fhp->fh_dentry;
				667	inode = dentry->d_inode;
				668
				669	/* Disallow write access to files with the append-only bit set
				670	* or any access when mandatory locking enabled
				671	*/
				672	err = nfserr_perm;
				673	if (IS_APPEND(inode) && (access & MAY_WRITE))
				674	goto out;
				675	if (IS_ISMNDLK(inode))
				676	goto out;
				677
				678	if (!inode->i_fop)
				679	goto out;
				680
				681	/*
				682	* Check to see if there are any leases on this file.
				683	* This may block while leases are broken.
				684	*/
				685	err = break_lease(inode, O_NONBLOCK \| ((access & MAY_WRITE) ? FMODE_WRITE : 0));
				686	if (err == -EWOULDBLOCK)
				687	err = -ETIMEDOUT;
				688	if (err) /* NOMEM or WOULDBLOCK */
				689	goto out_nfserr;
				690
				691	if (access & MAY_WRITE) {
				692	flags = O_WRONLY\|O_LARGEFILE;
				693
				694	DQUOT_INIT(inode);
				695	}
				696	*filp = dentry_open(dget(dentry), mntget(fhp->fh_export->ex_mnt), flags);
				697	if (IS_ERR(*filp))
				698	err = PTR_ERR(*filp);
				699	out_nfserr:
				700	if (err)
				701	err = nfserrno(err);
				702	out:
				703	return err;
				704	}
				705
				706	/*
				707	* Close a file.
				708	*/
				709	void
				710	nfsd_close(struct file *filp)
				711	{
				712	fput(filp);
				713	}
				714
				715	/*
				716	* Sync a file
				717	* As this calls fsync (not fdatasync) there is no need for a write_inode
				718	* after it.
				719	*/
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	720	static inline int nfsd_dosync(struct file filp, struct dentry dp,
				721	struct file_operations *fop)
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	722	{
				723	struct inode *inode = dp->d_inode;
				724	int (fsync) (struct file , struct dentry *, int);
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	725	int err = nfs_ok;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	726
				727	filemap_fdatawrite(inode->i_mapping);
				728	if (fop && (fsync = fop->fsync))
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	729	err=fsync(filp, dp, 0);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	730	filemap_fdatawait(inode->i_mapping);
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	731
				732	return nfserrno(err);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	733	}
				734
				735
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	736	static int
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	737	nfsd_sync(struct file *filp)
				738	{
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	739	int err;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	740	struct inode *inode = filp->f_dentry->d_inode;
				741	dprintk("nfsd: sync file %s\n", filp->f_dentry->d_name.name);
				742	down(&inode->i_sem);
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	743	err=nfsd_dosync(filp, filp->f_dentry, filp->f_op);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	744	up(&inode->i_sem);
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	745
				746	return err;
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	747	}
				748
NeilBrown	a6ccbbb	2005-07-07 17:59:11 -0700	[diff] [blame]	749	void
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	750	nfsd_sync_dir(struct dentry *dp)
				751	{
				752	nfsd_dosync(NULL, dp, dp->d_inode->i_fop);
				753	}
				754
				755	/*
				756	* Obtain the readahead parameters for the file
				757	* specified by (dev, ino).
				758	*/
				759	static DEFINE_SPINLOCK(ra_lock);
				760
				761	static inline struct raparms *
				762	nfsd_get_raparms(dev_t dev, ino_t ino)
				763	{
				764	struct raparms ra, rap, *frap = NULL;
				765	int depth = 0;
				766
				767	spin_lock(&ra_lock);
				768	for (rap = &raparm_cache; (ra = *rap); rap = &ra->p_next) {
				769	if (ra->p_ino == ino && ra->p_dev == dev)
				770	goto found;
				771	depth++;
				772	if (ra->p_count == 0)
				773	frap = rap;
				774	}
				775	depth = nfsdstats.ra_size*11/10;
				776	if (!frap) {
				777	spin_unlock(&ra_lock);
				778	return NULL;
				779	}
				780	rap = frap;
				781	ra = *frap;
				782	ra->p_dev = dev;
				783	ra->p_ino = ino;
				784	ra->p_set = 0;
				785	found:
				786	if (rap != &raparm_cache) {
				787	*rap = ra->p_next;
				788	ra->p_next = raparm_cache;
				789	raparm_cache = ra;
				790	}
				791	ra->p_count++;
				792	nfsdstats.ra_depth[depth*10/nfsdstats.ra_size]++;
				793	spin_unlock(&ra_lock);
				794	return ra;
				795	}
				796
				797	/*
				798	* Grab and keep cached pages assosiated with a file in the svc_rqst
				799	* so that they can be passed to the netowork sendmsg/sendpage routines
				800	* directrly. They will be released after the sending has completed.
				801	*/
				802	static int
				803	nfsd_read_actor(read_descriptor_t desc, struct page page, unsigned long offset , unsigned long size)
				804	{
				805	unsigned long count = desc->count;
				806	struct svc_rqst *rqstp = desc->arg.data;
				807
				808	if (size > count)
				809	size = count;
				810
				811	if (rqstp->rq_res.page_len == 0) {
				812	get_page(page);
				813	rqstp->rq_respages[rqstp->rq_resused++] = page;
				814	rqstp->rq_res.page_base = offset;
				815	rqstp->rq_res.page_len = size;
				816	} else if (page != rqstp->rq_respages[rqstp->rq_resused-1]) {
				817	get_page(page);
				818	rqstp->rq_respages[rqstp->rq_resused++] = page;
				819	rqstp->rq_res.page_len += size;
				820	} else {
				821	rqstp->rq_res.page_len += size;
				822	}
				823
				824	desc->count = count - size;
				825	desc->written += size;
				826	return size;
				827	}
				828
				829	static inline int
				830	nfsd_vfs_read(struct svc_rqst rqstp, struct svc_fh fhp, struct file *file,
				831	loff_t offset, struct kvec vec, int vlen, unsigned long count)
				832	{
				833	struct inode *inode;
				834	struct raparms *ra;
				835	mm_segment_t oldfs;
				836	int err;
				837
				838	err = nfserr_perm;
				839	inode = file->f_dentry->d_inode;
				840	#ifdef MSNFS
				841	if ((fhp->fh_export->ex_flags & NFSEXP_MSNFS) &&
				842	(!lock_may_read(inode, offset, *count)))
				843	goto out;
				844	#endif
				845
				846	/* Get readahead parameters */
				847	ra = nfsd_get_raparms(inode->i_sb->s_dev, inode->i_ino);
				848
				849	if (ra && ra->p_set)
				850	file->f_ra = ra->p_ra;
				851
				852	if (file->f_op->sendfile) {
				853	svc_pushback_unused_pages(rqstp);
				854	err = file->f_op->sendfile(file, &offset, *count,
				855	nfsd_read_actor, rqstp);
				856	} else {
				857	oldfs = get_fs();
				858	set_fs(KERNEL_DS);
				859	err = vfs_readv(file, (struct iovec __user *)vec, vlen, &offset);
				860	set_fs(oldfs);
				861	}
				862
				863	/* Write back readahead params */
				864	if (ra) {
				865	spin_lock(&ra_lock);
				866	ra->p_ra = file->f_ra;
				867	ra->p_set = 1;
				868	ra->p_count--;
				869	spin_unlock(&ra_lock);
				870	}
				871
				872	if (err >= 0) {
				873	nfsdstats.io_read += err;
				874	*count = err;
				875	err = 0;
Robert Love	0eeca28	2005-07-12 17:06:03 -0400	[diff] [blame]	876	fsnotify_access(file->f_dentry);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	877	} else
				878	err = nfserrno(err);
				879	out:
				880	return err;
				881	}
				882
				883	static inline int
				884	nfsd_vfs_write(struct svc_rqst rqstp, struct svc_fh fhp, struct file *file,
				885	loff_t offset, struct kvec *vec, int vlen,
				886	unsigned long cnt, int *stablep)
				887	{
				888	struct svc_export *exp;
				889	struct dentry *dentry;
				890	struct inode *inode;
				891	mm_segment_t oldfs;
				892	int err = 0;
				893	int stable = *stablep;
				894
				895	err = nfserr_perm;
				896
				897	#ifdef MSNFS
				898	if ((fhp->fh_export->ex_flags & NFSEXP_MSNFS) &&
				899	(!lock_may_write(file->f_dentry->d_inode, offset, cnt)))
				900	goto out;
				901	#endif
				902
				903	dentry = file->f_dentry;
				904	inode = dentry->d_inode;
				905	exp = fhp->fh_export;
				906
				907	/*
				908	* Request sync writes if
				909	* - the sync export option has been set, or
				910	* - the client requested O_SYNC behavior (NFSv3 feature).
				911	* - The file system doesn't support fsync().
				912	* When gathered writes have been configured for this volume,
				913	* flushing the data to disk is handled separately below.
				914	*/
				915
				916	if (file->f_op->fsync == 0) {/* COMMIT3 cannot work */
				917	stable = 2;
				918	stablep = 2; / FILE_SYNC */
				919	}
				920
				921	if (!EX_ISSYNC(exp))
				922	stable = 0;
				923	if (stable && !EX_WGATHER(exp))
				924	file->f_flags \|= O_SYNC;
				925
				926	/* Write the data. */
				927	oldfs = get_fs(); set_fs(KERNEL_DS);
				928	err = vfs_writev(file, (struct iovec __user *)vec, vlen, &offset);
				929	set_fs(oldfs);
				930	if (err >= 0) {
				931	nfsdstats.io_write += cnt;
Robert Love	0eeca28	2005-07-12 17:06:03 -0400	[diff] [blame]	932	fsnotify_modify(file->f_dentry);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	933	}
				934
				935	/* clear setuid/setgid flag after write */
				936	if (err >= 0 && (inode->i_mode & (S_ISUID \| S_ISGID))) {
				937	struct iattr ia;
				938	ia.ia_valid = ATTR_KILL_SUID \| ATTR_KILL_SGID;
				939
				940	down(&inode->i_sem);
				941	notify_change(dentry, &ia);
				942	up(&inode->i_sem);
				943	}
				944
				945	if (err >= 0 && stable) {
				946	static ino_t last_ino;
				947	static dev_t last_dev;
				948
				949	/*
				950	* Gathered writes: If another process is currently
				951	* writing to the file, there's a high chance
				952	* this is another nfsd (triggered by a bulk write
				953	* from a client's biod). Rather than syncing the
				954	* file with each write request, we sleep for 10 msec.
				955	*
				956	* I don't know if this roughly approximates
				957	* C. Juszak's idea of gathered writes, but it's a
				958	* nice and simple solution (IMHO), and it seems to
				959	* work:-)
				960	*/
				961	if (EX_WGATHER(exp)) {
				962	if (atomic_read(&inode->i_writecount) > 1
				963	\|\| (last_ino == inode->i_ino && last_dev == inode->i_sb->s_dev)) {
				964	dprintk("nfsd: write defer %d\n", current->pid);
				965	msleep(10);
				966	dprintk("nfsd: write resume %d\n", current->pid);
				967	}
				968
				969	if (inode->i_state & I_DIRTY) {
				970	dprintk("nfsd: write sync %d\n", current->pid);
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	971	err=nfsd_sync(file);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	972	}
				973	#if 0
				974	wake_up(&inode->i_wait);
				975	#endif
				976	}
				977	last_ino = inode->i_ino;
				978	last_dev = inode->i_sb->s_dev;
				979	}
				980
				981	dprintk("nfsd: write complete err=%d\n", err);
				982	if (err >= 0)
				983	err = 0;
				984	else
				985	err = nfserrno(err);
				986	out:
				987	return err;
				988	}
				989
				990	/*
				991	* Read data from a file. count must contain the requested read count
				992	* on entry. On return, *count contains the number of bytes actually read.
				993	* N.B. After this call fhp needs an fh_put
				994	*/
				995	int
				996	nfsd_read(struct svc_rqst rqstp, struct svc_fh fhp, struct file *file,
				997	loff_t offset, struct kvec *vec, int vlen,
				998	unsigned long *count)
				999	{
				1000	int err;
				1001
				1002	if (file) {
				1003	err = nfsd_permission(fhp->fh_export, fhp->fh_dentry,
				1004	MAY_READ\|MAY_OWNER_OVERRIDE);
				1005	if (err)
				1006	goto out;
				1007	err = nfsd_vfs_read(rqstp, fhp, file, offset, vec, vlen, count);
				1008	} else {
				1009	err = nfsd_open(rqstp, fhp, S_IFREG, MAY_READ, &file);
				1010	if (err)
				1011	goto out;
				1012	err = nfsd_vfs_read(rqstp, fhp, file, offset, vec, vlen, count);
				1013	nfsd_close(file);
				1014	}
				1015	out:
				1016	return err;
				1017	}
				1018
				1019	/*
				1020	* Write data to a file.
				1021	* The stable flag requests synchronous writes.
				1022	* N.B. After this call fhp needs an fh_put
				1023	*/
				1024	int
				1025	nfsd_write(struct svc_rqst rqstp, struct svc_fh fhp, struct file *file,
				1026	loff_t offset, struct kvec *vec, int vlen, unsigned long cnt,
				1027	int *stablep)
				1028	{
				1029	int err = 0;
				1030
				1031	if (file) {
				1032	err = nfsd_permission(fhp->fh_export, fhp->fh_dentry,
				1033	MAY_WRITE\|MAY_OWNER_OVERRIDE);
				1034	if (err)
				1035	goto out;
				1036	err = nfsd_vfs_write(rqstp, fhp, file, offset, vec, vlen, cnt,
				1037	stablep);
				1038	} else {
				1039	err = nfsd_open(rqstp, fhp, S_IFREG, MAY_WRITE, &file);
				1040	if (err)
				1041	goto out;
				1042
				1043	if (cnt)
				1044	err = nfsd_vfs_write(rqstp, fhp, file, offset, vec, vlen,
				1045	cnt, stablep);
				1046	nfsd_close(file);
				1047	}
				1048	out:
				1049	return err;
				1050	}
				1051
				1052	#ifdef CONFIG_NFSD_V3
				1053	/*
				1054	* Commit all pending writes to stable storage.
				1055	* Strictly speaking, we could sync just the indicated file region here,
				1056	* but there's currently no way we can ask the VFS to do so.
				1057	*
				1058	* Unfortunately we cannot lock the file to make sure we return full WCC
				1059	* data to the client, as locking happens lower down in the filesystem.
				1060	*/
				1061	int
				1062	nfsd_commit(struct svc_rqst rqstp, struct svc_fh fhp,
				1063	loff_t offset, unsigned long count)
				1064	{
				1065	struct file *file;
				1066	int err;
				1067
				1068	if ((u64)count > ~(u64)offset)
				1069	return nfserr_inval;
				1070
				1071	if ((err = nfsd_open(rqstp, fhp, S_IFREG, MAY_WRITE, &file)) != 0)
				1072	return err;
				1073	if (EX_ISSYNC(fhp->fh_export)) {
				1074	if (file->f_op && file->f_op->fsync) {
David Shaw	a334de2	2006-01-06 00:19:58 -0800	[diff] [blame^]	1075	err = nfsd_sync(file);
Linus Torvalds	1da177e	2005-04-16 15:20:36 -0700	[diff] [blame]	1076	} else {
				1077	err = nfserr_notsupp;
				1078	}
				1079	}
				1080
				1081	nfsd_close(file);
				1082	return err;
				1083	}
				1084	#endif /* CONFIG_NFSD_V3 */
				1085
				1086	/*
				1087	* Create a file (regular, directory, device, fifo); UNIX sockets
				1088	* not yet implemented.
				1089	* If the response fh has been verified, the parent directory should
				1090	* already be locked. Note that the parent directory is left locked.
				1091	*
				1092	* N.B. Every call to nfsd_create needs an fh_put for _both_ fhp and resfhp
				1093	*/
				1094	int
				1095	nfsd_create(struct svc_rqst rqstp, struct svc_fh fhp,
				1096	char fname, int flen, struct iattr iap,
				1097	int type, dev_t rdev, struct svc_fh *resfhp)
				1098	{
				1099	struct dentry dentry, dchild = NULL;
				1100	struct inode *dirp;
				1101	int err;
				1102
				1103	err = nfserr_perm;
				1104	if (!flen)
				1105	goto out;
				1106	err = nfserr_exist;
				1107	if (isdotent(fname, flen))
				1108	goto out;
				1109
				1110	err = fh_verify(rqstp, fhp, S_IFDIR, MAY_CREATE);
				1111	if (err)
				1112	goto out;
				1113
				1114	dentry = fhp->fh_dentry;
				1115	dirp = dentry->d_inode;
				1116
				1117	err = nfserr_notdir;
				1118	if(!dirp->i_op \|\| !dirp->i_op->lookup)
				1119	goto out;
				1120	/*
				1121	* Check whether the response file handle has been verified yet.
				1122	* If it has, the parent directory should already be locked.
				1123	*/
				1124	if (!resfhp->fh_dentry) {
				1125	/* called from nfsd_proc_mkdir, or possibly nfsd3_proc_create */
				1126	fh_lock(fhp);
				1127	dchild = lookup_one_len(fname, dentry, flen);
				1128	err = PTR_ERR(dchild);
				1129	if (IS_ERR(dchild))
				1130	goto out_nfserr;
				1131	err = fh_compose(resfhp, fhp->fh_export, dchild, fhp);
				1132	if (err)
				1133	goto out;
				1134	} else {
				1135	/* called from nfsd_proc_create */
				1136	dchild = dget(resfhp->fh_dentry);
				1137	if (!fhp->fh_locked) {
				1138	/* not actually possible */
				1139	printk(KERN_ERR
				1140	"nfsd_create: parent %s/%s not locked!\n",
				1141	dentry->d_parent->d_name.name,
				1142	dentry->d_name.name);
				1143	err = -EIO;
				1144	goto out;
				1145	}
				1146	}
				1147	/*
				1148	* Make sure the child dentry is still negative ...
				1149	*/
				1150	err = nfserr_exist;
				1151	if (dchild->d_inode) {
				1152	dprintk("nfsd_create: dentry %s/%s not negative!\n",
				1153	dentry->d_name.name, dchild->d_name.name);
				1154	goto out;
				1155	}
				1156
				1157	if (!(iap->ia_valid & ATTR_MODE))
				1158	iap->ia_mode = 0;
				1159	iap->ia_mode = (iap->ia_mode & S_IALLUGO) \| type;
				1160
				1161	/*
				1162	* Get the dir op function pointer.
				1163	*/
				1164	err = nfserr_perm;
				1165	switch (type) {
				1166	case S_IFREG:
				1167	err = vfs_create(dirp, dchild, iap->ia_mode, NULL);
				1168	break;
				1169	case S_IFDIR:
				1170	err = vfs_mkdir(dirp, dchild, iap->ia_mode);
				1171	break;
				1172	case S_IFCHR:
				1173	case S_IFBLK:
				1174	case S_IFIFO:
				1175	case S_IFSOCK:
				1176	err = vfs_mknod(dirp, dchild, iap->ia_mode, rdev);
				1177	break;
				1178	default:
				1179	printk("nfsd: bad file type %o in nfsd_create\n", type);
				1180	err = -EINVAL;
				1181	}
				1182	if (err < 0)
				1183	goto out_nfserr;
				1184
				1185	if (EX_ISSYNC(fhp->fh_export)) {
				1186	nfsd_sync_dir(dentry);
				1187	write_inode_now(dchild->d_inode, 1);
				1188	}
				1189
				1190
				1191	/* Set file attributes. Mode has already been set and
				1192	* setting uid/gid works only for root. Irix appears to
				1193	* send along the gid when it tries to implement setgid
				1194	* directories via NFS.
				1195	*/
				1196	err = 0;
				1197	if ((iap->ia_valid &= ~(ATTR_UID\|ATTR_GID\|ATTR_MODE)) != 0)
				1198	err = nfsd_setattr(rqstp, resfhp, iap, 0, (time_t)0);
				1199	/*
				1200	* Update the file handle to get the new inode info.
				1201	*/
				1202	if (!err)
				1203	err = fh_update(resfhp);
				1204	out:
				1205	if (dchild && !IS_ERR(dchild))
				1206	dput(dchild);
				1207	return err;
				1208
				1209	out_nfserr:
				1210	err = nfserrno(err);
				1211	goto out;
				1212	}
				1213
				1214	#ifdef CONFIG_NFSD_V3
				1215	/*
				1216	* NFSv3 version of nfsd_create
				1217	*/
				1218	int
				1219	nfsd_create_v3(struct svc_rqst rqstp, struct svc_fh fhp,
				1220	char fname, int flen, struct iattr iap,
				1221	struct svc_fh resfhp, int createmode, u32 verifier,
				1222	int *truncp)
				1223	{
				1224	struct dentry dentry, dchild = NULL;
				1225	struct inode *dirp;
				1226	int err;
				1227	__u32 v_mtime=0, v_atime=0;
				1228	int v_mode=0;
				1229
				1230	err = nfserr_perm;
				1231	if (!flen)
				1232	goto out;
				1233	err = nfserr_exist;
				1234	if (isdotent(fname, flen))
				1235	goto out;
				1236	if (!(iap->ia_valid & ATTR_MODE))
				1237	iap->ia_mode = 0;
				1238	err = fh_verify(rqstp, fhp, S_IFDIR, MAY_CREATE);
				1239	if (err)
				1240	goto out;
				1241
				1242	dentry = fhp->fh_dentry;
				1243	dirp = dentry->d_inode;
				1244
				1245	/* Get all the sanity checks out of the way before
				1246	* we lock the parent. */
				1247	err = nfserr_notdir;
				1248	if(!dirp->i_op \|\| !dirp->i_op->lookup)
				1249	goto out;
				1250	fh_lock(fhp);
				1251
				1252	/*
				1253	* Compose the response file handle.
				1254	*/
				1255	dchild = lookup_one_len(fname, dentry, flen);
				1256	err = PTR_ERR(dchild);
				1257	if (IS_ERR(dchild))
				1258	goto out_nfserr;
				1259
				1260	err = fh_compose(resfhp, fhp->fh_export, dchild, fhp);
				1261	if (err)
				1262	goto out;
				1263
				1264	if (createmode == NFS3_CREATE_EXCLUSIVE) {
				1265	/* while the verifier would fit in mtime+atime,
				1266	* solaris7 gets confused (bugid 4218508) if these have
				1267	* the high bit set, so we use the mode as well
				1268	*/
				1269	v_mtime = verifier[0]&0x7fffffff;
				1270	v_atime = verifier[1]&0x7fffffff;
				1271	v_mode = S_IFREG
				1272	\| ((verifier[0]&0x80000000) >> (32-7)) /* u+x */
				1273	\| ((verifier[1]&0x80000000) >> (32-9)) /* u+r */
				1274	;
				1275	}
				1276
				1277	if (dchild->d_inode) {
				1278	err = 0;
				1279
				1280	switch (createmode) {
				1281	case NFS3_CREATE_UNCHECKED:
				1282	if (! S_ISREG(dchild->d_inode->i_mode))
				1283	err = nfserr_exist;
				1284	else if (truncp) {
				1285	/* in nfsv4, we need to treat this case a little
				1286	* differently. we don't want to truncate the
				1287	* file now; this would be wrong if the OPEN
				1288	* fails for some other reason. furthermore,
				1289	* if the size is nonzero, we should ignore it
				1290	* according to spec!
				1291	*/
				1292	*truncp = (iap->ia_valid & ATTR_SIZE) && !iap->ia_size;
				1293	}
				1294	else {
				1295	iap->ia_valid &= ATTR_SIZE;
				1296	goto set_attr;
				1297	}
				1298	break;
				1299	case NFS3_CREATE_EXCLUSIVE:
				1300	if ( dchild->d_inode->i_mtime.tv_sec == v_mtime
				1301	&& dchild->d_inode->i_atime.tv_sec == v_atime
				1302	&& dchild->d_inode->i_mode == v_mode
				1303	&& dchild->d_inode->i_size == 0 )
				1304	break;
				1305	/* fallthru */
				1306	case NFS3_CREATE_GUARDED:
				1307	err = nfserr_exist;
				1308	}
				1309	goto out;
				1310	}
				1311
				1312	err = vfs_create(dirp, dchild, iap->ia_mode, NULL);
				1313	if (err < 0)
				1314	goto out_nfserr;
				1315
				1316	if (EX_ISSYNC(fhp->fh_export)) {
				1317	nfsd_sync_dir(dentry);
				1318	/* setattr will sync the child (or not) */
				1319	}
				1320
				1321	/*
				1322	* Update the filehandle to get the new inode info.
				1323	*/
				1324	err = fh_update(resfhp);
				1325	if (err)
				1326	goto out;
				1327
				1328	if (createmode == NFS3_CREATE_EXCLUSIVE) {
				1329	/* Cram the verifier into atime/mtime/mode */
				1330	iap->ia_valid = ATTR_MTIME\|ATTR_ATIME
				1331	\| ATTR_MTIME_SET\|ATTR_ATIME_SET
				1332	\| ATTR_MODE;
				1333	/* XXX someone who knows this better please fix it for nsec */
				1334	iap->ia_mtime.tv_sec = v_mtime;
				1335	iap->ia_atime.tv_sec = v_atime;
				1336	iap->ia_mtime.tv_nsec = 0;
				1337	iap->ia_atime.tv_nsec = 0;
				1338	iap->ia_mode = v_mode;
				1339	}
				1340
				1341	/* Set file attributes.
				1342	* Mode has already been set but we might need to reset it
				1343	* for CREATE_EXCLUSIVE
				1344	* Irix appears to send along the gid when it tries to
				1345	* implement setgid directories via NFS. Clear out all that cruft.
				1346	*/
				1347	set_attr:
				1348	if ((iap->ia_valid &= ~(ATTR_UID\|ATTR_GID)) != 0)
				1349	err = nfsd_setattr(rqstp, resfhp, iap, 0, (time_t)0);
				1350
				1351	out:
				1352	fh_unlock(fhp);
				1353	if (dchild && !IS_ERR(dchild))
				1354	dput(dchild);
				1355	return err;
				1356
				1357	out_nfserr:
				1358	err = nfserrno(err);
				1359	goto out;
				1360	}
				1361	#endif /* CONFIG_NFSD_V3 */
				1362
				1363	/*
				1364	* Read a symlink. On entry, *lenp must contain the maximum path length that
				1365	* fits into the buffer. On return, it contains the true length.
				1366	* N.B. After this call fhp needs an fh_put
				1367	*/
				1368	int
				1369	nfsd_readlink(struct svc_rqst rqstp, struct svc_fh fhp, char buf, int lenp)
				1370	{
				1371	struct dentry *dentry;
				1372	struct inode *inode;
				1373	mm_segment_t oldfs;
				1374	int err;
				1375
				1376	err = fh_verify(rqstp, fhp, S_IFLNK, MAY_NOP);
				1377	if (err)
				1378	goto out;
				1379
				1380	dentry = fhp->fh_dentry;
				1381	inode = dentry->d_inode;
				1382
				1383	err = nfserr_inval;
				1384	if (!inode->i_op \|\| !inode->i_op->readlink)
				1385	goto out;
				1386
				1387	touch_atime(fhp->fh_export->ex_mnt, dentry);
				1388	/* N.B. Why does this call need a get_fs()??
				1389	* Remove the set_fs and watch the fireworks:-) --okir
				1390	*/
				1391
				1392	oldfs = get_fs(); set_fs(KERNEL_DS);
				1393	err = inode->i_op->readlink(dentry, buf, *lenp);
				1394	set_fs(oldfs);
				1395
				1396	if (err < 0)
				1397	goto out_nfserr;
				1398	*lenp = err;
				1399	err = 0;
				1400	out:
				1401	return err;
				1402
				1403	out_nfserr:
				1404	err = nfserrno(err);
				1405	goto out;
				1406	}
				1407
				1408	/*
				1409	* Create a symlink and look up its inode
				1410	* N.B. After this call _both_ fhp and resfhp need an fh_put
				1411	*/
				1412	int
				1413	nfsd_symlink(struct svc_rqst rqstp, struct svc_fh fhp,
				1414	char *fname, int flen,
				1415	char *path, int plen,
				1416	struct svc_fh *resfhp,
				1417	struct iattr *iap)
				1418	{
				1419	struct dentry dentry, dnew;
				1420	int err, cerr;
				1421	umode_t mode;
				1422
				1423	err = nfserr_noent;
				1424	if (!flen \|\| !plen)
				1425	goto out;
				1426	err = nfserr_exist;
				1427	if (isdotent(fname, flen))
				1428	goto out;
				1429
				1430	err = fh_verify(rqstp, fhp, S_IFDIR, MAY_CREATE);
				1431	if (err)
				1432	goto out;
				1433	fh_lock(fhp);
				1434	dentry = fhp->fh_dentry;
				1435	dnew = lookup_one_len(fname, dentry, flen);
				1436	err = PTR_ERR(dnew);
				1437	if (IS_ERR(dnew))
				1438	goto out_nfserr;
				1439
				1440	mode = S_IALLUGO;
				1441	/* Only the MODE ATTRibute is even vaguely meaningful */
				1442	if (iap && (iap->ia_valid & ATTR_MODE))
				1443	mode = iap->ia_mode & S_IALLUGO;
				1444
				1445	if (unlikely(path[plen] != 0)) {
				1446	char *path_alloced = kmalloc(plen+1, GFP_KERNEL);
				1447	if (path_alloced == NULL)
				1448	err = -ENOMEM;
				1449	else {
				1450	strncpy(path_alloced, path, plen);
				1451	path_alloced[plen] = 0;
				1452	err = vfs_symlink(dentry->d_inode, dnew, path_alloced, mode);
				1453	kfree(path_alloced);
				1454	}
				1455	} else
				1456	err = vfs_symlink(dentry->d_inode, dnew, path, mode);
				1457
				1458	if (!err) {
				1459	if (EX_ISSYNC(fhp->fh_export))
				1460	nfsd_sync_dir(dentry);
				1461	} else
				1462	err = nfserrno(err);
				1463	fh_unlock(fhp);
				1464
				1465	cerr = fh_compose(resfhp, fhp->fh_export, dnew, fhp);
				1466	dput(dnew);
				1467	if (err==0) err = cerr;
				1468	out:
				1469	return err;
				1470
				1471	out_nfserr:
				1472	err = nfserrno(err);
				1473	goto out;
				1474	}
				1475
				1476	/*
				1477	* Create a hardlink
				1478	* N.B. After this call _both_ ffhp and tfhp need an fh_put
				1479	*/
				1480	int
				1481	nfsd_link(struct svc_rqst rqstp, struct svc_fh ffhp,
				1482	char name, int len, struct svc_fh tfhp)
				1483	{
				1484	struct dentry ddir, dnew, *dold;
				1485	struct inode dirp, dest;
				1486	int err;
				1487
				1488	err = fh_verify(rqstp, ffhp, S_IFDIR, MAY_CREATE);
				1489	if (err)
				1490	goto out;
				1491	err = fh_verify(rqstp, tfhp, -S_IFDIR, MAY_NOP);
				1492	if (err)
				1493	goto out;
				1494
				1495	err = nfserr_perm;
				1496	if (!len)
				1497	goto out;
				1498	err = nfserr_exist;
				1499	if (isdotent(name, len))
				1500	goto out;
				1501
				1502	fh_lock(ffhp);
				1503	ddir = ffhp->fh_dentry;
				1504	dirp = ddir->d_inode;
				1505
				1506	dnew = lookup_one_len(name, ddir, len);
				1507	err = PTR_ERR(dnew);
				1508	if (IS_ERR(dnew))
				1509	goto out_nfserr;
				1510
				1511	dold = tfhp->fh_dentry;
				1512	dest = dold->d_inode;
				1513
				1514	err = vfs_link(dold, dirp, dnew);
				1515	if (!err) {
				1516	if (EX_ISSYNC(ffhp->fh_export)) {
				1517	nfsd_sync_dir(ddir);
				1518	write_inode_now(dest, 1);
				1519	}
				1520	} else {
				1521	if (err == -EXDEV && rqstp->rq_vers == 2)
				1522	err = nfserr_acces;
				1523	else
				1524	err = nfserrno(err);
				1525	}
				1526
				1527	fh_unlock(ffhp);
				1528	dput(dnew);
				1529	out:
				1530	return err;
				1531
				1532	out_nfserr:
				1533	err = nfserrno(err);
				1534	goto out;
				1535	}
				1536
				1537	/*
				1538	* Rename a file
				1539	* N.B. After this call _both_ ffhp and tfhp need an fh_put
				1540	*/
				1541	int
				1542	nfsd_rename(struct svc_rqst rqstp, struct svc_fh ffhp, char *fname, int flen,
				1543	struct svc_fh tfhp, char tname, int tlen)
				1544	{
				1545	struct dentry fdentry, tdentry, odentry, ndentry, *trap;
				1546	struct inode fdir, tdir;
				1547	int err;
				1548
				1549	err = fh_verify(rqstp, ffhp, S_IFDIR, MAY_REMOVE);
				1550	if (err)
				1551	goto out;
				1552	err = fh_verify(rqstp, tfhp, S_IFDIR, MAY_CREATE);
				1553	if (err)
				1554	goto out;
				1555
				1556	fdentry = ffhp->fh_dentry;
				1557	fdir = fdentry->d_inode;
				1558
				1559	tdentry = tfhp->fh_dentry;
				1560	tdir = tdentry->d_inode;
				1561
				1562	err = (rqstp->rq_vers == 2) ? nfserr_acces : nfserr_xdev;
				1563	if (fdir->i_sb != tdir->i_sb)
				1564	goto out;
				1565
				1566	err = nfserr_perm;
				1567	if (!flen \|\| isdotent(fname, flen) \|\| !tlen \|\| isdotent(tname, tlen))
				1568	goto out;
				1569
				1570	/* cannot use fh_lock as we need deadlock protective ordering
				1571	* so do it by hand */
				1572	trap = lock_rename(tdentry, fdentry);
				1573	ffhp->fh_locked = tfhp->fh_locked = 1;
				1574	fill_pre_wcc(ffhp);
				1575	fill_pre_wcc(tfhp);
				1576
				1577	odentry = lookup_one_len(fname, fdentry, flen);
				1578	err = PTR_ERR(odentry);
				1579	if (IS_ERR(odentry))
				1580	goto out_nfserr;
				1581
				1582	err = -ENOENT;
				1583	if (!odentry->d_inode)
				1584	goto out_dput_old;
				1585	err = -EINVAL;
				1586	if (odentry == trap)
				1587	goto out_dput_old;
				1588
				1589	ndentry = lookup_one_len(tname, tdentry, tlen);
				1590	err = PTR_ERR(ndentry);
				1591	if (IS_ERR(ndentry))
				1592	goto out_dput_old;
				1593	err = -ENOTEMPTY;
				1594	if (ndentry == trap)
				1595	goto out_dput_new;
				1596
				1597	#ifdef MSNFS
				1598	if ((ffhp->fh_export->ex_flags & NFSEXP_MSNFS) &&
				1599	((atomic_read(&odentry->d_count) > 1)
				1600	\|\| (atomic_read(&ndentry->d_count) > 1))) {
				1601	err = nfserr_perm;
				1602	} else
				1603	#endif
				1604	err = vfs_rename(fdir, odentry, tdir, ndentry);
				1605	if (!err && EX_ISSYNC(tfhp->fh_export)) {
				1606	nfsd_sync_dir(tdentry);
				1607	nfsd_sync_dir(fdentry);
				1608	}
				1609
				1610	out_dput_new:
				1611	dput(ndentry);
				1612	out_dput_old:
				1613	dput(odentry);
				1614	out_nfserr:
				1615	if (err)
				1616	err = nfserrno(err);
				1617
				1618	/* we cannot reply on fh_unlock on the two filehandles,
				1619	* as that would do the wrong thing if the two directories
				1620	* were the same, so again we do it by hand
				1621	*/
				1622	fill_post_wcc(ffhp);
				1623	fill_post_wcc(tfhp);
				1624	unlock_rename(tdentry, fdentry);
				1625	ffhp->fh_locked = tfhp->fh_locked = 0;
				1626
				1627	out:
				1628	return err;
				1629	}
				1630
				1631	/*
				1632	* Unlink a file or directory
				1633	* N.B. After this call fhp needs an fh_put
				1634	*/
				1635	int
				1636	nfsd_unlink(struct svc_rqst rqstp, struct svc_fh fhp, int type,
				1637	char *fname, int flen)
				1638	{
				1639	struct dentry dentry, rdentry;
				1640	struct inode *dirp;
				1641	int err;
				1642
				1643	err = nfserr_acces;
				1644	if (!flen \|\| isdotent(fname, flen))
				1645	goto out;
				1646	err = fh_verify(rqstp, fhp, S_IFDIR, MAY_REMOVE);
				1647	if (err)
				1648	goto out;
				1649
				1650	fh_lock(fhp);
				1651	dentry = fhp->fh_dentry;
				1652	dirp = dentry->d_inode;
				1653
				1654	rdentry = lookup_one_len(fname, dentry, flen);
				1655	err = PTR_ERR(rdentry);
				1656	if (IS_ERR(rdentry))
				1657	goto out_nfserr;
				1658
				1659	if (!rdentry->d_inode) {
				1660	dput(rdentry);
				1661	err = nfserr_noent;
				1662	goto out;
				1663	}
				1664
				1665	if (!type)
				1666	type = rdentry->d_inode->i_mode & S_IFMT;
				1667
				1668	if (type != S_IFDIR) { /* It's UNLINK */
				1669	#ifdef MSNFS
				1670	if ((fhp->fh_export->ex_flags & NFSEXP_MSNFS) &&
				1671	(atomic_read(&rdentry->d_count) > 1)) {
				1672	err = nfserr_perm;
				1673	} else
				1674	#endif
				1675	err = vfs_unlink(dirp, rdentry);
				1676	} else { /* It's RMDIR */
				1677	err = vfs_rmdir(dirp, rdentry);
				1678	}
				1679
				1680	dput(rdentry);
				1681
				1682	if (err)
				1683	goto out_nfserr;
				1684	if (EX_ISSYNC(fhp->fh_export))
				1685	nfsd_sync_dir(dentry);
				1686
				1687	out:
				1688	return err;
				1689
				1690	out_nfserr:
				1691	err = nfserrno(err);
				1692	goto out;
				1693	}
				1694
				1695	/*
				1696	* Read entries from a directory.
				1697	* The NFSv3/4 verifier we ignore for now.
				1698	*/
				1699	int
				1700	nfsd_readdir(struct svc_rqst rqstp, struct svc_fh fhp, loff_t *offsetp,
				1701	struct readdir_cd *cdp, encode_dent_fn func)
				1702	{
				1703	int err;
				1704	struct file *file;
				1705	loff_t offset = *offsetp;
				1706
				1707	err = nfsd_open(rqstp, fhp, S_IFDIR, MAY_READ, &file);
				1708	if (err)
				1709	goto out;
				1710
				1711	offset = vfs_llseek(file, offset, 0);
				1712	if (offset < 0) {
				1713	err = nfserrno((int)offset);
				1714	goto out_close;
				1715	}
				1716
				1717	/*
				1718	* Read the directory entries. This silly loop is necessary because
				1719	* readdir() is not guaranteed to fill up the entire buffer, but
				1720	* may choose to do less.
				1721	*/
				1722
				1723	do {
				1724	cdp->err = nfserr_eof; /* will be cleared on successful read */
				1725	err = vfs_readdir(file, (filldir_t) func, cdp);
				1726	} while (err >=0 && cdp->err == nfs_ok);
				1727	if (err)
				1728	err = nfserrno(err);
				1729	else
				1730	err = cdp->err;
				1731	*offsetp = vfs_llseek(file, 0, 1);
				1732
				1733	if (err == nfserr_eof \|\| err == nfserr_toosmall)
				1734	err = nfs_ok; /* can still be found in ->err */
				1735	out_close:
				1736	nfsd_close(file);
				1737	out:
				1738	return err;
				1739	}
				1740
				1741	/*
				1742	* Get file system stats
				1743	* N.B. After this call fhp needs an fh_put
				1744	*/
				1745	int
				1746	nfsd_statfs(struct svc_rqst rqstp, struct svc_fh fhp, struct kstatfs *stat)
				1747	{
				1748	int err = fh_verify(rqstp, fhp, 0, MAY_NOP);
				1749	if (!err && vfs_statfs(fhp->fh_dentry->d_inode->i_sb,stat))
				1750	err = nfserr_io;
				1751	return err;
				1752	}
				1753
				1754	/*
				1755	* Check for a user's access permissions to this inode.
				1756	*/
				1757	int
				1758	nfsd_permission(struct svc_export exp, struct dentry dentry, int acc)
				1759	{
				1760	struct inode *inode = dentry->d_inode;
				1761	int err;
				1762
				1763	if (acc == MAY_NOP)
				1764	return 0;
				1765	#if 0
				1766	dprintk("nfsd: permission 0x%x%s%s%s%s%s%s%s mode 0%o%s%s%s\n",
				1767	acc,
				1768	(acc & MAY_READ)? " read" : "",
				1769	(acc & MAY_WRITE)? " write" : "",
				1770	(acc & MAY_EXEC)? " exec" : "",
				1771	(acc & MAY_SATTR)? " sattr" : "",
				1772	(acc & MAY_TRUNC)? " trunc" : "",
				1773	(acc & MAY_LOCK)? " lock" : "",
				1774	(acc & MAY_OWNER_OVERRIDE)? " owneroverride" : "",
				1775	inode->i_mode,
				1776	IS_IMMUTABLE(inode)? " immut" : "",
				1777	IS_APPEND(inode)? " append" : "",
				1778	IS_RDONLY(inode)? " ro" : "");
				1779	dprintk(" owner %d/%d user %d/%d\n",
				1780	inode->i_uid, inode->i_gid, current->fsuid, current->fsgid);
				1781	#endif
				1782
				1783	/* Normally we reject any write/sattr etc access on a read-only file
				1784	* system. But if it is IRIX doing check on write-access for a
				1785	* device special file, we ignore rofs.
				1786	*/
				1787	if (!(acc & MAY_LOCAL_ACCESS))
				1788	if (acc & (MAY_WRITE \| MAY_SATTR \| MAY_TRUNC)) {
				1789	if (EX_RDONLY(exp) \|\| IS_RDONLY(inode))
				1790	return nfserr_rofs;
				1791	if (/* (acc & MAY_WRITE) && */ IS_IMMUTABLE(inode))
				1792	return nfserr_perm;
				1793	}
				1794	if ((acc & MAY_TRUNC) && IS_APPEND(inode))
				1795	return nfserr_perm;
				1796
				1797	if (acc & MAY_LOCK) {
				1798	/* If we cannot rely on authentication in NLM requests,
				1799	* just allow locks, otherwise require read permission, or
				1800	* ownership
				1801	*/
				1802	if (exp->ex_flags & NFSEXP_NOAUTHNLM)
				1803	return 0;
				1804	else
				1805	acc = MAY_READ \| MAY_OWNER_OVERRIDE;
				1806	}
				1807	/*
				1808	* The file owner always gets access permission for accesses that
				1809	* would normally be checked at open time. This is to make
				1810	* file access work even when the client has done a fchmod(fd, 0).
				1811	*
				1812	* However, `cp foo bar' should fail nevertheless when bar is
				1813	* readonly. A sensible way to do this might be to reject all
				1814	* attempts to truncate a read-only file, because a creat() call
				1815	* always implies file truncation.
				1816	* ... but this isn't really fair. A process may reasonably call
				1817	* ftruncate on an open file descriptor on a file with perm 000.
				1818	* We must trust the client to do permission checking - using "ACCESS"
				1819	* with NFSv3.
				1820	*/
				1821	if ((acc & MAY_OWNER_OVERRIDE) &&
				1822	inode->i_uid == current->fsuid)
				1823	return 0;
				1824
				1825	err = permission(inode, acc & (MAY_READ\|MAY_WRITE\|MAY_EXEC), NULL);
				1826
				1827	/* Allow read access to binaries even when mode 111 */
				1828	if (err == -EACCES && S_ISREG(inode->i_mode) &&
				1829	acc == (MAY_READ \| MAY_OWNER_OVERRIDE))
				1830	err = permission(inode, MAY_EXEC, NULL);
				1831
				1832	return err? nfserrno(err) : 0;
				1833	}
				1834
				1835	void
				1836	nfsd_racache_shutdown(void)
				1837	{
				1838	if (!raparm_cache)
				1839	return;
				1840	dprintk("nfsd: freeing readahead buffers.\n");
				1841	kfree(raparml);
				1842	raparm_cache = raparml = NULL;
				1843	}
				1844	/*
				1845	* Initialize readahead param cache
				1846	*/
				1847	int
				1848	nfsd_racache_init(int cache_size)
				1849	{
				1850	int i;
				1851
				1852	if (raparm_cache)
				1853	return 0;
				1854	raparml = kmalloc(sizeof(struct raparms) * cache_size, GFP_KERNEL);
				1855
				1856	if (raparml != NULL) {
				1857	dprintk("nfsd: allocating %d readahead buffers.\n",
				1858	cache_size);
				1859	memset(raparml, 0, sizeof(struct raparms) * cache_size);
				1860	for (i = 0; i < cache_size - 1; i++) {
				1861	raparml[i].p_next = raparml + i + 1;
				1862	}
				1863	raparm_cache = raparml;
				1864	} else {
				1865	printk(KERN_WARNING
				1866	"nfsd: Could not allocate memory read-ahead cache.\n");
				1867	return -ENOMEM;
				1868	}
				1869	nfsdstats.ra_size = cache_size;
				1870	return 0;
				1871	}
Andreas Gruenbacher	a257cdd	2005-06-22 17:16:26 +0000	[diff] [blame]	1872
				1873	#if defined(CONFIG_NFSD_V2_ACL) \|\| defined(CONFIG_NFSD_V3_ACL)
				1874	struct posix_acl *
				1875	nfsd_get_posix_acl(struct svc_fh *fhp, int type)
				1876	{
				1877	struct inode *inode = fhp->fh_dentry->d_inode;
				1878	char *name;
				1879	void *value = NULL;
				1880	ssize_t size;
				1881	struct posix_acl *acl;
				1882
				1883	if (!IS_POSIXACL(inode) \|\| !inode->i_op \|\| !inode->i_op->getxattr)
				1884	return ERR_PTR(-EOPNOTSUPP);
				1885	switch(type) {
				1886	case ACL_TYPE_ACCESS:
Christoph Hellwig	334a13e	2005-06-28 20:44:58 -0700	[diff] [blame]	1887	name = POSIX_ACL_XATTR_ACCESS;
Andreas Gruenbacher	a257cdd	2005-06-22 17:16:26 +0000	[diff] [blame]	1888	break;
				1889	case ACL_TYPE_DEFAULT:
Christoph Hellwig	334a13e	2005-06-28 20:44:58 -0700	[diff] [blame]	1890	name = POSIX_ACL_XATTR_DEFAULT;
Andreas Gruenbacher	a257cdd	2005-06-22 17:16:26 +0000	[diff] [blame]	1891	break;
				1892	default:
				1893	return ERR_PTR(-EOPNOTSUPP);
				1894	}
				1895
				1896	size = inode->i_op->getxattr(fhp->fh_dentry, name, NULL, 0);
				1897
				1898	if (size < 0) {
				1899	acl = ERR_PTR(size);
				1900	goto getout;
				1901	} else if (size > 0) {
				1902	value = kmalloc(size, GFP_KERNEL);
				1903	if (!value) {
				1904	acl = ERR_PTR(-ENOMEM);
				1905	goto getout;
				1906	}
				1907	size = inode->i_op->getxattr(fhp->fh_dentry, name, value, size);
				1908	if (size < 0) {
				1909	acl = ERR_PTR(size);
				1910	goto getout;
				1911	}
				1912	}
				1913	acl = posix_acl_from_xattr(value, size);
				1914
				1915	getout:
				1916	kfree(value);
				1917	return acl;
				1918	}
				1919
				1920	int
				1921	nfsd_set_posix_acl(struct svc_fh fhp, int type, struct posix_acl acl)
				1922	{
				1923	struct inode *inode = fhp->fh_dentry->d_inode;
				1924	char *name;
				1925	void *value = NULL;
				1926	size_t size;
				1927	int error;
				1928
				1929	if (!IS_POSIXACL(inode) \|\| !inode->i_op \|\|
				1930	!inode->i_op->setxattr \|\| !inode->i_op->removexattr)
				1931	return -EOPNOTSUPP;
				1932	switch(type) {
				1933	case ACL_TYPE_ACCESS:
Christoph Hellwig	334a13e	2005-06-28 20:44:58 -0700	[diff] [blame]	1934	name = POSIX_ACL_XATTR_ACCESS;
Andreas Gruenbacher	a257cdd	2005-06-22 17:16:26 +0000	[diff] [blame]	1935	break;
				1936	case ACL_TYPE_DEFAULT:
Christoph Hellwig	334a13e	2005-06-28 20:44:58 -0700	[diff] [blame]	1937	name = POSIX_ACL_XATTR_DEFAULT;
Andreas Gruenbacher	a257cdd	2005-06-22 17:16:26 +0000	[diff] [blame]	1938	break;
				1939	default:
				1940	return -EOPNOTSUPP;
				1941	}
				1942
				1943	if (acl && acl->a_count) {
Christoph Hellwig	334a13e	2005-06-28 20:44:58 -0700	[diff] [blame]	1944	size = posix_acl_xattr_size(acl->a_count);
Andreas Gruenbacher	a257cdd	2005-06-22 17:16:26 +0000	[diff] [blame]	1945	value = kmalloc(size, GFP_KERNEL);
				1946	if (!value)
				1947	return -ENOMEM;
				1948	size = posix_acl_to_xattr(acl, value, size);
				1949	if (size < 0) {
				1950	error = size;
				1951	goto getout;
				1952	}
				1953	} else
				1954	size = 0;
				1955
				1956	if (!fhp->fh_locked)
				1957	fh_lock(fhp); /* unlocking is done automatically */
				1958	if (size)
				1959	error = inode->i_op->setxattr(fhp->fh_dentry, name,
				1960	value, size, 0);
				1961	else {
				1962	if (!S_ISDIR(inode->i_mode) && type == ACL_TYPE_DEFAULT)
				1963	error = 0;
				1964	else {
				1965	error = inode->i_op->removexattr(fhp->fh_dentry, name);
				1966	if (error == -ENODATA)
				1967	error = 0;
				1968	}
				1969	}
				1970
				1971	getout:
				1972	kfree(value);
				1973	return error;
				1974	}
				1975	#endif /* defined(CONFIG_NFSD_V2_ACL) \|\| defined(CONFIG_NFSD_V3_ACL) */