blob: 000bd98650049c6ee27386340982f564dd30870a [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
Tejun Heo6d66f5c2007-09-20 17:31:38 +09002 * fs/sysfs/inode.c - basic sysfs inode and dentry operations
Linus Torvalds1da177e2005-04-16 15:20:36 -07003 *
Tejun Heo6d66f5c2007-09-20 17:31:38 +09004 * Copyright (c) 2001-3 Patrick Mochel
5 * Copyright (c) 2007 SUSE Linux Products GmbH
6 * Copyright (c) 2007 Tejun Heo <teheo@suse.de>
7 *
8 * This file is released under the GPLv2.
Linus Torvalds1da177e2005-04-16 15:20:36 -07009 *
10 * Please see Documentation/filesystems/sysfs.txt for more information.
11 */
12
13#undef DEBUG
14
15#include <linux/pagemap.h>
16#include <linux/namei.h>
17#include <linux/backing-dev.h>
Randy Dunlap16f7e0f2006-01-11 12:17:46 -080018#include <linux/capability.h>
Randy.Dunlap995982c2006-07-10 23:05:25 -070019#include <linux/errno.h>
Alexey Dobriyane8edc6e2007-05-21 01:22:52 +040020#include <linux/sched.h>
David P. Quigleyddd29ec2009-09-09 14:25:37 -040021#include <linux/xattr.h>
22#include <linux/security.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070023#include "sysfs.h"
24
25extern struct super_block * sysfs_sb;
26
Christoph Hellwigf5e54d62006-06-28 04:26:44 -070027static const struct address_space_operations sysfs_aops = {
Linus Torvalds1da177e2005-04-16 15:20:36 -070028 .readpage = simple_readpage,
Nick Piggin800d15a2007-10-16 01:25:03 -070029 .write_begin = simple_write_begin,
30 .write_end = simple_write_end,
Linus Torvalds1da177e2005-04-16 15:20:36 -070031};
32
33static struct backing_dev_info sysfs_backing_dev_info = {
Jens Axboed9938312009-06-12 14:45:52 +020034 .name = "sysfs",
Linus Torvalds1da177e2005-04-16 15:20:36 -070035 .ra_pages = 0, /* No readahead */
Miklos Szeredie4ad08f2008-04-30 00:54:37 -070036 .capabilities = BDI_CAP_NO_ACCT_AND_WRITEBACK,
Linus Torvalds1da177e2005-04-16 15:20:36 -070037};
38
Arjan van de Venc5ef1c42007-02-12 00:55:40 -080039static const struct inode_operations sysfs_inode_operations ={
Maneesh Soni988d1862005-05-31 10:39:14 +053040 .setattr = sysfs_setattr,
David P. Quigleyddd29ec2009-09-09 14:25:37 -040041 .setxattr = sysfs_setxattr,
Maneesh Soni988d1862005-05-31 10:39:14 +053042};
43
Peter Zijlstrae0bf68d2007-10-16 23:25:46 -070044int __init sysfs_inode_init(void)
45{
46 return bdi_init(&sysfs_backing_dev_info);
47}
48
Stefan Richterf38506c2009-10-14 20:47:32 +020049static struct sysfs_inode_attrs *sysfs_init_inode_attrs(struct sysfs_dirent *sd)
David P. Quigleyddd29ec2009-09-09 14:25:37 -040050{
51 struct sysfs_inode_attrs *attrs;
52 struct iattr *iattrs;
53
54 attrs = kzalloc(sizeof(struct sysfs_inode_attrs), GFP_KERNEL);
55 if (!attrs)
56 return NULL;
57 iattrs = &attrs->ia_iattr;
58
59 /* assign default attributes */
60 iattrs->ia_mode = sd->s_mode;
61 iattrs->ia_uid = 0;
62 iattrs->ia_gid = 0;
63 iattrs->ia_atime = iattrs->ia_mtime = iattrs->ia_ctime = CURRENT_TIME;
64
65 return attrs;
66}
Stefan Richterf38506c2009-10-14 20:47:32 +020067
Maneesh Soni988d1862005-05-31 10:39:14 +053068int sysfs_setattr(struct dentry * dentry, struct iattr * iattr)
69{
70 struct inode * inode = dentry->d_inode;
71 struct sysfs_dirent * sd = dentry->d_fsdata;
David P. Quigleyddd29ec2009-09-09 14:25:37 -040072 struct sysfs_inode_attrs *sd_attrs;
73 struct iattr *iattrs;
Maneesh Soni988d1862005-05-31 10:39:14 +053074 unsigned int ia_valid = iattr->ia_valid;
75 int error;
76
77 if (!sd)
78 return -EINVAL;
79
David P. Quigleyddd29ec2009-09-09 14:25:37 -040080 sd_attrs = sd->s_iattr;
Maneesh Soni988d1862005-05-31 10:39:14 +053081
82 error = inode_change_ok(inode, iattr);
83 if (error)
84 return error;
85
Ben Hutchings40a21592008-04-28 15:59:58 +010086 iattr->ia_valid &= ~ATTR_SIZE; /* ignore size changes */
87
Maneesh Soni988d1862005-05-31 10:39:14 +053088 error = inode_setattr(inode, iattr);
89 if (error)
90 return error;
91
David P. Quigleyddd29ec2009-09-09 14:25:37 -040092 if (!sd_attrs) {
Maneesh Soni988d1862005-05-31 10:39:14 +053093 /* setting attributes for the first time, allocate now */
David P. Quigleyddd29ec2009-09-09 14:25:37 -040094 sd_attrs = sysfs_init_inode_attrs(sd);
95 if (!sd_attrs)
Maneesh Soni988d1862005-05-31 10:39:14 +053096 return -ENOMEM;
David P. Quigleyddd29ec2009-09-09 14:25:37 -040097 sd->s_iattr = sd_attrs;
98 } else {
99 /* attributes were changed at least once in past */
100 iattrs = &sd_attrs->ia_iattr;
101
102 if (ia_valid & ATTR_UID)
103 iattrs->ia_uid = iattr->ia_uid;
104 if (ia_valid & ATTR_GID)
105 iattrs->ia_gid = iattr->ia_gid;
106 if (ia_valid & ATTR_ATIME)
107 iattrs->ia_atime = timespec_trunc(iattr->ia_atime,
108 inode->i_sb->s_time_gran);
109 if (ia_valid & ATTR_MTIME)
110 iattrs->ia_mtime = timespec_trunc(iattr->ia_mtime,
111 inode->i_sb->s_time_gran);
112 if (ia_valid & ATTR_CTIME)
113 iattrs->ia_ctime = timespec_trunc(iattr->ia_ctime,
114 inode->i_sb->s_time_gran);
115 if (ia_valid & ATTR_MODE) {
116 umode_t mode = iattr->ia_mode;
117
118 if (!in_group_p(inode->i_gid) && !capable(CAP_FSETID))
119 mode &= ~S_ISGID;
120 iattrs->ia_mode = sd->s_mode = mode;
121 }
Maneesh Soni988d1862005-05-31 10:39:14 +0530122 }
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400123 return error;
124}
Maneesh Soni988d1862005-05-31 10:39:14 +0530125
Eric W. Biedermanf44d3e72009-11-07 23:26:59 -0800126static int sysfs_sd_setsecdata(struct sysfs_dirent *sd, void **secdata, u32 *secdata_len)
127{
128 struct sysfs_inode_attrs *iattrs;
129 void *old_secdata;
130 size_t old_secdata_len;
131
132 iattrs = sd->s_iattr;
133 if (!iattrs)
134 iattrs = sysfs_init_inode_attrs(sd);
135 if (!iattrs)
136 return -ENOMEM;
137
138 old_secdata = iattrs->ia_secdata;
139 old_secdata_len = iattrs->ia_secdata_len;
140
141 iattrs->ia_secdata = *secdata;
142 iattrs->ia_secdata_len = *secdata_len;
143
144 *secdata = old_secdata;
145 *secdata_len = old_secdata_len;
146 return 0;
147}
148
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400149int sysfs_setxattr(struct dentry *dentry, const char *name, const void *value,
150 size_t size, int flags)
151{
152 struct sysfs_dirent *sd = dentry->d_fsdata;
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400153 void *secdata;
154 int error;
155 u32 secdata_len = 0;
Maneesh Soni988d1862005-05-31 10:39:14 +0530156
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400157 if (!sd)
158 return -EINVAL;
Maneesh Soni988d1862005-05-31 10:39:14 +0530159
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400160 if (!strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN)) {
161 const char *suffix = name + XATTR_SECURITY_PREFIX_LEN;
162 error = security_inode_setsecurity(dentry->d_inode, suffix,
163 value, size, flags);
164 if (error)
165 goto out;
166 error = security_inode_getsecctx(dentry->d_inode,
167 &secdata, &secdata_len);
168 if (error)
169 goto out;
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400170
Eric W. Biedermanf44d3e72009-11-07 23:26:59 -0800171 mutex_lock(&sysfs_mutex);
172 error = sysfs_sd_setsecdata(sd, &secdata, &secdata_len);
173 mutex_unlock(&sysfs_mutex);
174
175 if (secdata)
176 security_release_secctx(secdata, secdata_len);
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400177 } else
178 return -EINVAL;
179out:
Maneesh Soni988d1862005-05-31 10:39:14 +0530180 return error;
181}
182
Maneesh Soni82155342005-05-31 10:39:52 +0530183static inline void set_default_inode_attr(struct inode * inode, mode_t mode)
184{
185 inode->i_mode = mode;
Maneesh Soni82155342005-05-31 10:39:52 +0530186 inode->i_atime = inode->i_mtime = inode->i_ctime = CURRENT_TIME;
187}
188
189static inline void set_inode_attr(struct inode * inode, struct iattr * iattr)
190{
191 inode->i_mode = iattr->ia_mode;
192 inode->i_uid = iattr->ia_uid;
193 inode->i_gid = iattr->ia_gid;
194 inode->i_atime = iattr->ia_atime;
195 inode->i_mtime = iattr->ia_mtime;
196 inode->i_ctime = iattr->ia_ctime;
197}
198
Arjan van de Ven232ba9d2006-07-12 09:03:06 -0700199
200/*
201 * sysfs has a different i_mutex lock order behavior for i_mutex than other
202 * filesystems; sysfs i_mutex is called in many places with subsystem locks
203 * held. At the same time, many of the VFS locking rules do not apply to
204 * sysfs at all (cross directory rename for example). To untangle this mess
205 * (which gives false positives in lockdep), we're giving sysfs inodes their
206 * own class for i_mutex.
207 */
208static struct lock_class_key sysfs_inode_imutex_key;
209
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900210static int sysfs_count_nlink(struct sysfs_dirent *sd)
211{
212 struct sysfs_dirent *child;
213 int nr = 0;
214
Tejun Heobc747f32007-09-20 16:05:12 +0900215 for (child = sd->s_dir.children; child; child = child->s_sibling)
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900216 if (sysfs_type(child) == SYSFS_DIR)
217 nr++;
218
219 return nr + 2;
220}
221
Tejun Heobc37e282007-07-18 14:30:28 +0900222static void sysfs_init_inode(struct sysfs_dirent *sd, struct inode *inode)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223{
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900224 struct bin_attribute *bin_attr;
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400225 struct sysfs_inode_attrs *iattrs;
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900226
Eric W. Biederman04256b42009-02-11 13:20:23 -0800227 inode->i_private = sysfs_get(sd);
Tejun Heofc9f54b2007-06-14 03:45:17 +0900228 inode->i_mapping->a_ops = &sysfs_aops;
229 inode->i_mapping->backing_dev_info = &sysfs_backing_dev_info;
230 inode->i_op = &sysfs_inode_operations;
231 inode->i_ino = sd->s_ino;
232 lockdep_set_class(&inode->i_mutex, &sysfs_inode_imutex_key);
Maneesh Soni82155342005-05-31 10:39:52 +0530233
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400234 iattrs = sd->s_iattr;
235 if (iattrs) {
Tejun Heofc9f54b2007-06-14 03:45:17 +0900236 /* sysfs_dirent has non-default attributes
237 * get them for the new inode from persistent copy
238 * in sysfs_dirent
239 */
David P. Quigleyddd29ec2009-09-09 14:25:37 -0400240 set_inode_attr(inode, &iattrs->ia_iattr);
241 if (iattrs->ia_secdata)
242 security_inode_notifysecctx(inode,
243 iattrs->ia_secdata,
244 iattrs->ia_secdata_len);
Tejun Heofc9f54b2007-06-14 03:45:17 +0900245 } else
246 set_default_inode_attr(inode, sd->s_mode);
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900247
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900248 /* initialize inode according to type */
249 switch (sysfs_type(sd)) {
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900250 case SYSFS_DIR:
251 inode->i_op = &sysfs_dir_inode_operations;
252 inode->i_fop = &sysfs_dir_operations;
253 inode->i_nlink = sysfs_count_nlink(sd);
254 break;
255 case SYSFS_KOBJ_ATTR:
256 inode->i_size = PAGE_SIZE;
257 inode->i_fop = &sysfs_file_operations;
258 break;
259 case SYSFS_KOBJ_BIN_ATTR:
Tejun Heob1fc3d62007-09-20 16:05:11 +0900260 bin_attr = sd->s_bin_attr.bin_attr;
Eric W. Biederman372e88b2007-08-20 21:36:29 +0900261 inode->i_size = bin_attr->size;
262 inode->i_fop = &bin_fops;
263 break;
264 case SYSFS_KOBJ_LINK:
265 inode->i_op = &sysfs_symlink_inode_operations;
266 break;
267 default:
268 BUG();
269 }
270
271 unlock_new_inode(inode);
Tejun Heofc9f54b2007-06-14 03:45:17 +0900272}
273
274/**
Tejun Heo8312a8d2007-06-14 03:45:17 +0900275 * sysfs_get_inode - get inode for sysfs_dirent
Tejun Heofc9f54b2007-06-14 03:45:17 +0900276 * @sd: sysfs_dirent to allocate inode for
277 *
Tejun Heo8312a8d2007-06-14 03:45:17 +0900278 * Get inode for @sd. If such inode doesn't exist, a new inode
279 * is allocated and basics are initialized. New inode is
280 * returned locked.
Tejun Heofc9f54b2007-06-14 03:45:17 +0900281 *
282 * LOCKING:
283 * Kernel thread context (may sleep).
284 *
285 * RETURNS:
286 * Pointer to allocated inode on success, NULL on failure.
287 */
Tejun Heo8312a8d2007-06-14 03:45:17 +0900288struct inode * sysfs_get_inode(struct sysfs_dirent *sd)
Tejun Heofc9f54b2007-06-14 03:45:17 +0900289{
290 struct inode *inode;
291
Tejun Heo8312a8d2007-06-14 03:45:17 +0900292 inode = iget_locked(sysfs_sb, sd->s_ino);
293 if (inode && (inode->i_state & I_NEW))
Tejun Heofc9f54b2007-06-14 03:45:17 +0900294 sysfs_init_inode(sd, inode);
295
Linus Torvalds1da177e2005-04-16 15:20:36 -0700296 return inode;
297}
298
Eric W. Biederman04256b42009-02-11 13:20:23 -0800299/*
300 * The sysfs_dirent serves as both an inode and a directory entry for sysfs.
301 * To prevent the sysfs inode numbers from being freed prematurely we take a
302 * reference to sysfs_dirent from the sysfs inode. A
303 * super_operations.delete_inode() implementation is needed to drop that
304 * reference upon inode destruction.
305 */
306void sysfs_delete_inode(struct inode *inode)
307{
308 struct sysfs_dirent *sd = inode->i_private;
309
310 truncate_inode_pages(&inode->i_data, 0);
311 clear_inode(inode);
312 sysfs_put(sd);
313}
314
Tejun Heo608e2662007-06-14 04:27:22 +0900315int sysfs_hash_and_remove(struct sysfs_dirent *dir_sd, const char *name)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700316{
Tejun Heofb6896d2007-06-14 04:27:24 +0900317 struct sysfs_addrm_cxt acxt;
Tejun Heo41fc1c22007-08-02 21:38:03 +0900318 struct sysfs_dirent *sd;
Greg Kroah-Hartman641e6f32006-03-16 15:44:26 -0800319
Tejun Heo608e2662007-06-14 04:27:22 +0900320 if (!dir_sd)
Randy.Dunlap995982c2006-07-10 23:05:25 -0700321 return -ENOENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700322
Tejun Heofb6896d2007-06-14 04:27:24 +0900323 sysfs_addrm_start(&acxt, dir_sd);
Tejun Heo608e2662007-06-14 04:27:22 +0900324
Tejun Heo41fc1c22007-08-02 21:38:03 +0900325 sd = sysfs_find_dirent(dir_sd, name);
326 if (sd)
327 sysfs_remove_one(&acxt, sd);
Tejun Heo3007e992007-06-14 04:27:23 +0900328
Tejun Heo990e53f2007-08-02 21:38:03 +0900329 sysfs_addrm_finish(&acxt);
330
331 if (sd)
Tejun Heofb6896d2007-06-14 04:27:24 +0900332 return 0;
Tejun Heo990e53f2007-08-02 21:38:03 +0900333 else
334 return -ENOENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700335}