blob: fad364548bc9e3716b08dc0f6ca66a58d1f9b56c [file] [log] [blame]
Linus Torvalds1da177e2005-04-16 15:20:36 -07001/*
2 * Copyright (C) International Business Machines Corp., 2000-2004
3 * Copyright (C) Christoph Hellwig, 2002
4 *
5 * This program is free software; you can redistribute it and/or modify
6 * it under the terms of the GNU General Public License as published by
Dave Kleikamp63f83c92006-10-02 09:55:27 -05007 * the Free Software Foundation; either version 2 of the License, or
Linus Torvalds1da177e2005-04-16 15:20:36 -07008 * (at your option) any later version.
Dave Kleikamp63f83c92006-10-02 09:55:27 -05009 *
Linus Torvalds1da177e2005-04-16 15:20:36 -070010 * This program is distributed in the hope that it will be useful,
11 * but WITHOUT ANY WARRANTY; without even the implied warranty of
12 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See
13 * the GNU General Public License for more details.
14 *
15 * You should have received a copy of the GNU General Public License
Dave Kleikamp63f83c92006-10-02 09:55:27 -050016 * along with this program; if not, write to the Free Software
Linus Torvalds1da177e2005-04-16 15:20:36 -070017 * Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
18 */
19
Randy Dunlap16f7e0f2006-01-11 12:17:46 -080020#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070021#include <linux/fs.h>
22#include <linux/xattr.h>
Christoph Hellwig9a59f452005-06-23 00:10:19 -070023#include <linux/posix_acl_xattr.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070024#include <linux/quotaops.h>
Dave Kleikamp1d15b10f2005-09-01 09:05:39 -050025#include <linux/security.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070026#include "jfs_incore.h"
27#include "jfs_superblock.h"
28#include "jfs_dmap.h"
29#include "jfs_debug.h"
30#include "jfs_dinode.h"
31#include "jfs_extent.h"
32#include "jfs_metapage.h"
33#include "jfs_xattr.h"
34#include "jfs_acl.h"
35
/*
 *	jfs_xattr.c: extended attribute service
 *
 * Overall design --
 *
 * Format:
 *
 *   Extended attribute lists (jfs_ea_list) consist of an overall size (32 bit
 *   value) and a variable (0 or more) number of extended attribute
 *   entries.  Each extended attribute entry (jfs_ea) is a <name,value> pair
 *   where <name> is constructed from a null-terminated ascii string
 *   (1 ... 255 bytes in the name) and <value> is arbitrary 8 bit data
 *   (1 ... 65535 bytes).  The in-memory format is
 *
 *   0       1        2        4                4 + namelen + 1
 *   +-------+--------+--------+----------------+-------------------+
 *   | Flags | Name   | Value  | Name String \0 | Data . . . .      |
 *   |       | Length | Length |                |                   |
 *   +-------+--------+--------+----------------+-------------------+
 *
 *   A jfs_ea_list then is structured as
 *
 *   0            4                   4 + EA_SIZE(ea1)
 *   +------------+-------------------+--------------------+-----
 *   | Overall EA | First FEA Element | Second FEA Element | .....
 *   | List Size  |                   |                    |
 *   +------------+-------------------+--------------------+-----
 *
 * On-disk:
 *
 *   FEALISTs are stored on disk using blocks allocated by dbAlloc() and
 *   written directly.  An EA list may be in-lined in the inode if there is
 *   sufficient room available.
 */
70
71struct ea_buffer {
72 int flag; /* Indicates what storage xattr points to */
73 int max_size; /* largest xattr that fits in current buffer */
74 dxd_t new_ea; /* dxd to replace ea when modifying xattr */
75 struct metapage *mp; /* metapage containing ea list */
76 struct jfs_ea_list *xattr; /* buffer containing ea list */
77};
78
79/*
80 * ea_buffer.flag values
81 */
82#define EA_INLINE 0x0001
83#define EA_EXTENT 0x0002
84#define EA_NEW 0x0004
85#define EA_MALLOC 0x0008
86
Linus Torvalds1da177e2005-04-16 15:20:36 -070087
88/*
89 * These three routines are used to recognize on-disk extended attributes
90 * that are in a recognized namespace. If the attribute is not recognized,
91 * "os2." is prepended to the name
92 */
93static inline int is_os2_xattr(struct jfs_ea *ea)
94{
95 /*
96 * Check for "system."
97 */
98 if ((ea->namelen >= XATTR_SYSTEM_PREFIX_LEN) &&
99 !strncmp(ea->name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
Richard Knutsson4d817152006-09-30 23:27:14 -0700100 return false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700101 /*
102 * Check for "user."
103 */
104 if ((ea->namelen >= XATTR_USER_PREFIX_LEN) &&
105 !strncmp(ea->name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN))
Richard Knutsson4d817152006-09-30 23:27:14 -0700106 return false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700107 /*
108 * Check for "security."
109 */
110 if ((ea->namelen >= XATTR_SECURITY_PREFIX_LEN) &&
111 !strncmp(ea->name, XATTR_SECURITY_PREFIX,
112 XATTR_SECURITY_PREFIX_LEN))
Richard Knutsson4d817152006-09-30 23:27:14 -0700113 return false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700114 /*
115 * Check for "trusted."
116 */
117 if ((ea->namelen >= XATTR_TRUSTED_PREFIX_LEN) &&
118 !strncmp(ea->name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN))
Richard Knutsson4d817152006-09-30 23:27:14 -0700119 return false;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700120 /*
121 * Add any other valid namespace prefixes here
122 */
123
124 /*
125 * We assume it's OS/2's flat namespace
126 */
Richard Knutsson4d817152006-09-30 23:27:14 -0700127 return true;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700128}
129
130static inline int name_size(struct jfs_ea *ea)
131{
132 if (is_os2_xattr(ea))
133 return ea->namelen + XATTR_OS2_PREFIX_LEN;
134 else
135 return ea->namelen;
136}
137
138static inline int copy_name(char *buffer, struct jfs_ea *ea)
139{
140 int len = ea->namelen;
141
142 if (is_os2_xattr(ea)) {
143 memcpy(buffer, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN);
144 buffer += XATTR_OS2_PREFIX_LEN;
145 len += XATTR_OS2_PREFIX_LEN;
146 }
147 memcpy(buffer, ea->name, ea->namelen);
148 buffer[ea->namelen] = 0;
149
150 return len;
151}
152
153/* Forward references */
154static void ea_release(struct inode *inode, struct ea_buffer *ea_buf);
155
156/*
157 * NAME: ea_write_inline
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500158 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700159 * FUNCTION: Attempt to write an EA inline if area is available
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500160 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700161 * PRE CONDITIONS:
162 * Already verified that the specified EA is small enough to fit inline
163 *
164 * PARAMETERS:
165 * ip - Inode pointer
166 * ealist - EA list pointer
167 * size - size of ealist in bytes
168 * ea - dxd_t structure to be filled in with necessary EA information
169 * if we successfully copy the EA inline
170 *
171 * NOTES:
172 * Checks if the inode's inline area is available. If so, copies EA inline
173 * and sets <ea> fields appropriately. Otherwise, returns failure, EA will
174 * have to be put into an extent.
175 *
176 * RETURNS: 0 for successful copy to inline area; -1 if area not available
177 */
178static int ea_write_inline(struct inode *ip, struct jfs_ea_list *ealist,
179 int size, dxd_t * ea)
180{
181 struct jfs_inode_info *ji = JFS_IP(ip);
182
183 /*
184 * Make sure we have an EA -- the NULL EA list is valid, but you
185 * can't copy it!
186 */
187 if (ealist && size > sizeof (struct jfs_ea_list)) {
188 assert(size <= sizeof (ji->i_inline_ea));
189
190 /*
191 * See if the space is available or if it is already being
192 * used for an inline EA.
193 */
194 if (!(ji->mode2 & INLINEEA) && !(ji->ea.flag & DXD_INLINE))
195 return -EPERM;
196
197 DXDsize(ea, size);
198 DXDlength(ea, 0);
199 DXDaddress(ea, 0);
200 memcpy(ji->i_inline_ea, ealist, size);
201 ea->flag = DXD_INLINE;
202 ji->mode2 &= ~INLINEEA;
203 } else {
204 ea->flag = 0;
205 DXDsize(ea, 0);
206 DXDlength(ea, 0);
207 DXDaddress(ea, 0);
208
209 /* Free up INLINE area */
210 if (ji->ea.flag & DXD_INLINE)
211 ji->mode2 |= INLINEEA;
212 }
213
214 return 0;
215}
216
217/*
218 * NAME: ea_write
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500219 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700220 * FUNCTION: Write an EA for an inode
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500221 *
222 * PRE CONDITIONS: EA has been verified
Linus Torvalds1da177e2005-04-16 15:20:36 -0700223 *
224 * PARAMETERS:
225 * ip - Inode pointer
226 * ealist - EA list pointer
227 * size - size of ealist in bytes
228 * ea - dxd_t structure to be filled in appropriately with where the
229 * EA was copied
230 *
231 * NOTES: Will write EA inline if able to, otherwise allocates blocks for an
232 * extent and synchronously writes it to those blocks.
233 *
234 * RETURNS: 0 for success; Anything else indicates failure
235 */
236static int ea_write(struct inode *ip, struct jfs_ea_list *ealist, int size,
237 dxd_t * ea)
238{
239 struct super_block *sb = ip->i_sb;
240 struct jfs_inode_info *ji = JFS_IP(ip);
241 struct jfs_sb_info *sbi = JFS_SBI(sb);
242 int nblocks;
243 s64 blkno;
244 int rc = 0, i;
245 char *cp;
246 s32 nbytes, nb;
247 s32 bytes_to_write;
248 struct metapage *mp;
249
250 /*
251 * Quick check to see if this is an in-linable EA. Short EAs
252 * and empty EAs are all in-linable, provided the space exists.
253 */
254 if (!ealist || size <= sizeof (ji->i_inline_ea)) {
255 if (!ea_write_inline(ip, ealist, size, ea))
256 return 0;
257 }
258
259 /* figure out how many blocks we need */
260 nblocks = (size + (sb->s_blocksize - 1)) >> sb->s_blocksize_bits;
261
262 /* Allocate new blocks to quota. */
Jan Karac94d2a22009-01-26 17:22:32 +0100263 if (vfs_dq_alloc_block(ip, nblocks)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700264 return -EDQUOT;
265 }
266
267 rc = dbAlloc(ip, INOHINT(ip), nblocks, &blkno);
268 if (rc) {
269 /*Rollback quota allocation. */
Jan Karac94d2a22009-01-26 17:22:32 +0100270 vfs_dq_free_block(ip, nblocks);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700271 return rc;
272 }
273
274 /*
275 * Now have nblocks worth of storage to stuff into the FEALIST.
276 * loop over the FEALIST copying data into the buffer one page at
277 * a time.
278 */
279 cp = (char *) ealist;
280 nbytes = size;
281 for (i = 0; i < nblocks; i += sbi->nbperpage) {
282 /*
283 * Determine how many bytes for this request, and round up to
284 * the nearest aggregate block size
285 */
286 nb = min(PSIZE, nbytes);
287 bytes_to_write =
288 ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
289 << sb->s_blocksize_bits;
290
291 if (!(mp = get_metapage(ip, blkno + i, bytes_to_write, 1))) {
292 rc = -EIO;
293 goto failed;
294 }
295
296 memcpy(mp->data, cp, nb);
297
298 /*
299 * We really need a way to propagate errors for
300 * forced writes like this one. --hch
301 *
302 * (__write_metapage => release_metapage => flush_metapage)
303 */
304#ifdef _JFS_FIXME
305 if ((rc = flush_metapage(mp))) {
306 /*
307 * the write failed -- this means that the buffer
308 * is still assigned and the blocks are not being
309 * used. this seems like the best error recovery
310 * we can get ...
311 */
312 goto failed;
313 }
314#else
315 flush_metapage(mp);
316#endif
317
318 cp += PSIZE;
319 nbytes -= nb;
320 }
321
322 ea->flag = DXD_EXTENT;
323 DXDsize(ea, le32_to_cpu(ealist->size));
324 DXDlength(ea, nblocks);
325 DXDaddress(ea, blkno);
326
327 /* Free up INLINE area */
328 if (ji->ea.flag & DXD_INLINE)
329 ji->mode2 |= INLINEEA;
330
331 return 0;
332
333 failed:
334 /* Rollback quota allocation. */
Jan Karac94d2a22009-01-26 17:22:32 +0100335 vfs_dq_free_block(ip, nblocks);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700336
337 dbFree(ip, blkno, nblocks);
338 return rc;
339}
340
341/*
342 * NAME: ea_read_inline
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500343 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700344 * FUNCTION: Read an inlined EA into user's buffer
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500345 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700346 * PARAMETERS:
347 * ip - Inode pointer
348 * ealist - Pointer to buffer to fill in with EA
349 *
350 * RETURNS: 0
351 */
352static int ea_read_inline(struct inode *ip, struct jfs_ea_list *ealist)
353{
354 struct jfs_inode_info *ji = JFS_IP(ip);
355 int ea_size = sizeDXD(&ji->ea);
356
357 if (ea_size == 0) {
358 ealist->size = 0;
359 return 0;
360 }
361
362 /* Sanity Check */
363 if ((sizeDXD(&ji->ea) > sizeof (ji->i_inline_ea)))
364 return -EIO;
365 if (le32_to_cpu(((struct jfs_ea_list *) &ji->i_inline_ea)->size)
366 != ea_size)
367 return -EIO;
368
369 memcpy(ealist, ji->i_inline_ea, ea_size);
370 return 0;
371}
372
373/*
374 * NAME: ea_read
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500375 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700376 * FUNCTION: copy EA data into user's buffer
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500377 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700378 * PARAMETERS:
379 * ip - Inode pointer
380 * ealist - Pointer to buffer to fill in with EA
381 *
382 * NOTES: If EA is inline calls ea_read_inline() to copy EA.
383 *
384 * RETURNS: 0 for success; other indicates failure
385 */
386static int ea_read(struct inode *ip, struct jfs_ea_list *ealist)
387{
388 struct super_block *sb = ip->i_sb;
389 struct jfs_inode_info *ji = JFS_IP(ip);
390 struct jfs_sb_info *sbi = JFS_SBI(sb);
391 int nblocks;
392 s64 blkno;
393 char *cp = (char *) ealist;
394 int i;
395 int nbytes, nb;
396 s32 bytes_to_read;
397 struct metapage *mp;
398
399 /* quick check for in-line EA */
400 if (ji->ea.flag & DXD_INLINE)
401 return ea_read_inline(ip, ealist);
402
403 nbytes = sizeDXD(&ji->ea);
404 if (!nbytes) {
405 jfs_error(sb, "ea_read: nbytes is 0");
406 return -EIO;
407 }
408
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500409 /*
Linus Torvalds1da177e2005-04-16 15:20:36 -0700410 * Figure out how many blocks were allocated when this EA list was
411 * originally written to disk.
412 */
413 nblocks = lengthDXD(&ji->ea) << sbi->l2nbperpage;
414 blkno = addressDXD(&ji->ea) << sbi->l2nbperpage;
415
416 /*
417 * I have found the disk blocks which were originally used to store
418 * the FEALIST. now i loop over each contiguous block copying the
419 * data into the buffer.
420 */
421 for (i = 0; i < nblocks; i += sbi->nbperpage) {
422 /*
423 * Determine how many bytes for this request, and round up to
424 * the nearest aggregate block size
425 */
426 nb = min(PSIZE, nbytes);
427 bytes_to_read =
428 ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
429 << sb->s_blocksize_bits;
430
431 if (!(mp = read_metapage(ip, blkno + i, bytes_to_read, 1)))
432 return -EIO;
433
434 memcpy(cp, mp->data, nb);
435 release_metapage(mp);
436
437 cp += PSIZE;
438 nbytes -= nb;
439 }
440
441 return 0;
442}
443
444/*
445 * NAME: ea_get
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500446 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700447 * FUNCTION: Returns buffer containing existing extended attributes.
448 * The size of the buffer will be the larger of the existing
449 * attributes size, or min_size.
450 *
451 * The buffer, which may be inlined in the inode or in the
Dave Kleikamp63f83c92006-10-02 09:55:27 -0500452 * page cache must be release by calling ea_release or ea_put
453 *
Linus Torvalds1da177e2005-04-16 15:20:36 -0700454 * PARAMETERS:
455 * inode - Inode pointer
456 * ea_buf - Structure to be populated with ealist and its metadata
457 * min_size- minimum size of buffer to be returned
458 *
459 * RETURNS: 0 for success; Other indicates failure
460 */
461static int ea_get(struct inode *inode, struct ea_buffer *ea_buf, int min_size)
462{
463 struct jfs_inode_info *ji = JFS_IP(inode);
464 struct super_block *sb = inode->i_sb;
465 int size;
466 int ea_size = sizeDXD(&ji->ea);
467 int blocks_needed, current_blocks;
468 s64 blkno;
469 int rc;
470 int quota_allocation = 0;
471
472 /* When fsck.jfs clears a bad ea, it doesn't clear the size */
473 if (ji->ea.flag == 0)
474 ea_size = 0;
475
476 if (ea_size == 0) {
477 if (min_size == 0) {
478 ea_buf->flag = 0;
479 ea_buf->max_size = 0;
480 ea_buf->xattr = NULL;
481 return 0;
482 }
483 if ((min_size <= sizeof (ji->i_inline_ea)) &&
484 (ji->mode2 & INLINEEA)) {
485 ea_buf->flag = EA_INLINE | EA_NEW;
486 ea_buf->max_size = sizeof (ji->i_inline_ea);
487 ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
488 DXDlength(&ea_buf->new_ea, 0);
489 DXDaddress(&ea_buf->new_ea, 0);
490 ea_buf->new_ea.flag = DXD_INLINE;
491 DXDsize(&ea_buf->new_ea, min_size);
492 return 0;
493 }
494 current_blocks = 0;
495 } else if (ji->ea.flag & DXD_INLINE) {
496 if (min_size <= sizeof (ji->i_inline_ea)) {
497 ea_buf->flag = EA_INLINE;
498 ea_buf->max_size = sizeof (ji->i_inline_ea);
499 ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
500 goto size_check;
501 }
502 current_blocks = 0;
503 } else {
504 if (!(ji->ea.flag & DXD_EXTENT)) {
505 jfs_error(sb, "ea_get: invalid ea.flag)");
506 return -EIO;
507 }
508 current_blocks = (ea_size + sb->s_blocksize - 1) >>
509 sb->s_blocksize_bits;
510 }
511 size = max(min_size, ea_size);
512
513 if (size > PSIZE) {
514 /*
515 * To keep the rest of the code simple. Allocate a
516 * contiguous buffer to work with
517 */
518 ea_buf->xattr = kmalloc(size, GFP_KERNEL);
519 if (ea_buf->xattr == NULL)
520 return -ENOMEM;
521
522 ea_buf->flag = EA_MALLOC;
523 ea_buf->max_size = (size + sb->s_blocksize - 1) &
524 ~(sb->s_blocksize - 1);
525
526 if (ea_size == 0)
527 return 0;
528
529 if ((rc = ea_read(inode, ea_buf->xattr))) {
530 kfree(ea_buf->xattr);
531 ea_buf->xattr = NULL;
532 return rc;
533 }
534 goto size_check;
535 }
536 blocks_needed = (min_size + sb->s_blocksize - 1) >>
537 sb->s_blocksize_bits;
538
539 if (blocks_needed > current_blocks) {
540 /* Allocate new blocks to quota. */
Jan Karac94d2a22009-01-26 17:22:32 +0100541 if (vfs_dq_alloc_block(inode, blocks_needed))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700542 return -EDQUOT;
543
544 quota_allocation = blocks_needed;
545
546 rc = dbAlloc(inode, INOHINT(inode), (s64) blocks_needed,
547 &blkno);
548 if (rc)
549 goto clean_up;
550
551 DXDlength(&ea_buf->new_ea, blocks_needed);
552 DXDaddress(&ea_buf->new_ea, blkno);
553 ea_buf->new_ea.flag = DXD_EXTENT;
554 DXDsize(&ea_buf->new_ea, min_size);
555
556 ea_buf->flag = EA_EXTENT | EA_NEW;
557
558 ea_buf->mp = get_metapage(inode, blkno,
559 blocks_needed << sb->s_blocksize_bits,
560 1);
561 if (ea_buf->mp == NULL) {
562 dbFree(inode, blkno, (s64) blocks_needed);
563 rc = -EIO;
564 goto clean_up;
565 }
566 ea_buf->xattr = ea_buf->mp->data;
567 ea_buf->max_size = (min_size + sb->s_blocksize - 1) &
568 ~(sb->s_blocksize - 1);
569 if (ea_size == 0)
570 return 0;
571 if ((rc = ea_read(inode, ea_buf->xattr))) {
572 discard_metapage(ea_buf->mp);
573 dbFree(inode, blkno, (s64) blocks_needed);
574 goto clean_up;
575 }
576 goto size_check;
577 }
578 ea_buf->flag = EA_EXTENT;
579 ea_buf->mp = read_metapage(inode, addressDXD(&ji->ea),
580 lengthDXD(&ji->ea) << sb->s_blocksize_bits,
581 1);
582 if (ea_buf->mp == NULL) {
583 rc = -EIO;
584 goto clean_up;
585 }
586 ea_buf->xattr = ea_buf->mp->data;
587 ea_buf->max_size = (ea_size + sb->s_blocksize - 1) &
588 ~(sb->s_blocksize - 1);
589
590 size_check:
591 if (EALIST_SIZE(ea_buf->xattr) != ea_size) {
592 printk(KERN_ERR "ea_get: invalid extended attribute\n");
Dave Kleikamp288e4d82007-06-13 10:17:50 -0500593 print_hex_dump(KERN_ERR, "", DUMP_PREFIX_ADDRESS, 16, 1,
594 ea_buf->xattr, ea_size, 1);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700595 ea_release(inode, ea_buf);
596 rc = -EIO;
597 goto clean_up;
598 }
599
600 return ea_size;
601
602 clean_up:
603 /* Rollback quota allocation */
604 if (quota_allocation)
Jan Karac94d2a22009-01-26 17:22:32 +0100605 vfs_dq_free_block(inode, quota_allocation);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700606
607 return (rc);
608}
609
610static void ea_release(struct inode *inode, struct ea_buffer *ea_buf)
611{
612 if (ea_buf->flag & EA_MALLOC)
613 kfree(ea_buf->xattr);
614 else if (ea_buf->flag & EA_EXTENT) {
615 assert(ea_buf->mp);
616 release_metapage(ea_buf->mp);
617
618 if (ea_buf->flag & EA_NEW)
619 dbFree(inode, addressDXD(&ea_buf->new_ea),
620 lengthDXD(&ea_buf->new_ea));
621 }
622}
623
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500624static int ea_put(tid_t tid, struct inode *inode, struct ea_buffer *ea_buf,
625 int new_size)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700626{
627 struct jfs_inode_info *ji = JFS_IP(inode);
628 unsigned long old_blocks, new_blocks;
629 int rc = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700630
631 if (new_size == 0) {
632 ea_release(inode, ea_buf);
633 ea_buf = NULL;
634 } else if (ea_buf->flag & EA_INLINE) {
635 assert(new_size <= sizeof (ji->i_inline_ea));
636 ji->mode2 &= ~INLINEEA;
637 ea_buf->new_ea.flag = DXD_INLINE;
638 DXDsize(&ea_buf->new_ea, new_size);
639 DXDaddress(&ea_buf->new_ea, 0);
640 DXDlength(&ea_buf->new_ea, 0);
641 } else if (ea_buf->flag & EA_MALLOC) {
642 rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
643 kfree(ea_buf->xattr);
644 } else if (ea_buf->flag & EA_NEW) {
645 /* We have already allocated a new dxd */
646 flush_metapage(ea_buf->mp);
647 } else {
648 /* ->xattr must point to original ea's metapage */
649 rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
650 discard_metapage(ea_buf->mp);
651 }
652 if (rc)
653 return rc;
654
Linus Torvalds1da177e2005-04-16 15:20:36 -0700655 old_blocks = new_blocks = 0;
656
657 if (ji->ea.flag & DXD_EXTENT) {
658 invalidate_dxd_metapages(inode, ji->ea);
659 old_blocks = lengthDXD(&ji->ea);
660 }
661
662 if (ea_buf) {
663 txEA(tid, inode, &ji->ea, &ea_buf->new_ea);
664 if (ea_buf->new_ea.flag & DXD_EXTENT) {
665 new_blocks = lengthDXD(&ea_buf->new_ea);
666 if (ji->ea.flag & DXD_INLINE)
667 ji->mode2 |= INLINEEA;
668 }
669 ji->ea = ea_buf->new_ea;
670 } else {
671 txEA(tid, inode, &ji->ea, NULL);
672 if (ji->ea.flag & DXD_INLINE)
673 ji->mode2 |= INLINEEA;
674 ji->ea.flag = 0;
675 ji->ea.size = 0;
676 }
677
678 /* If old blocks exist, they must be removed from quota allocation. */
679 if (old_blocks)
Jan Karac94d2a22009-01-26 17:22:32 +0100680 vfs_dq_free_block(inode, old_blocks);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700681
682 inode->i_ctime = CURRENT_TIME;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700683
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500684 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700685}
686
687/*
688 * can_set_system_xattr
689 *
690 * This code is specific to the system.* namespace. It contains policy
691 * which doesn't belong in the main xattr codepath.
692 */
693static int can_set_system_xattr(struct inode *inode, const char *name,
694 const void *value, size_t value_len)
695{
696#ifdef CONFIG_JFS_POSIX_ACL
697 struct posix_acl *acl;
698 int rc;
699
Satyam Sharma3bd858a2007-07-17 15:00:08 +0530700 if (!is_owner_or_cap(inode))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700701 return -EPERM;
702
703 /*
Christoph Hellwig9a59f452005-06-23 00:10:19 -0700704 * POSIX_ACL_XATTR_ACCESS is tied to i_mode
Linus Torvalds1da177e2005-04-16 15:20:36 -0700705 */
Christoph Hellwig9a59f452005-06-23 00:10:19 -0700706 if (strcmp(name, POSIX_ACL_XATTR_ACCESS) == 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700707 acl = posix_acl_from_xattr(value, value_len);
708 if (IS_ERR(acl)) {
709 rc = PTR_ERR(acl);
710 printk(KERN_ERR "posix_acl_from_xattr returned %d\n",
711 rc);
712 return rc;
713 }
714 if (acl) {
715 mode_t mode = inode->i_mode;
716 rc = posix_acl_equiv_mode(acl, &mode);
717 posix_acl_release(acl);
718 if (rc < 0) {
719 printk(KERN_ERR
720 "posix_acl_equiv_mode returned %d\n",
721 rc);
722 return rc;
723 }
724 inode->i_mode = mode;
725 mark_inode_dirty(inode);
726 }
727 /*
728 * We're changing the ACL. Get rid of the cached one
729 */
Al Viro073aaa12009-06-09 12:11:54 -0400730 forget_cached_acl(inode, ACL_TYPE_ACCESS);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700731
732 return 0;
Christoph Hellwig9a59f452005-06-23 00:10:19 -0700733 } else if (strcmp(name, POSIX_ACL_XATTR_DEFAULT) == 0) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700734 acl = posix_acl_from_xattr(value, value_len);
735 if (IS_ERR(acl)) {
736 rc = PTR_ERR(acl);
737 printk(KERN_ERR "posix_acl_from_xattr returned %d\n",
738 rc);
739 return rc;
740 }
741 posix_acl_release(acl);
742
743 /*
744 * We're changing the default ACL. Get rid of the cached one
745 */
Al Viro073aaa12009-06-09 12:11:54 -0400746 forget_cached_acl(inode, ACL_TYPE_DEFAULT);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700747
748 return 0;
749 }
750#endif /* CONFIG_JFS_POSIX_ACL */
751 return -EOPNOTSUPP;
752}
753
Dave Kleikampd572b872006-11-02 10:50:40 -0600754/*
755 * Most of the permission checking is done by xattr_permission in the vfs.
756 * The local file system is responsible for handling the system.* namespace.
757 * We also need to verify that this is a namespace that we recognize.
758 */
Linus Torvalds1da177e2005-04-16 15:20:36 -0700759static int can_set_xattr(struct inode *inode, const char *name,
760 const void *value, size_t value_len)
761{
Christoph Hellwig44a00332006-01-09 20:51:57 -0800762 if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700763 return can_set_system_xattr(inode, name, value, value_len);
764
Christoph Hellwig44a00332006-01-09 20:51:57 -0800765 /*
766 * Don't allow setting an attribute in an unknown namespace.
767 */
768 if (strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) &&
769 strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
770 strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN) &&
771 strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN))
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772 return -EOPNOTSUPP;
773
Christoph Hellwig44a00332006-01-09 20:51:57 -0800774 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775}
776
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500777int __jfs_setxattr(tid_t tid, struct inode *inode, const char *name,
778 const void *value, size_t value_len, int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700779{
780 struct jfs_ea_list *ealist;
781 struct jfs_ea *ea, *old_ea = NULL, *next_ea = NULL;
782 struct ea_buffer ea_buf;
783 int old_ea_size = 0;
784 int xattr_size;
785 int new_size;
786 int namelen = strlen(name);
787 char *os2name = NULL;
788 int found = 0;
789 int rc;
790 int length;
791
Linus Torvalds1da177e2005-04-16 15:20:36 -0700792 if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
793 os2name = kmalloc(namelen - XATTR_OS2_PREFIX_LEN + 1,
794 GFP_KERNEL);
795 if (!os2name)
796 return -ENOMEM;
797 strcpy(os2name, name + XATTR_OS2_PREFIX_LEN);
798 name = os2name;
799 namelen -= XATTR_OS2_PREFIX_LEN;
800 }
801
802 down_write(&JFS_IP(inode)->xattr_sem);
803
804 xattr_size = ea_get(inode, &ea_buf, 0);
805 if (xattr_size < 0) {
806 rc = xattr_size;
807 goto out;
808 }
809
810 again:
811 ealist = (struct jfs_ea_list *) ea_buf.xattr;
812 new_size = sizeof (struct jfs_ea_list);
813
814 if (xattr_size) {
815 for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist);
816 ea = NEXT_EA(ea)) {
817 if ((namelen == ea->namelen) &&
818 (memcmp(name, ea->name, namelen) == 0)) {
819 found = 1;
820 if (flags & XATTR_CREATE) {
821 rc = -EEXIST;
822 goto release;
823 }
824 old_ea = ea;
825 old_ea_size = EA_SIZE(ea);
826 next_ea = NEXT_EA(ea);
827 } else
828 new_size += EA_SIZE(ea);
829 }
830 }
831
832 if (!found) {
833 if (flags & XATTR_REPLACE) {
834 rc = -ENODATA;
835 goto release;
836 }
837 if (value == NULL) {
838 rc = 0;
839 goto release;
840 }
841 }
842 if (value)
843 new_size += sizeof (struct jfs_ea) + namelen + 1 + value_len;
844
845 if (new_size > ea_buf.max_size) {
846 /*
847 * We need to allocate more space for merged ea list.
848 * We should only have loop to again: once.
849 */
850 ea_release(inode, &ea_buf);
851 xattr_size = ea_get(inode, &ea_buf, new_size);
852 if (xattr_size < 0) {
853 rc = xattr_size;
854 goto out;
855 }
856 goto again;
857 }
858
859 /* Remove old ea of the same name */
860 if (found) {
861 /* number of bytes following target EA */
862 length = (char *) END_EALIST(ealist) - (char *) next_ea;
863 if (length > 0)
864 memmove(old_ea, next_ea, length);
865 xattr_size -= old_ea_size;
866 }
867
868 /* Add new entry to the end */
869 if (value) {
870 if (xattr_size == 0)
871 /* Completely new ea list */
872 xattr_size = sizeof (struct jfs_ea_list);
873
874 ea = (struct jfs_ea *) ((char *) ealist + xattr_size);
875 ea->flag = 0;
876 ea->namelen = namelen;
877 ea->valuelen = (cpu_to_le16(value_len));
878 memcpy(ea->name, name, namelen);
879 ea->name[namelen] = 0;
880 if (value_len)
881 memcpy(&ea->name[namelen + 1], value, value_len);
882 xattr_size += EA_SIZE(ea);
883 }
884
885 /* DEBUG - If we did this right, these number match */
886 if (xattr_size != new_size) {
887 printk(KERN_ERR
888 "jfs_xsetattr: xattr_size = %d, new_size = %d\n",
889 xattr_size, new_size);
890
891 rc = -EINVAL;
892 goto release;
893 }
894
895 /*
896 * If we're left with an empty list, there's no ea
897 */
898 if (new_size == sizeof (struct jfs_ea_list))
899 new_size = 0;
900
901 ealist->size = cpu_to_le32(new_size);
902
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500903 rc = ea_put(tid, inode, &ea_buf, new_size);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700904
905 goto out;
906 release:
907 ea_release(inode, &ea_buf);
908 out:
909 up_write(&JFS_IP(inode)->xattr_sem);
910
Jesper Juhl259692b2005-05-09 10:47:14 -0500911 kfree(os2name);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700912
913 return rc;
914}
915
916int jfs_setxattr(struct dentry *dentry, const char *name, const void *value,
917 size_t value_len, int flags)
918{
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500919 struct inode *inode = dentry->d_inode;
920 struct jfs_inode_info *ji = JFS_IP(inode);
921 int rc;
922 tid_t tid;
923
924 if ((rc = can_set_xattr(inode, name, value, value_len)))
925 return rc;
926
Linus Torvalds1da177e2005-04-16 15:20:36 -0700927 if (value == NULL) { /* empty EA, do not remove */
928 value = "";
929 value_len = 0;
930 }
931
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500932 tid = txBegin(inode->i_sb, 0);
Ingo Molnar1de87442006-01-24 15:22:50 -0600933 mutex_lock(&ji->commit_mutex);
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500934 rc = __jfs_setxattr(tid, dentry->d_inode, name, value, value_len,
935 flags);
936 if (!rc)
937 rc = txCommit(tid, 1, &inode, 0);
938 txEnd(tid);
Ingo Molnar1de87442006-01-24 15:22:50 -0600939 mutex_unlock(&ji->commit_mutex);
Dave Kleikamp4f4b4012005-09-01 09:02:43 -0500940
941 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700942}
943
Linus Torvalds1da177e2005-04-16 15:20:36 -0700944ssize_t __jfs_getxattr(struct inode *inode, const char *name, void *data,
945 size_t buf_size)
946{
947 struct jfs_ea_list *ealist;
948 struct jfs_ea *ea;
949 struct ea_buffer ea_buf;
950 int xattr_size;
951 ssize_t size;
952 int namelen = strlen(name);
953 char *os2name = NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700954 char *value;
955
Linus Torvalds1da177e2005-04-16 15:20:36 -0700956 if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
957 os2name = kmalloc(namelen - XATTR_OS2_PREFIX_LEN + 1,
958 GFP_KERNEL);
959 if (!os2name)
960 return -ENOMEM;
961 strcpy(os2name, name + XATTR_OS2_PREFIX_LEN);
962 name = os2name;
963 namelen -= XATTR_OS2_PREFIX_LEN;
964 }
965
966 down_read(&JFS_IP(inode)->xattr_sem);
967
968 xattr_size = ea_get(inode, &ea_buf, 0);
969
970 if (xattr_size < 0) {
971 size = xattr_size;
972 goto out;
973 }
974
975 if (xattr_size == 0)
976 goto not_found;
977
978 ealist = (struct jfs_ea_list *) ea_buf.xattr;
979
980 /* Find the named attribute */
981 for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea))
982 if ((namelen == ea->namelen) &&
983 memcmp(name, ea->name, namelen) == 0) {
984 /* Found it */
985 size = le16_to_cpu(ea->valuelen);
986 if (!data)
987 goto release;
988 else if (size > buf_size) {
989 size = -ERANGE;
990 goto release;
991 }
992 value = ((char *) &ea->name) + ea->namelen + 1;
993 memcpy(data, value, size);
994 goto release;
995 }
996 not_found:
997 size = -ENODATA;
998 release:
999 ea_release(inode, &ea_buf);
1000 out:
1001 up_read(&JFS_IP(inode)->xattr_sem);
1002
Jesper Juhl259692b2005-05-09 10:47:14 -05001003 kfree(os2name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001004
1005 return size;
1006}
1007
1008ssize_t jfs_getxattr(struct dentry *dentry, const char *name, void *data,
1009 size_t buf_size)
1010{
1011 int err;
1012
1013 err = __jfs_getxattr(dentry->d_inode, name, data, buf_size);
1014
1015 return err;
1016}
1017
1018/*
1019 * No special permissions are needed to list attributes except for trusted.*
1020 */
1021static inline int can_list(struct jfs_ea *ea)
1022{
1023 return (strncmp(ea->name, XATTR_TRUSTED_PREFIX,
1024 XATTR_TRUSTED_PREFIX_LEN) ||
1025 capable(CAP_SYS_ADMIN));
1026}
1027
1028ssize_t jfs_listxattr(struct dentry * dentry, char *data, size_t buf_size)
1029{
1030 struct inode *inode = dentry->d_inode;
1031 char *buffer;
1032 ssize_t size = 0;
1033 int xattr_size;
1034 struct jfs_ea_list *ealist;
1035 struct jfs_ea *ea;
1036 struct ea_buffer ea_buf;
1037
1038 down_read(&JFS_IP(inode)->xattr_sem);
1039
1040 xattr_size = ea_get(inode, &ea_buf, 0);
1041 if (xattr_size < 0) {
1042 size = xattr_size;
1043 goto out;
1044 }
1045
1046 if (xattr_size == 0)
1047 goto release;
1048
1049 ealist = (struct jfs_ea_list *) ea_buf.xattr;
1050
1051 /* compute required size of list */
1052 for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
Dave Kleikamp63f83c92006-10-02 09:55:27 -05001053 if (can_list(ea))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001054 size += name_size(ea) + 1;
1055 }
1056
1057 if (!data)
1058 goto release;
1059
1060 if (size > buf_size) {
1061 size = -ERANGE;
1062 goto release;
1063 }
1064
1065 /* Copy attribute names to buffer */
1066 buffer = data;
1067 for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
Dave Kleikamp63f83c92006-10-02 09:55:27 -05001068 if (can_list(ea)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001069 int namelen = copy_name(buffer, ea);
1070 buffer += namelen + 1;
1071 }
1072 }
1073
1074 release:
1075 ea_release(inode, &ea_buf);
1076 out:
1077 up_read(&JFS_IP(inode)->xattr_sem);
1078 return size;
1079}
1080
1081int jfs_removexattr(struct dentry *dentry, const char *name)
1082{
Dave Kleikamp4f4b4012005-09-01 09:02:43 -05001083 struct inode *inode = dentry->d_inode;
1084 struct jfs_inode_info *ji = JFS_IP(inode);
1085 int rc;
1086 tid_t tid;
1087
1088 if ((rc = can_set_xattr(inode, name, NULL, 0)))
1089 return rc;
1090
1091 tid = txBegin(inode->i_sb, 0);
Ingo Molnar1de87442006-01-24 15:22:50 -06001092 mutex_lock(&ji->commit_mutex);
Dave Kleikamp4f4b4012005-09-01 09:02:43 -05001093 rc = __jfs_setxattr(tid, dentry->d_inode, name, NULL, 0, XATTR_REPLACE);
1094 if (!rc)
1095 rc = txCommit(tid, 1, &inode, 0);
1096 txEnd(tid);
Ingo Molnar1de87442006-01-24 15:22:50 -06001097 mutex_unlock(&ji->commit_mutex);
Dave Kleikamp4f4b4012005-09-01 09:02:43 -05001098
1099 return rc;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001100}
Dave Kleikamp1d15b10f2005-09-01 09:05:39 -05001101
1102#ifdef CONFIG_JFS_SECURITY
1103int jfs_init_security(tid_t tid, struct inode *inode, struct inode *dir)
1104{
1105 int rc;
1106 size_t len;
1107 void *value;
1108 char *suffix;
1109 char *name;
1110
1111 rc = security_inode_init_security(inode, dir, &suffix, &value, &len);
1112 if (rc) {
1113 if (rc == -EOPNOTSUPP)
1114 return 0;
1115 return rc;
1116 }
1117 name = kmalloc(XATTR_SECURITY_PREFIX_LEN + 1 + strlen(suffix),
1118 GFP_NOFS);
1119 if (!name) {
1120 rc = -ENOMEM;
1121 goto kmalloc_failed;
1122 }
1123 strcpy(name, XATTR_SECURITY_PREFIX);
1124 strcpy(name + XATTR_SECURITY_PREFIX_LEN, suffix);
1125
1126 rc = __jfs_setxattr(tid, inode, name, value, len, 0);
1127
1128 kfree(name);
1129kmalloc_failed:
1130 kfree(suffix);
1131 kfree(value);
1132
1133 return rc;
1134}
1135#endif