1/*
2 *   Copyright (C) International Business Machines  Corp., 2000-2004
3 *   Copyright (C) Christoph Hellwig, 2002
4 *
5 *   This program is free software;  you can redistribute it and/or modify
6 *   it under the terms of the GNU General Public License as published by
7 *   the Free Software Foundation; either version 2 of the License, or
8 *   (at your option) any later version.
9 *
10 *   This program is distributed in the hope that it will be useful,
11 *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
12 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
13 *   the GNU General Public License for more details.
14 *
15 *   You should have received a copy of the GNU General Public License
16 *   along with this program;  if not, write to the Free Software
17 *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
18 */
19
20#include <linux/capability.h>
21#include <linux/fs.h>
22#include <linux/xattr.h>
23#include <linux/posix_acl_xattr.h>
24#include <linux/slab.h>
25#include <linux/quotaops.h>
26#include <linux/security.h>
27#include "jfs_incore.h"
28#include "jfs_superblock.h"
29#include "jfs_dmap.h"
30#include "jfs_debug.h"
31#include "jfs_dinode.h"
32#include "jfs_extent.h"
33#include "jfs_metapage.h"
34#include "jfs_xattr.h"
35#include "jfs_acl.h"
36
37/*
38 *	jfs_xattr.c: extended attribute service
39 *
40 * Overall design --
41 *
42 * Format:
43 *
44 *   Extended attribute lists (jfs_ea_list) consist of an overall size (32 bit
45 *   value) and a variable (0 or more) number of extended attribute
46 *   entries.  Each extended attribute entry (jfs_ea) is a <name,value> double
47 *   where <name> is constructed from a null-terminated ascii string
48 *   (1 ... 255 bytes in the name) and <value> is arbitrary 8 bit data
49 *   (1 ... 65535 bytes).  The in-memory format is
50 *
51 *   0       1        2        4                4 + namelen + 1
52 *   +-------+--------+--------+----------------+-------------------+
53 *   | Flags | Name   | Value  | Name String \0 | Data . . . .      |
54 *   |       | Length | Length |                |                   |
55 *   +-------+--------+--------+----------------+-------------------+
56 *
57 *   A jfs_ea_list then is structured as
58 *
59 *   0            4                   4 + EA_SIZE(ea1)
60 *   +------------+-------------------+--------------------+-----
61 *   | Overall EA | First FEA Element | Second FEA Element | .....
62 *   | List Size  |                   |                    |
63 *   +------------+-------------------+--------------------+-----
64 *
65 *   On-disk:
66 *
67 *	FEALISTs are stored on disk using blocks allocated by dbAlloc() and
68 *	written directly. An EA list may be in-lined in the inode if there is
69 *	sufficient room available.
70 */
71
72struct ea_buffer {
73	int flag;		/* Indicates what storage xattr points to */
74	int max_size;		/* largest xattr that fits in current buffer */
75	dxd_t new_ea;		/* dxd to replace ea when modifying xattr */
76	struct metapage *mp;	/* metapage containing ea list */
77	struct jfs_ea_list *xattr;	/* buffer containing ea list */
78};
79
80/*
81 * ea_buffer.flag values
82 */
83#define EA_INLINE	0x0001
84#define EA_EXTENT	0x0002
85#define EA_NEW		0x0004
86#define EA_MALLOC	0x0008
87
88
89static int is_known_namespace(const char *name)
90{
91	if (strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN) &&
92	    strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN) &&
93	    strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
94	    strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN))
95		return false;
96
97	return true;
98}
99
100/*
101 * These three routines are used to recognize on-disk extended attributes
102 * that are in a recognized namespace.  If the attribute is not recognized,
103 * "os2." is prepended to the name
104 */
105static int is_os2_xattr(struct jfs_ea *ea)
106{
107	return !is_known_namespace(ea->name);
108}
109
110static inline int name_size(struct jfs_ea *ea)
111{
112	if (is_os2_xattr(ea))
113		return ea->namelen + XATTR_OS2_PREFIX_LEN;
114	else
115		return ea->namelen;
116}
117
118static inline int copy_name(char *buffer, struct jfs_ea *ea)
119{
120	int len = ea->namelen;
121
122	if (is_os2_xattr(ea)) {
123		memcpy(buffer, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN);
124		buffer += XATTR_OS2_PREFIX_LEN;
125		len += XATTR_OS2_PREFIX_LEN;
126	}
127	memcpy(buffer, ea->name, ea->namelen);
128	buffer[ea->namelen] = 0;
129
130	return len;
131}
132
133/* Forward references */
134static void ea_release(struct inode *inode, struct ea_buffer *ea_buf);
135
136/*
137 * NAME: ea_write_inline
138 *
139 * FUNCTION: Attempt to write an EA inline if area is available
140 *
141 * PRE CONDITIONS:
142 *	Already verified that the specified EA is small enough to fit inline
143 *
144 * PARAMETERS:
145 *	ip	- Inode pointer
146 *	ealist	- EA list pointer
147 *	size	- size of ealist in bytes
148 *	ea	- dxd_t structure to be filled in with necessary EA information
149 *		  if we successfully copy the EA inline
150 *
151 * NOTES:
152 *	Checks if the inode's inline area is available.  If so, copies EA inline
153 *	and sets <ea> fields appropriately.  Otherwise, returns failure, EA will
154 *	have to be put into an extent.
155 *
156 * RETURNS: 0 for successful copy to inline area; -1 if area not available
157 */
158static int ea_write_inline(struct inode *ip, struct jfs_ea_list *ealist,
159			   int size, dxd_t * ea)
160{
161	struct jfs_inode_info *ji = JFS_IP(ip);
162
163	/*
164	 * Make sure we have an EA -- the NULL EA list is valid, but you
165	 * can't copy it!
166	 */
167	if (ealist && size > sizeof (struct jfs_ea_list)) {
168		assert(size <= sizeof (ji->i_inline_ea));
169
170		/*
171		 * See if the space is available or if it is already being
172		 * used for an inline EA.
173		 */
174		if (!(ji->mode2 & INLINEEA) && !(ji->ea.flag & DXD_INLINE))
175			return -EPERM;
176
177		DXDsize(ea, size);
178		DXDlength(ea, 0);
179		DXDaddress(ea, 0);
180		memcpy(ji->i_inline_ea, ealist, size);
181		ea->flag = DXD_INLINE;
182		ji->mode2 &= ~INLINEEA;
183	} else {
184		ea->flag = 0;
185		DXDsize(ea, 0);
186		DXDlength(ea, 0);
187		DXDaddress(ea, 0);
188
189		/* Free up INLINE area */
190		if (ji->ea.flag & DXD_INLINE)
191			ji->mode2 |= INLINEEA;
192	}
193
194	return 0;
195}
196
197/*
198 * NAME: ea_write
199 *
200 * FUNCTION: Write an EA for an inode
201 *
202 * PRE CONDITIONS: EA has been verified
203 *
204 * PARAMETERS:
205 *	ip	- Inode pointer
206 *	ealist	- EA list pointer
207 *	size	- size of ealist in bytes
208 *	ea	- dxd_t structure to be filled in appropriately with where the
209 *		  EA was copied
210 *
211 * NOTES: Will write EA inline if able to, otherwise allocates blocks for an
212 *	extent and synchronously writes it to those blocks.
213 *
214 * RETURNS: 0 for success; Anything else indicates failure
215 */
216static int ea_write(struct inode *ip, struct jfs_ea_list *ealist, int size,
217		       dxd_t * ea)
218{
219	struct super_block *sb = ip->i_sb;
220	struct jfs_inode_info *ji = JFS_IP(ip);
221	struct jfs_sb_info *sbi = JFS_SBI(sb);
222	int nblocks;
223	s64 blkno;
224	int rc = 0, i;
225	char *cp;
226	s32 nbytes, nb;
227	s32 bytes_to_write;
228	struct metapage *mp;
229
230	/*
231	 * Quick check to see if this is an in-linable EA.  Short EAs
232	 * and empty EAs are all in-linable, provided the space exists.
233	 */
234	if (!ealist || size <= sizeof (ji->i_inline_ea)) {
235		if (!ea_write_inline(ip, ealist, size, ea))
236			return 0;
237	}
238
239	/* figure out how many blocks we need */
240	nblocks = (size + (sb->s_blocksize - 1)) >> sb->s_blocksize_bits;
241
242	/* Allocate new blocks to quota. */
243	rc = dquot_alloc_block(ip, nblocks);
244	if (rc)
245		return rc;
246
247	rc = dbAlloc(ip, INOHINT(ip), nblocks, &blkno);
248	if (rc) {
249		/*Rollback quota allocation. */
250		dquot_free_block(ip, nblocks);
251		return rc;
252	}
253
254	/*
255	 * Now have nblocks worth of storage to stuff into the FEALIST.
256	 * loop over the FEALIST copying data into the buffer one page at
257	 * a time.
258	 */
259	cp = (char *) ealist;
260	nbytes = size;
261	for (i = 0; i < nblocks; i += sbi->nbperpage) {
262		/*
263		 * Determine how many bytes for this request, and round up to
264		 * the nearest aggregate block size
265		 */
266		nb = min(PSIZE, nbytes);
267		bytes_to_write =
268		    ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
269		    << sb->s_blocksize_bits;
270
271		if (!(mp = get_metapage(ip, blkno + i, bytes_to_write, 1))) {
272			rc = -EIO;
273			goto failed;
274		}
275
276		memcpy(mp->data, cp, nb);
277
278		/*
279		 * We really need a way to propagate errors for
280		 * forced writes like this one.  --hch
281		 *
282		 * (__write_metapage => release_metapage => flush_metapage)
283		 */
284#ifdef _JFS_FIXME
285		if ((rc = flush_metapage(mp))) {
286			/*
287			 * the write failed -- this means that the buffer
288			 * is still assigned and the blocks are not being
289			 * used.  this seems like the best error recovery
290			 * we can get ...
291			 */
292			goto failed;
293		}
294#else
295		flush_metapage(mp);
296#endif
297
298		cp += PSIZE;
299		nbytes -= nb;
300	}
301
302	ea->flag = DXD_EXTENT;
303	DXDsize(ea, le32_to_cpu(ealist->size));
304	DXDlength(ea, nblocks);
305	DXDaddress(ea, blkno);
306
307	/* Free up INLINE area */
308	if (ji->ea.flag & DXD_INLINE)
309		ji->mode2 |= INLINEEA;
310
311	return 0;
312
313      failed:
314	/* Rollback quota allocation. */
315	dquot_free_block(ip, nblocks);
316
317	dbFree(ip, blkno, nblocks);
318	return rc;
319}
320
321/*
322 * NAME: ea_read_inline
323 *
324 * FUNCTION: Read an inlined EA into user's buffer
325 *
326 * PARAMETERS:
327 *	ip	- Inode pointer
328 *	ealist	- Pointer to buffer to fill in with EA
329 *
330 * RETURNS: 0
331 */
332static int ea_read_inline(struct inode *ip, struct jfs_ea_list *ealist)
333{
334	struct jfs_inode_info *ji = JFS_IP(ip);
335	int ea_size = sizeDXD(&ji->ea);
336
337	if (ea_size == 0) {
338		ealist->size = 0;
339		return 0;
340	}
341
342	/* Sanity Check */
343	if ((sizeDXD(&ji->ea) > sizeof (ji->i_inline_ea)))
344		return -EIO;
345	if (le32_to_cpu(((struct jfs_ea_list *) &ji->i_inline_ea)->size)
346	    != ea_size)
347		return -EIO;
348
349	memcpy(ealist, ji->i_inline_ea, ea_size);
350	return 0;
351}
352
353/*
354 * NAME: ea_read
355 *
356 * FUNCTION: copy EA data into user's buffer
357 *
358 * PARAMETERS:
359 *	ip	- Inode pointer
360 *	ealist	- Pointer to buffer to fill in with EA
361 *
362 * NOTES:  If EA is inline calls ea_read_inline() to copy EA.
363 *
364 * RETURNS: 0 for success; other indicates failure
365 */
366static int ea_read(struct inode *ip, struct jfs_ea_list *ealist)
367{
368	struct super_block *sb = ip->i_sb;
369	struct jfs_inode_info *ji = JFS_IP(ip);
370	struct jfs_sb_info *sbi = JFS_SBI(sb);
371	int nblocks;
372	s64 blkno;
373	char *cp = (char *) ealist;
374	int i;
375	int nbytes, nb;
376	s32 bytes_to_read;
377	struct metapage *mp;
378
379	/* quick check for in-line EA */
380	if (ji->ea.flag & DXD_INLINE)
381		return ea_read_inline(ip, ealist);
382
383	nbytes = sizeDXD(&ji->ea);
384	if (!nbytes) {
385		jfs_error(sb, "nbytes is 0\n");
386		return -EIO;
387	}
388
389	/*
390	 * Figure out how many blocks were allocated when this EA list was
391	 * originally written to disk.
392	 */
393	nblocks = lengthDXD(&ji->ea) << sbi->l2nbperpage;
394	blkno = addressDXD(&ji->ea) << sbi->l2nbperpage;
395
396	/*
397	 * I have found the disk blocks which were originally used to store
398	 * the FEALIST.  now i loop over each contiguous block copying the
399	 * data into the buffer.
400	 */
401	for (i = 0; i < nblocks; i += sbi->nbperpage) {
402		/*
403		 * Determine how many bytes for this request, and round up to
404		 * the nearest aggregate block size
405		 */
406		nb = min(PSIZE, nbytes);
407		bytes_to_read =
408		    ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
409		    << sb->s_blocksize_bits;
410
411		if (!(mp = read_metapage(ip, blkno + i, bytes_to_read, 1)))
412			return -EIO;
413
414		memcpy(cp, mp->data, nb);
415		release_metapage(mp);
416
417		cp += PSIZE;
418		nbytes -= nb;
419	}
420
421	return 0;
422}
423
424/*
425 * NAME: ea_get
426 *
427 * FUNCTION: Returns buffer containing existing extended attributes.
428 *	     The size of the buffer will be the larger of the existing
429 *	     attributes size, or min_size.
430 *
431 *	     The buffer, which may be inlined in the inode or in the
432 *	     page cache must be release by calling ea_release or ea_put
433 *
434 * PARAMETERS:
435 *	inode	- Inode pointer
436 *	ea_buf	- Structure to be populated with ealist and its metadata
437 *	min_size- minimum size of buffer to be returned
438 *
439 * RETURNS: 0 for success; Other indicates failure
440 */
441static int ea_get(struct inode *inode, struct ea_buffer *ea_buf, int min_size)
442{
443	struct jfs_inode_info *ji = JFS_IP(inode);
444	struct super_block *sb = inode->i_sb;
445	int size;
446	int ea_size = sizeDXD(&ji->ea);
447	int blocks_needed, current_blocks;
448	s64 blkno;
449	int rc;
450	int quota_allocation = 0;
451
452	/* When fsck.jfs clears a bad ea, it doesn't clear the size */
453	if (ji->ea.flag == 0)
454		ea_size = 0;
455
456	if (ea_size == 0) {
457		if (min_size == 0) {
458			ea_buf->flag = 0;
459			ea_buf->max_size = 0;
460			ea_buf->xattr = NULL;
461			return 0;
462		}
463		if ((min_size <= sizeof (ji->i_inline_ea)) &&
464		    (ji->mode2 & INLINEEA)) {
465			ea_buf->flag = EA_INLINE | EA_NEW;
466			ea_buf->max_size = sizeof (ji->i_inline_ea);
467			ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
468			DXDlength(&ea_buf->new_ea, 0);
469			DXDaddress(&ea_buf->new_ea, 0);
470			ea_buf->new_ea.flag = DXD_INLINE;
471			DXDsize(&ea_buf->new_ea, min_size);
472			return 0;
473		}
474		current_blocks = 0;
475	} else if (ji->ea.flag & DXD_INLINE) {
476		if (min_size <= sizeof (ji->i_inline_ea)) {
477			ea_buf->flag = EA_INLINE;
478			ea_buf->max_size = sizeof (ji->i_inline_ea);
479			ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
480			goto size_check;
481		}
482		current_blocks = 0;
483	} else {
484		if (!(ji->ea.flag & DXD_EXTENT)) {
485			jfs_error(sb, "invalid ea.flag\n");
486			return -EIO;
487		}
488		current_blocks = (ea_size + sb->s_blocksize - 1) >>
489		    sb->s_blocksize_bits;
490	}
491	size = max(min_size, ea_size);
492
493	if (size > PSIZE) {
494		/*
495		 * To keep the rest of the code simple.  Allocate a
496		 * contiguous buffer to work with
497		 */
498		ea_buf->xattr = kmalloc(size, GFP_KERNEL);
499		if (ea_buf->xattr == NULL)
500			return -ENOMEM;
501
502		ea_buf->flag = EA_MALLOC;
503		ea_buf->max_size = (size + sb->s_blocksize - 1) &
504		    ~(sb->s_blocksize - 1);
505
506		if (ea_size == 0)
507			return 0;
508
509		if ((rc = ea_read(inode, ea_buf->xattr))) {
510			kfree(ea_buf->xattr);
511			ea_buf->xattr = NULL;
512			return rc;
513		}
514		goto size_check;
515	}
516	blocks_needed = (min_size + sb->s_blocksize - 1) >>
517	    sb->s_blocksize_bits;
518
519	if (blocks_needed > current_blocks) {
520		/* Allocate new blocks to quota. */
521		rc = dquot_alloc_block(inode, blocks_needed);
522		if (rc)
523			return -EDQUOT;
524
525		quota_allocation = blocks_needed;
526
527		rc = dbAlloc(inode, INOHINT(inode), (s64) blocks_needed,
528			     &blkno);
529		if (rc)
530			goto clean_up;
531
532		DXDlength(&ea_buf->new_ea, blocks_needed);
533		DXDaddress(&ea_buf->new_ea, blkno);
534		ea_buf->new_ea.flag = DXD_EXTENT;
535		DXDsize(&ea_buf->new_ea, min_size);
536
537		ea_buf->flag = EA_EXTENT | EA_NEW;
538
539		ea_buf->mp = get_metapage(inode, blkno,
540					  blocks_needed << sb->s_blocksize_bits,
541					  1);
542		if (ea_buf->mp == NULL) {
543			dbFree(inode, blkno, (s64) blocks_needed);
544			rc = -EIO;
545			goto clean_up;
546		}
547		ea_buf->xattr = ea_buf->mp->data;
548		ea_buf->max_size = (min_size + sb->s_blocksize - 1) &
549		    ~(sb->s_blocksize - 1);
550		if (ea_size == 0)
551			return 0;
552		if ((rc = ea_read(inode, ea_buf->xattr))) {
553			discard_metapage(ea_buf->mp);
554			dbFree(inode, blkno, (s64) blocks_needed);
555			goto clean_up;
556		}
557		goto size_check;
558	}
559	ea_buf->flag = EA_EXTENT;
560	ea_buf->mp = read_metapage(inode, addressDXD(&ji->ea),
561				   lengthDXD(&ji->ea) << sb->s_blocksize_bits,
562				   1);
563	if (ea_buf->mp == NULL) {
564		rc = -EIO;
565		goto clean_up;
566	}
567	ea_buf->xattr = ea_buf->mp->data;
568	ea_buf->max_size = (ea_size + sb->s_blocksize - 1) &
569	    ~(sb->s_blocksize - 1);
570
571      size_check:
572	if (EALIST_SIZE(ea_buf->xattr) != ea_size) {
573		printk(KERN_ERR "ea_get: invalid extended attribute\n");
574		print_hex_dump(KERN_ERR, "", DUMP_PREFIX_ADDRESS, 16, 1,
575				     ea_buf->xattr, ea_size, 1);
576		ea_release(inode, ea_buf);
577		rc = -EIO;
578		goto clean_up;
579	}
580
581	return ea_size;
582
583      clean_up:
584	/* Rollback quota allocation */
585	if (quota_allocation)
586		dquot_free_block(inode, quota_allocation);
587
588	return (rc);
589}
590
591static void ea_release(struct inode *inode, struct ea_buffer *ea_buf)
592{
593	if (ea_buf->flag & EA_MALLOC)
594		kfree(ea_buf->xattr);
595	else if (ea_buf->flag & EA_EXTENT) {
596		assert(ea_buf->mp);
597		release_metapage(ea_buf->mp);
598
599		if (ea_buf->flag & EA_NEW)
600			dbFree(inode, addressDXD(&ea_buf->new_ea),
601			       lengthDXD(&ea_buf->new_ea));
602	}
603}
604
605static int ea_put(tid_t tid, struct inode *inode, struct ea_buffer *ea_buf,
606		  int new_size)
607{
608	struct jfs_inode_info *ji = JFS_IP(inode);
609	unsigned long old_blocks, new_blocks;
610	int rc = 0;
611
612	if (new_size == 0) {
613		ea_release(inode, ea_buf);
614		ea_buf = NULL;
615	} else if (ea_buf->flag & EA_INLINE) {
616		assert(new_size <= sizeof (ji->i_inline_ea));
617		ji->mode2 &= ~INLINEEA;
618		ea_buf->new_ea.flag = DXD_INLINE;
619		DXDsize(&ea_buf->new_ea, new_size);
620		DXDaddress(&ea_buf->new_ea, 0);
621		DXDlength(&ea_buf->new_ea, 0);
622	} else if (ea_buf->flag & EA_MALLOC) {
623		rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
624		kfree(ea_buf->xattr);
625	} else if (ea_buf->flag & EA_NEW) {
626		/* We have already allocated a new dxd */
627		flush_metapage(ea_buf->mp);
628	} else {
629		/* ->xattr must point to original ea's metapage */
630		rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
631		discard_metapage(ea_buf->mp);
632	}
633	if (rc)
634		return rc;
635
636	old_blocks = new_blocks = 0;
637
638	if (ji->ea.flag & DXD_EXTENT) {
639		invalidate_dxd_metapages(inode, ji->ea);
640		old_blocks = lengthDXD(&ji->ea);
641	}
642
643	if (ea_buf) {
644		txEA(tid, inode, &ji->ea, &ea_buf->new_ea);
645		if (ea_buf->new_ea.flag & DXD_EXTENT) {
646			new_blocks = lengthDXD(&ea_buf->new_ea);
647			if (ji->ea.flag & DXD_INLINE)
648				ji->mode2 |= INLINEEA;
649		}
650		ji->ea = ea_buf->new_ea;
651	} else {
652		txEA(tid, inode, &ji->ea, NULL);
653		if (ji->ea.flag & DXD_INLINE)
654			ji->mode2 |= INLINEEA;
655		ji->ea.flag = 0;
656		ji->ea.size = 0;
657	}
658
659	/* If old blocks exist, they must be removed from quota allocation. */
660	if (old_blocks)
661		dquot_free_block(inode, old_blocks);
662
663	inode->i_ctime = CURRENT_TIME;
664
665	return 0;
666}
667
668/*
669 * Most of the permission checking is done by xattr_permission in the vfs.
670 * We also need to verify that this is a namespace that we recognize.
671 */
672static int can_set_xattr(struct inode *inode, const char *name,
673			 const void *value, size_t value_len)
674{
675	if (!strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN)) {
676		/*
677		 * This makes sure that we aren't trying to set an
678		 * attribute in a different namespace by prefixing it
679		 * with "os2."
680		 */
681		if (is_known_namespace(name + XATTR_OS2_PREFIX_LEN))
682			return -EOPNOTSUPP;
683		return 0;
684	}
685
686	/*
687	 * Don't allow setting an attribute in an unknown namespace.
688	 */
689	if (strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) &&
690	    strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
691	    strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN))
692		return -EOPNOTSUPP;
693
694	return 0;
695}
696
697int __jfs_setxattr(tid_t tid, struct inode *inode, const char *name,
698		   const void *value, size_t value_len, int flags)
699{
700	struct jfs_ea_list *ealist;
701	struct jfs_ea *ea, *old_ea = NULL, *next_ea = NULL;
702	struct ea_buffer ea_buf;
703	int old_ea_size = 0;
704	int xattr_size;
705	int new_size;
706	int namelen = strlen(name);
707	char *os2name = NULL;
708	int found = 0;
709	int rc;
710	int length;
711
712	if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
713		os2name = kmalloc(namelen - XATTR_OS2_PREFIX_LEN + 1,
714				  GFP_KERNEL);
715		if (!os2name)
716			return -ENOMEM;
717		strcpy(os2name, name + XATTR_OS2_PREFIX_LEN);
718		name = os2name;
719		namelen -= XATTR_OS2_PREFIX_LEN;
720	}
721
722	down_write(&JFS_IP(inode)->xattr_sem);
723
724	xattr_size = ea_get(inode, &ea_buf, 0);
725	if (xattr_size < 0) {
726		rc = xattr_size;
727		goto out;
728	}
729
730      again:
731	ealist = (struct jfs_ea_list *) ea_buf.xattr;
732	new_size = sizeof (struct jfs_ea_list);
733
734	if (xattr_size) {
735		for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist);
736		     ea = NEXT_EA(ea)) {
737			if ((namelen == ea->namelen) &&
738			    (memcmp(name, ea->name, namelen) == 0)) {
739				found = 1;
740				if (flags & XATTR_CREATE) {
741					rc = -EEXIST;
742					goto release;
743				}
744				old_ea = ea;
745				old_ea_size = EA_SIZE(ea);
746				next_ea = NEXT_EA(ea);
747			} else
748				new_size += EA_SIZE(ea);
749		}
750	}
751
752	if (!found) {
753		if (flags & XATTR_REPLACE) {
754			rc = -ENODATA;
755			goto release;
756		}
757		if (value == NULL) {
758			rc = 0;
759			goto release;
760		}
761	}
762	if (value)
763		new_size += sizeof (struct jfs_ea) + namelen + 1 + value_len;
764
765	if (new_size > ea_buf.max_size) {
766		/*
767		 * We need to allocate more space for merged ea list.
768		 * We should only have loop to again: once.
769		 */
770		ea_release(inode, &ea_buf);
771		xattr_size = ea_get(inode, &ea_buf, new_size);
772		if (xattr_size < 0) {
773			rc = xattr_size;
774			goto out;
775		}
776		goto again;
777	}
778
779	/* Remove old ea of the same name */
780	if (found) {
781		/* number of bytes following target EA */
782		length = (char *) END_EALIST(ealist) - (char *) next_ea;
783		if (length > 0)
784			memmove(old_ea, next_ea, length);
785		xattr_size -= old_ea_size;
786	}
787
788	/* Add new entry to the end */
789	if (value) {
790		if (xattr_size == 0)
791			/* Completely new ea list */
792			xattr_size = sizeof (struct jfs_ea_list);
793
794		/*
795		 * The size of EA value is limitted by on-disk format up to
796		 *  __le16, there would be an overflow if the size is equal
797		 * to XATTR_SIZE_MAX (65536).  In order to avoid this issue,
798		 * we can pre-checkup the value size against USHRT_MAX, and
799		 * return -E2BIG in this case, which is consistent with the
800		 * VFS setxattr interface.
801		 */
802		if (value_len >= USHRT_MAX) {
803			rc = -E2BIG;
804			goto release;
805		}
806
807		ea = (struct jfs_ea *) ((char *) ealist + xattr_size);
808		ea->flag = 0;
809		ea->namelen = namelen;
810		ea->valuelen = (cpu_to_le16(value_len));
811		memcpy(ea->name, name, namelen);
812		ea->name[namelen] = 0;
813		if (value_len)
814			memcpy(&ea->name[namelen + 1], value, value_len);
815		xattr_size += EA_SIZE(ea);
816	}
817
818	/* DEBUG - If we did this right, these number match */
819	if (xattr_size != new_size) {
820		printk(KERN_ERR
821		       "__jfs_setxattr: xattr_size = %d, new_size = %d\n",
822		       xattr_size, new_size);
823
824		rc = -EINVAL;
825		goto release;
826	}
827
828	/*
829	 * If we're left with an empty list, there's no ea
830	 */
831	if (new_size == sizeof (struct jfs_ea_list))
832		new_size = 0;
833
834	ealist->size = cpu_to_le32(new_size);
835
836	rc = ea_put(tid, inode, &ea_buf, new_size);
837
838	goto out;
839      release:
840	ea_release(inode, &ea_buf);
841      out:
842	up_write(&JFS_IP(inode)->xattr_sem);
843
844	kfree(os2name);
845
846	return rc;
847}
848
849int jfs_setxattr(struct dentry *dentry, const char *name, const void *value,
850		 size_t value_len, int flags)
851{
852	struct inode *inode = d_inode(dentry);
853	struct jfs_inode_info *ji = JFS_IP(inode);
854	int rc;
855	tid_t tid;
856
857	/*
858	 * If this is a request for a synthetic attribute in the system.*
859	 * namespace use the generic infrastructure to resolve a handler
860	 * for it via sb->s_xattr.
861	 */
862	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
863		return generic_setxattr(dentry, name, value, value_len, flags);
864
865	if ((rc = can_set_xattr(inode, name, value, value_len)))
866		return rc;
867
868	if (value == NULL) {	/* empty EA, do not remove */
869		value = "";
870		value_len = 0;
871	}
872
873	tid = txBegin(inode->i_sb, 0);
874	mutex_lock(&ji->commit_mutex);
875	rc = __jfs_setxattr(tid, d_inode(dentry), name, value, value_len,
876			    flags);
877	if (!rc)
878		rc = txCommit(tid, 1, &inode, 0);
879	txEnd(tid);
880	mutex_unlock(&ji->commit_mutex);
881
882	return rc;
883}
884
885ssize_t __jfs_getxattr(struct inode *inode, const char *name, void *data,
886		       size_t buf_size)
887{
888	struct jfs_ea_list *ealist;
889	struct jfs_ea *ea;
890	struct ea_buffer ea_buf;
891	int xattr_size;
892	ssize_t size;
893	int namelen = strlen(name);
894	char *value;
895
896	down_read(&JFS_IP(inode)->xattr_sem);
897
898	xattr_size = ea_get(inode, &ea_buf, 0);
899
900	if (xattr_size < 0) {
901		size = xattr_size;
902		goto out;
903	}
904
905	if (xattr_size == 0)
906		goto not_found;
907
908	ealist = (struct jfs_ea_list *) ea_buf.xattr;
909
910	/* Find the named attribute */
911	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea))
912		if ((namelen == ea->namelen) &&
913		    memcmp(name, ea->name, namelen) == 0) {
914			/* Found it */
915			size = le16_to_cpu(ea->valuelen);
916			if (!data)
917				goto release;
918			else if (size > buf_size) {
919				size = -ERANGE;
920				goto release;
921			}
922			value = ((char *) &ea->name) + ea->namelen + 1;
923			memcpy(data, value, size);
924			goto release;
925		}
926      not_found:
927	size = -ENODATA;
928      release:
929	ea_release(inode, &ea_buf);
930      out:
931	up_read(&JFS_IP(inode)->xattr_sem);
932
933	return size;
934}
935
936ssize_t jfs_getxattr(struct dentry *dentry, const char *name, void *data,
937		     size_t buf_size)
938{
939	int err;
940
941	/*
942	 * If this is a request for a synthetic attribute in the system.*
943	 * namespace use the generic infrastructure to resolve a handler
944	 * for it via sb->s_xattr.
945	 */
946	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
947		return generic_getxattr(dentry, name, data, buf_size);
948
949	if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
950		/*
951		 * skip past "os2." prefix
952		 */
953		name += XATTR_OS2_PREFIX_LEN;
954		/*
955		 * Don't allow retrieving properly prefixed attributes
956		 * by prepending them with "os2."
957		 */
958		if (is_known_namespace(name))
959			return -EOPNOTSUPP;
960	}
961
962	err = __jfs_getxattr(d_inode(dentry), name, data, buf_size);
963
964	return err;
965}
966
967/*
968 * No special permissions are needed to list attributes except for trusted.*
969 */
970static inline int can_list(struct jfs_ea *ea)
971{
972	return (strncmp(ea->name, XATTR_TRUSTED_PREFIX,
973			    XATTR_TRUSTED_PREFIX_LEN) ||
974		capable(CAP_SYS_ADMIN));
975}
976
977ssize_t jfs_listxattr(struct dentry * dentry, char *data, size_t buf_size)
978{
979	struct inode *inode = d_inode(dentry);
980	char *buffer;
981	ssize_t size = 0;
982	int xattr_size;
983	struct jfs_ea_list *ealist;
984	struct jfs_ea *ea;
985	struct ea_buffer ea_buf;
986
987	down_read(&JFS_IP(inode)->xattr_sem);
988
989	xattr_size = ea_get(inode, &ea_buf, 0);
990	if (xattr_size < 0) {
991		size = xattr_size;
992		goto out;
993	}
994
995	if (xattr_size == 0)
996		goto release;
997
998	ealist = (struct jfs_ea_list *) ea_buf.xattr;
999
1000	/* compute required size of list */
1001	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
1002		if (can_list(ea))
1003			size += name_size(ea) + 1;
1004	}
1005
1006	if (!data)
1007		goto release;
1008
1009	if (size > buf_size) {
1010		size = -ERANGE;
1011		goto release;
1012	}
1013
1014	/* Copy attribute names to buffer */
1015	buffer = data;
1016	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
1017		if (can_list(ea)) {
1018			int namelen = copy_name(buffer, ea);
1019			buffer += namelen + 1;
1020		}
1021	}
1022
1023      release:
1024	ea_release(inode, &ea_buf);
1025      out:
1026	up_read(&JFS_IP(inode)->xattr_sem);
1027	return size;
1028}
1029
1030int jfs_removexattr(struct dentry *dentry, const char *name)
1031{
1032	struct inode *inode = d_inode(dentry);
1033	struct jfs_inode_info *ji = JFS_IP(inode);
1034	int rc;
1035	tid_t tid;
1036
1037	/*
1038	 * If this is a request for a synthetic attribute in the system.*
1039	 * namespace use the generic infrastructure to resolve a handler
1040	 * for it via sb->s_xattr.
1041	 */
1042	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
1043		return generic_removexattr(dentry, name);
1044
1045	if ((rc = can_set_xattr(inode, name, NULL, 0)))
1046		return rc;
1047
1048	tid = txBegin(inode->i_sb, 0);
1049	mutex_lock(&ji->commit_mutex);
1050	rc = __jfs_setxattr(tid, d_inode(dentry), name, NULL, 0, XATTR_REPLACE);
1051	if (!rc)
1052		rc = txCommit(tid, 1, &inode, 0);
1053	txEnd(tid);
1054	mutex_unlock(&ji->commit_mutex);
1055
1056	return rc;
1057}
1058
1059/*
1060 * List of handlers for synthetic system.* attributes.  All real ondisk
1061 * attributes are handled directly.
1062 */
1063const struct xattr_handler *jfs_xattr_handlers[] = {
1064#ifdef CONFIG_JFS_POSIX_ACL
1065	&posix_acl_access_xattr_handler,
1066	&posix_acl_default_xattr_handler,
1067#endif
1068	NULL,
1069};
1070
1071
1072#ifdef CONFIG_JFS_SECURITY
1073static int jfs_initxattrs(struct inode *inode, const struct xattr *xattr_array,
1074			  void *fs_info)
1075{
1076	const struct xattr *xattr;
1077	tid_t *tid = fs_info;
1078	char *name;
1079	int err = 0;
1080
1081	for (xattr = xattr_array; xattr->name != NULL; xattr++) {
1082		name = kmalloc(XATTR_SECURITY_PREFIX_LEN +
1083			       strlen(xattr->name) + 1, GFP_NOFS);
1084		if (!name) {
1085			err = -ENOMEM;
1086			break;
1087		}
1088		strcpy(name, XATTR_SECURITY_PREFIX);
1089		strcpy(name + XATTR_SECURITY_PREFIX_LEN, xattr->name);
1090
1091		err = __jfs_setxattr(*tid, inode, name,
1092				     xattr->value, xattr->value_len, 0);
1093		kfree(name);
1094		if (err < 0)
1095			break;
1096	}
1097	return err;
1098}
1099
1100int jfs_init_security(tid_t tid, struct inode *inode, struct inode *dir,
1101		      const struct qstr *qstr)
1102{
1103	return security_inode_init_security(inode, dir, qstr,
1104					    &jfs_initxattrs, &tid);
1105}
1106#endif
1107