Linux Audio

Check our new training course

Loading...
v3.15
   1/*
   2 *   Copyright (C) International Business Machines  Corp., 2000-2004
   3 *   Copyright (C) Christoph Hellwig, 2002
   4 *
   5 *   This program is free software;  you can redistribute it and/or modify
   6 *   it under the terms of the GNU General Public License as published by
   7 *   the Free Software Foundation; either version 2 of the License, or
   8 *   (at your option) any later version.
   9 *
  10 *   This program is distributed in the hope that it will be useful,
  11 *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
  12 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
  13 *   the GNU General Public License for more details.
  14 *
  15 *   You should have received a copy of the GNU General Public License
  16 *   along with this program;  if not, write to the Free Software
  17 *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  18 */
  19
  20#include <linux/capability.h>
  21#include <linux/fs.h>
  22#include <linux/xattr.h>
  23#include <linux/posix_acl_xattr.h>
  24#include <linux/slab.h>
  25#include <linux/quotaops.h>
  26#include <linux/security.h>
  27#include "jfs_incore.h"
  28#include "jfs_superblock.h"
  29#include "jfs_dmap.h"
  30#include "jfs_debug.h"
  31#include "jfs_dinode.h"
  32#include "jfs_extent.h"
  33#include "jfs_metapage.h"
  34#include "jfs_xattr.h"
  35#include "jfs_acl.h"
  36
  37/*
  38 *	jfs_xattr.c: extended attribute service
  39 *
  40 * Overall design --
  41 *
  42 * Format:
  43 *
  44 *   Extended attribute lists (jfs_ea_list) consist of an overall size (32 bit
  45 *   value) and a variable (0 or more) number of extended attribute
  46 *   entries.  Each extended attribute entry (jfs_ea) is a <name,value> double
  47 *   where <name> is constructed from a null-terminated ascii string
  48 *   (1 ... 255 bytes in the name) and <value> is arbitrary 8 bit data
  49 *   (1 ... 65535 bytes).  The in-memory format is
  50 *
  51 *   0       1        2        4                4 + namelen + 1
  52 *   +-------+--------+--------+----------------+-------------------+
  53 *   | Flags | Name   | Value  | Name String \0 | Data . . . .      |
  54 *   |       | Length | Length |                |                   |
  55 *   +-------+--------+--------+----------------+-------------------+
  56 *
  57 *   A jfs_ea_list then is structured as
  58 *
  59 *   0            4                   4 + EA_SIZE(ea1)
  60 *   +------------+-------------------+--------------------+-----
  61 *   | Overall EA | First FEA Element | Second FEA Element | .....
  62 *   | List Size  |                   |                    |
  63 *   +------------+-------------------+--------------------+-----
  64 *
  65 *   On-disk:
  66 *
  67 *	FEALISTs are stored on disk using blocks allocated by dbAlloc() and
  68 *	written directly. An EA list may be in-lined in the inode if there is
  69 *	sufficient room available.
  70 */
  71
/*
 * Working handle on an inode's extended attribute list.  It is filled in
 * by ea_get() and must afterwards be handed to ea_put() or ea_release().
 */
struct ea_buffer {
	int flag;		/* EA_* bits: indicates what storage xattr points to */
	int max_size;		/* largest xattr that fits in current buffer */
	dxd_t new_ea;		/* dxd to replace ea when modifying xattr */
	struct metapage *mp;	/* metapage containing ea list (EA_EXTENT case) */
	struct jfs_ea_list *xattr;	/* buffer containing ea list */
};
  79
/*
 * ea_buffer.flag values
 *
 * EA_INLINE and EA_EXTENT may each be combined with EA_NEW by ea_get().
 */
#define EA_INLINE	0x0001	/* xattr points at the inode's i_inline_ea */
#define EA_EXTENT	0x0002	/* xattr points at the data of metapage mp */
#define EA_NEW		0x0004	/* new_ea was prepared by ea_get() */
#define EA_MALLOC	0x0008	/* xattr is a kmalloc'ed buffer */
  87
  88
  89static int is_known_namespace(const char *name)
  90{
  91	if (strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN) &&
  92	    strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN) &&
  93	    strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
  94	    strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN))
  95		return false;
  96
  97	return true;
  98}
  99
 100/*
 101 * These three routines are used to recognize on-disk extended attributes
 102 * that are in a recognized namespace.  If the attribute is not recognized,
 103 * "os2." is prepended to the name
 104 */
 105static int is_os2_xattr(struct jfs_ea *ea)
 106{
 107	return !is_known_namespace(ea->name);
 108}
 109
 110static inline int name_size(struct jfs_ea *ea)
 111{
 112	if (is_os2_xattr(ea))
 113		return ea->namelen + XATTR_OS2_PREFIX_LEN;
 114	else
 115		return ea->namelen;
 116}
 117
 118static inline int copy_name(char *buffer, struct jfs_ea *ea)
 119{
 120	int len = ea->namelen;
 121
 122	if (is_os2_xattr(ea)) {
 123		memcpy(buffer, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN);
 124		buffer += XATTR_OS2_PREFIX_LEN;
 125		len += XATTR_OS2_PREFIX_LEN;
 126	}
 127	memcpy(buffer, ea->name, ea->namelen);
 128	buffer[ea->namelen] = 0;
 129
 130	return len;
 131}
 132
 133/* Forward references */
 134static void ea_release(struct inode *inode, struct ea_buffer *ea_buf);
 135
 136/*
 137 * NAME: ea_write_inline
 138 *
 139 * FUNCTION: Attempt to write an EA inline if area is available
 140 *
 141 * PRE CONDITIONS:
 142 *	Already verified that the specified EA is small enough to fit inline
 143 *
 144 * PARAMETERS:
 145 *	ip	- Inode pointer
 146 *	ealist	- EA list pointer
 147 *	size	- size of ealist in bytes
 148 *	ea	- dxd_t structure to be filled in with necessary EA information
 149 *		  if we successfully copy the EA inline
 150 *
 151 * NOTES:
 152 *	Checks if the inode's inline area is available.  If so, copies EA inline
 153 *	and sets <ea> fields appropriately.  Otherwise, returns failure, EA will
 154 *	have to be put into an extent.
 155 *
 156 * RETURNS: 0 for successful copy to inline area; -1 if area not available
 157 */
 158static int ea_write_inline(struct inode *ip, struct jfs_ea_list *ealist,
 159			   int size, dxd_t * ea)
 160{
 161	struct jfs_inode_info *ji = JFS_IP(ip);
 162
 163	/*
 164	 * Make sure we have an EA -- the NULL EA list is valid, but you
 165	 * can't copy it!
 166	 */
 167	if (ealist && size > sizeof (struct jfs_ea_list)) {
 168		assert(size <= sizeof (ji->i_inline_ea));
 169
 170		/*
 171		 * See if the space is available or if it is already being
 172		 * used for an inline EA.
 173		 */
 174		if (!(ji->mode2 & INLINEEA) && !(ji->ea.flag & DXD_INLINE))
 175			return -EPERM;
 176
 177		DXDsize(ea, size);
 178		DXDlength(ea, 0);
 179		DXDaddress(ea, 0);
 180		memcpy(ji->i_inline_ea, ealist, size);
 181		ea->flag = DXD_INLINE;
 182		ji->mode2 &= ~INLINEEA;
 183	} else {
 184		ea->flag = 0;
 185		DXDsize(ea, 0);
 186		DXDlength(ea, 0);
 187		DXDaddress(ea, 0);
 188
 189		/* Free up INLINE area */
 190		if (ji->ea.flag & DXD_INLINE)
 191			ji->mode2 |= INLINEEA;
 192	}
 193
 194	return 0;
 195}
 196
 197/*
 198 * NAME: ea_write
 199 *
 200 * FUNCTION: Write an EA for an inode
 201 *
 202 * PRE CONDITIONS: EA has been verified
 203 *
 204 * PARAMETERS:
 205 *	ip	- Inode pointer
 206 *	ealist	- EA list pointer
 207 *	size	- size of ealist in bytes
 208 *	ea	- dxd_t structure to be filled in appropriately with where the
 209 *		  EA was copied
 210 *
 211 * NOTES: Will write EA inline if able to, otherwise allocates blocks for an
 212 *	extent and synchronously writes it to those blocks.
 213 *
 214 * RETURNS: 0 for success; Anything else indicates failure
 215 */
 216static int ea_write(struct inode *ip, struct jfs_ea_list *ealist, int size,
 217		       dxd_t * ea)
 218{
 219	struct super_block *sb = ip->i_sb;
 220	struct jfs_inode_info *ji = JFS_IP(ip);
 221	struct jfs_sb_info *sbi = JFS_SBI(sb);
 222	int nblocks;
 223	s64 blkno;
 224	int rc = 0, i;
 225	char *cp;
 226	s32 nbytes, nb;
 227	s32 bytes_to_write;
 228	struct metapage *mp;
 229
 230	/*
 231	 * Quick check to see if this is an in-linable EA.  Short EAs
 232	 * and empty EAs are all in-linable, provided the space exists.
 233	 */
 234	if (!ealist || size <= sizeof (ji->i_inline_ea)) {
 235		if (!ea_write_inline(ip, ealist, size, ea))
 236			return 0;
 237	}
 238
 239	/* figure out how many blocks we need */
 240	nblocks = (size + (sb->s_blocksize - 1)) >> sb->s_blocksize_bits;
 241
 242	/* Allocate new blocks to quota. */
 243	rc = dquot_alloc_block(ip, nblocks);
 244	if (rc)
 245		return rc;
 246
 247	rc = dbAlloc(ip, INOHINT(ip), nblocks, &blkno);
 248	if (rc) {
 249		/*Rollback quota allocation. */
 250		dquot_free_block(ip, nblocks);
 251		return rc;
 252	}
 253
 254	/*
 255	 * Now have nblocks worth of storage to stuff into the FEALIST.
 256	 * loop over the FEALIST copying data into the buffer one page at
 257	 * a time.
 258	 */
 259	cp = (char *) ealist;
 260	nbytes = size;
 261	for (i = 0; i < nblocks; i += sbi->nbperpage) {
 262		/*
 263		 * Determine how many bytes for this request, and round up to
 264		 * the nearest aggregate block size
 265		 */
 266		nb = min(PSIZE, nbytes);
 267		bytes_to_write =
 268		    ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
 269		    << sb->s_blocksize_bits;
 270
 271		if (!(mp = get_metapage(ip, blkno + i, bytes_to_write, 1))) {
 272			rc = -EIO;
 273			goto failed;
 274		}
 275
 276		memcpy(mp->data, cp, nb);
 277
 278		/*
 279		 * We really need a way to propagate errors for
 280		 * forced writes like this one.  --hch
 281		 *
 282		 * (__write_metapage => release_metapage => flush_metapage)
 283		 */
 284#ifdef _JFS_FIXME
 285		if ((rc = flush_metapage(mp))) {
 286			/*
 287			 * the write failed -- this means that the buffer
 288			 * is still assigned and the blocks are not being
 289			 * used.  this seems like the best error recovery
 290			 * we can get ...
 291			 */
 292			goto failed;
 293		}
 294#else
 295		flush_metapage(mp);
 296#endif
 297
 298		cp += PSIZE;
 299		nbytes -= nb;
 300	}
 301
 302	ea->flag = DXD_EXTENT;
 303	DXDsize(ea, le32_to_cpu(ealist->size));
 304	DXDlength(ea, nblocks);
 305	DXDaddress(ea, blkno);
 306
 307	/* Free up INLINE area */
 308	if (ji->ea.flag & DXD_INLINE)
 309		ji->mode2 |= INLINEEA;
 310
 311	return 0;
 312
 313      failed:
 314	/* Rollback quota allocation. */
 315	dquot_free_block(ip, nblocks);
 316
 317	dbFree(ip, blkno, nblocks);
 318	return rc;
 319}
 320
 321/*
 322 * NAME: ea_read_inline
 323 *
 324 * FUNCTION: Read an inlined EA into user's buffer
 325 *
 326 * PARAMETERS:
 327 *	ip	- Inode pointer
 328 *	ealist	- Pointer to buffer to fill in with EA
 329 *
 330 * RETURNS: 0
 331 */
 332static int ea_read_inline(struct inode *ip, struct jfs_ea_list *ealist)
 333{
 334	struct jfs_inode_info *ji = JFS_IP(ip);
 335	int ea_size = sizeDXD(&ji->ea);
 336
 337	if (ea_size == 0) {
 338		ealist->size = 0;
 339		return 0;
 340	}
 341
 342	/* Sanity Check */
 343	if ((sizeDXD(&ji->ea) > sizeof (ji->i_inline_ea)))
 344		return -EIO;
 345	if (le32_to_cpu(((struct jfs_ea_list *) &ji->i_inline_ea)->size)
 346	    != ea_size)
 347		return -EIO;
 348
 349	memcpy(ealist, ji->i_inline_ea, ea_size);
 350	return 0;
 351}
 352
 353/*
 354 * NAME: ea_read
 355 *
 356 * FUNCTION: copy EA data into user's buffer
 357 *
 358 * PARAMETERS:
 359 *	ip	- Inode pointer
 360 *	ealist	- Pointer to buffer to fill in with EA
 361 *
 362 * NOTES:  If EA is inline calls ea_read_inline() to copy EA.
 363 *
 364 * RETURNS: 0 for success; other indicates failure
 365 */
 366static int ea_read(struct inode *ip, struct jfs_ea_list *ealist)
 367{
 368	struct super_block *sb = ip->i_sb;
 369	struct jfs_inode_info *ji = JFS_IP(ip);
 370	struct jfs_sb_info *sbi = JFS_SBI(sb);
 371	int nblocks;
 372	s64 blkno;
 373	char *cp = (char *) ealist;
 374	int i;
 375	int nbytes, nb;
 376	s32 bytes_to_read;
 377	struct metapage *mp;
 378
 379	/* quick check for in-line EA */
 380	if (ji->ea.flag & DXD_INLINE)
 381		return ea_read_inline(ip, ealist);
 382
 383	nbytes = sizeDXD(&ji->ea);
 384	if (!nbytes) {
 385		jfs_error(sb, "nbytes is 0\n");
 386		return -EIO;
 387	}
 388
 389	/*
 390	 * Figure out how many blocks were allocated when this EA list was
 391	 * originally written to disk.
 392	 */
 393	nblocks = lengthDXD(&ji->ea) << sbi->l2nbperpage;
 394	blkno = addressDXD(&ji->ea) << sbi->l2nbperpage;
 395
 396	/*
 397	 * I have found the disk blocks which were originally used to store
 398	 * the FEALIST.  now i loop over each contiguous block copying the
 399	 * data into the buffer.
 400	 */
 401	for (i = 0; i < nblocks; i += sbi->nbperpage) {
 402		/*
 403		 * Determine how many bytes for this request, and round up to
 404		 * the nearest aggregate block size
 405		 */
 406		nb = min(PSIZE, nbytes);
 407		bytes_to_read =
 408		    ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
 409		    << sb->s_blocksize_bits;
 410
 411		if (!(mp = read_metapage(ip, blkno + i, bytes_to_read, 1)))
 412			return -EIO;
 413
 414		memcpy(cp, mp->data, nb);
 415		release_metapage(mp);
 416
 417		cp += PSIZE;
 418		nbytes -= nb;
 419	}
 420
 421	return 0;
 422}
 423
 424/*
 425 * NAME: ea_get
 426 *
 427 * FUNCTION: Returns buffer containing existing extended attributes.
 428 *	     The size of the buffer will be the larger of the existing
 429 *	     attributes size, or min_size.
 430 *
 431 *	     The buffer, which may be inlined in the inode or in the
 432 *	     page cache must be release by calling ea_release or ea_put
 433 *
 434 * PARAMETERS:
 435 *	inode	- Inode pointer
 436 *	ea_buf	- Structure to be populated with ealist and its metadata
 437 *	min_size- minimum size of buffer to be returned
 438 *
 439 * RETURNS: 0 for success; Other indicates failure
 440 */
 441static int ea_get(struct inode *inode, struct ea_buffer *ea_buf, int min_size)
 442{
 443	struct jfs_inode_info *ji = JFS_IP(inode);
 444	struct super_block *sb = inode->i_sb;
 445	int size;
 446	int ea_size = sizeDXD(&ji->ea);
 447	int blocks_needed, current_blocks;
 448	s64 blkno;
 449	int rc;
 450	int quota_allocation = 0;
 451
 452	/* When fsck.jfs clears a bad ea, it doesn't clear the size */
 453	if (ji->ea.flag == 0)
 454		ea_size = 0;
 455
 456	if (ea_size == 0) {
 457		if (min_size == 0) {
 458			ea_buf->flag = 0;
 459			ea_buf->max_size = 0;
 460			ea_buf->xattr = NULL;
 461			return 0;
 462		}
 463		if ((min_size <= sizeof (ji->i_inline_ea)) &&
 464		    (ji->mode2 & INLINEEA)) {
 465			ea_buf->flag = EA_INLINE | EA_NEW;
 466			ea_buf->max_size = sizeof (ji->i_inline_ea);
 467			ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
 468			DXDlength(&ea_buf->new_ea, 0);
 469			DXDaddress(&ea_buf->new_ea, 0);
 470			ea_buf->new_ea.flag = DXD_INLINE;
 471			DXDsize(&ea_buf->new_ea, min_size);
 472			return 0;
 473		}
 474		current_blocks = 0;
 475	} else if (ji->ea.flag & DXD_INLINE) {
 476		if (min_size <= sizeof (ji->i_inline_ea)) {
 477			ea_buf->flag = EA_INLINE;
 478			ea_buf->max_size = sizeof (ji->i_inline_ea);
 479			ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
 480			goto size_check;
 481		}
 482		current_blocks = 0;
 483	} else {
 484		if (!(ji->ea.flag & DXD_EXTENT)) {
 485			jfs_error(sb, "invalid ea.flag\n");
 486			return -EIO;
 487		}
 488		current_blocks = (ea_size + sb->s_blocksize - 1) >>
 489		    sb->s_blocksize_bits;
 490	}
 491	size = max(min_size, ea_size);
 492
 493	if (size > PSIZE) {
 494		/*
 495		 * To keep the rest of the code simple.  Allocate a
 496		 * contiguous buffer to work with
 497		 */
 498		ea_buf->xattr = kmalloc(size, GFP_KERNEL);
 499		if (ea_buf->xattr == NULL)
 500			return -ENOMEM;
 501
 502		ea_buf->flag = EA_MALLOC;
 503		ea_buf->max_size = (size + sb->s_blocksize - 1) &
 504		    ~(sb->s_blocksize - 1);
 505
 506		if (ea_size == 0)
 507			return 0;
 508
 509		if ((rc = ea_read(inode, ea_buf->xattr))) {
 510			kfree(ea_buf->xattr);
 511			ea_buf->xattr = NULL;
 512			return rc;
 513		}
 514		goto size_check;
 515	}
 516	blocks_needed = (min_size + sb->s_blocksize - 1) >>
 517	    sb->s_blocksize_bits;
 518
 519	if (blocks_needed > current_blocks) {
 520		/* Allocate new blocks to quota. */
 521		rc = dquot_alloc_block(inode, blocks_needed);
 522		if (rc)
 523			return -EDQUOT;
 524
 525		quota_allocation = blocks_needed;
 526
 527		rc = dbAlloc(inode, INOHINT(inode), (s64) blocks_needed,
 528			     &blkno);
 529		if (rc)
 530			goto clean_up;
 531
 532		DXDlength(&ea_buf->new_ea, blocks_needed);
 533		DXDaddress(&ea_buf->new_ea, blkno);
 534		ea_buf->new_ea.flag = DXD_EXTENT;
 535		DXDsize(&ea_buf->new_ea, min_size);
 536
 537		ea_buf->flag = EA_EXTENT | EA_NEW;
 538
 539		ea_buf->mp = get_metapage(inode, blkno,
 540					  blocks_needed << sb->s_blocksize_bits,
 541					  1);
 542		if (ea_buf->mp == NULL) {
 543			dbFree(inode, blkno, (s64) blocks_needed);
 544			rc = -EIO;
 545			goto clean_up;
 546		}
 547		ea_buf->xattr = ea_buf->mp->data;
 548		ea_buf->max_size = (min_size + sb->s_blocksize - 1) &
 549		    ~(sb->s_blocksize - 1);
 550		if (ea_size == 0)
 551			return 0;
 552		if ((rc = ea_read(inode, ea_buf->xattr))) {
 553			discard_metapage(ea_buf->mp);
 554			dbFree(inode, blkno, (s64) blocks_needed);
 555			goto clean_up;
 556		}
 557		goto size_check;
 558	}
 559	ea_buf->flag = EA_EXTENT;
 560	ea_buf->mp = read_metapage(inode, addressDXD(&ji->ea),
 561				   lengthDXD(&ji->ea) << sb->s_blocksize_bits,
 562				   1);
 563	if (ea_buf->mp == NULL) {
 564		rc = -EIO;
 565		goto clean_up;
 566	}
 567	ea_buf->xattr = ea_buf->mp->data;
 568	ea_buf->max_size = (ea_size + sb->s_blocksize - 1) &
 569	    ~(sb->s_blocksize - 1);
 570
 571      size_check:
 572	if (EALIST_SIZE(ea_buf->xattr) != ea_size) {
 573		printk(KERN_ERR "ea_get: invalid extended attribute\n");
 574		print_hex_dump(KERN_ERR, "", DUMP_PREFIX_ADDRESS, 16, 1,
 575				     ea_buf->xattr, ea_size, 1);
 576		ea_release(inode, ea_buf);
 577		rc = -EIO;
 578		goto clean_up;
 579	}
 580
 581	return ea_size;
 582
 583      clean_up:
 584	/* Rollback quota allocation */
 585	if (quota_allocation)
 586		dquot_free_block(inode, quota_allocation);
 587
 588	return (rc);
 589}
 590
 591static void ea_release(struct inode *inode, struct ea_buffer *ea_buf)
 592{
 593	if (ea_buf->flag & EA_MALLOC)
 594		kfree(ea_buf->xattr);
 595	else if (ea_buf->flag & EA_EXTENT) {
 596		assert(ea_buf->mp);
 597		release_metapage(ea_buf->mp);
 598
 599		if (ea_buf->flag & EA_NEW)
 600			dbFree(inode, addressDXD(&ea_buf->new_ea),
 601			       lengthDXD(&ea_buf->new_ea));
 602	}
 603}
 604
 605static int ea_put(tid_t tid, struct inode *inode, struct ea_buffer *ea_buf,
 606		  int new_size)
 607{
 608	struct jfs_inode_info *ji = JFS_IP(inode);
 609	unsigned long old_blocks, new_blocks;
 610	int rc = 0;
 611
 612	if (new_size == 0) {
 613		ea_release(inode, ea_buf);
 614		ea_buf = NULL;
 615	} else if (ea_buf->flag & EA_INLINE) {
 616		assert(new_size <= sizeof (ji->i_inline_ea));
 617		ji->mode2 &= ~INLINEEA;
 618		ea_buf->new_ea.flag = DXD_INLINE;
 619		DXDsize(&ea_buf->new_ea, new_size);
 620		DXDaddress(&ea_buf->new_ea, 0);
 621		DXDlength(&ea_buf->new_ea, 0);
 622	} else if (ea_buf->flag & EA_MALLOC) {
 623		rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
 624		kfree(ea_buf->xattr);
 625	} else if (ea_buf->flag & EA_NEW) {
 626		/* We have already allocated a new dxd */
 627		flush_metapage(ea_buf->mp);
 628	} else {
 629		/* ->xattr must point to original ea's metapage */
 630		rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
 631		discard_metapage(ea_buf->mp);
 632	}
 633	if (rc)
 634		return rc;
 635
 636	old_blocks = new_blocks = 0;
 637
 638	if (ji->ea.flag & DXD_EXTENT) {
 639		invalidate_dxd_metapages(inode, ji->ea);
 640		old_blocks = lengthDXD(&ji->ea);
 641	}
 642
 643	if (ea_buf) {
 644		txEA(tid, inode, &ji->ea, &ea_buf->new_ea);
 645		if (ea_buf->new_ea.flag & DXD_EXTENT) {
 646			new_blocks = lengthDXD(&ea_buf->new_ea);
 647			if (ji->ea.flag & DXD_INLINE)
 648				ji->mode2 |= INLINEEA;
 649		}
 650		ji->ea = ea_buf->new_ea;
 651	} else {
 652		txEA(tid, inode, &ji->ea, NULL);
 653		if (ji->ea.flag & DXD_INLINE)
 654			ji->mode2 |= INLINEEA;
 655		ji->ea.flag = 0;
 656		ji->ea.size = 0;
 657	}
 658
 659	/* If old blocks exist, they must be removed from quota allocation. */
 660	if (old_blocks)
 661		dquot_free_block(inode, old_blocks);
 662
 663	inode->i_ctime = CURRENT_TIME;
 664
 665	return 0;
 666}
 667
 668/*
 669 * Most of the permission checking is done by xattr_permission in the vfs.
 670 * We also need to verify that this is a namespace that we recognize.
 671 */
 672static int can_set_xattr(struct inode *inode, const char *name,
 673			 const void *value, size_t value_len)
 674{
 675	if (!strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN)) {
 676		/*
 677		 * This makes sure that we aren't trying to set an
 678		 * attribute in a different namespace by prefixing it
 679		 * with "os2."
 680		 */
 681		if (is_known_namespace(name + XATTR_OS2_PREFIX_LEN))
 682			return -EOPNOTSUPP;
 683		return 0;
 684	}
 685
 686	/*
 687	 * Don't allow setting an attribute in an unknown namespace.
 688	 */
 689	if (strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) &&
 690	    strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
 691	    strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN))
 692		return -EOPNOTSUPP;
 693
 694	return 0;
 695}
 696
 697int __jfs_setxattr(tid_t tid, struct inode *inode, const char *name,
 698		   const void *value, size_t value_len, int flags)
 699{
 700	struct jfs_ea_list *ealist;
 701	struct jfs_ea *ea, *old_ea = NULL, *next_ea = NULL;
 702	struct ea_buffer ea_buf;
 703	int old_ea_size = 0;
 704	int xattr_size;
 705	int new_size;
 706	int namelen = strlen(name);
 707	char *os2name = NULL;
 708	int found = 0;
 709	int rc;
 710	int length;
 711
 712	if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
 713		os2name = kmalloc(namelen - XATTR_OS2_PREFIX_LEN + 1,
 714				  GFP_KERNEL);
 715		if (!os2name)
 716			return -ENOMEM;
 717		strcpy(os2name, name + XATTR_OS2_PREFIX_LEN);
 718		name = os2name;
 719		namelen -= XATTR_OS2_PREFIX_LEN;
 720	}
 721
 722	down_write(&JFS_IP(inode)->xattr_sem);
 723
 724	xattr_size = ea_get(inode, &ea_buf, 0);
 725	if (xattr_size < 0) {
 726		rc = xattr_size;
 727		goto out;
 728	}
 729
 730      again:
 731	ealist = (struct jfs_ea_list *) ea_buf.xattr;
 732	new_size = sizeof (struct jfs_ea_list);
 733
 734	if (xattr_size) {
 735		for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist);
 736		     ea = NEXT_EA(ea)) {
 737			if ((namelen == ea->namelen) &&
 738			    (memcmp(name, ea->name, namelen) == 0)) {
 739				found = 1;
 740				if (flags & XATTR_CREATE) {
 741					rc = -EEXIST;
 742					goto release;
 743				}
 744				old_ea = ea;
 745				old_ea_size = EA_SIZE(ea);
 746				next_ea = NEXT_EA(ea);
 747			} else
 748				new_size += EA_SIZE(ea);
 749		}
 750	}
 751
 752	if (!found) {
 753		if (flags & XATTR_REPLACE) {
 754			rc = -ENODATA;
 755			goto release;
 756		}
 757		if (value == NULL) {
 758			rc = 0;
 759			goto release;
 760		}
 761	}
 762	if (value)
 763		new_size += sizeof (struct jfs_ea) + namelen + 1 + value_len;
 764
 765	if (new_size > ea_buf.max_size) {
 766		/*
 767		 * We need to allocate more space for merged ea list.
 768		 * We should only have loop to again: once.
 769		 */
 770		ea_release(inode, &ea_buf);
 771		xattr_size = ea_get(inode, &ea_buf, new_size);
 772		if (xattr_size < 0) {
 773			rc = xattr_size;
 774			goto out;
 775		}
 776		goto again;
 777	}
 778
 779	/* Remove old ea of the same name */
 780	if (found) {
 781		/* number of bytes following target EA */
 782		length = (char *) END_EALIST(ealist) - (char *) next_ea;
 783		if (length > 0)
 784			memmove(old_ea, next_ea, length);
 785		xattr_size -= old_ea_size;
 786	}
 787
 788	/* Add new entry to the end */
 789	if (value) {
 790		if (xattr_size == 0)
 791			/* Completely new ea list */
 792			xattr_size = sizeof (struct jfs_ea_list);
 793
 794		/*
 795		 * The size of EA value is limitted by on-disk format up to
 796		 *  __le16, there would be an overflow if the size is equal
 797		 * to XATTR_SIZE_MAX (65536).  In order to avoid this issue,
 798		 * we can pre-checkup the value size against USHRT_MAX, and
 799		 * return -E2BIG in this case, which is consistent with the
 800		 * VFS setxattr interface.
 801		 */
 802		if (value_len >= USHRT_MAX) {
 803			rc = -E2BIG;
 804			goto release;
 805		}
 806
 807		ea = (struct jfs_ea *) ((char *) ealist + xattr_size);
 808		ea->flag = 0;
 809		ea->namelen = namelen;
 810		ea->valuelen = (cpu_to_le16(value_len));
 811		memcpy(ea->name, name, namelen);
 812		ea->name[namelen] = 0;
 813		if (value_len)
 814			memcpy(&ea->name[namelen + 1], value, value_len);
 815		xattr_size += EA_SIZE(ea);
 816	}
 817
 818	/* DEBUG - If we did this right, these number match */
 819	if (xattr_size != new_size) {
 820		printk(KERN_ERR
 821		       "__jfs_setxattr: xattr_size = %d, new_size = %d\n",
 822		       xattr_size, new_size);
 823
 824		rc = -EINVAL;
 825		goto release;
 826	}
 827
 828	/*
 829	 * If we're left with an empty list, there's no ea
 830	 */
 831	if (new_size == sizeof (struct jfs_ea_list))
 832		new_size = 0;
 833
 834	ealist->size = cpu_to_le32(new_size);
 835
 836	rc = ea_put(tid, inode, &ea_buf, new_size);
 837
 838	goto out;
 839      release:
 840	ea_release(inode, &ea_buf);
 841      out:
 842	up_write(&JFS_IP(inode)->xattr_sem);
 843
 844	kfree(os2name);
 845
 846	return rc;
 847}
 848
 849int jfs_setxattr(struct dentry *dentry, const char *name, const void *value,
 850		 size_t value_len, int flags)
 851{
 852	struct inode *inode = dentry->d_inode;
 853	struct jfs_inode_info *ji = JFS_IP(inode);
 854	int rc;
 855	tid_t tid;
 856
 857	/*
 858	 * If this is a request for a synthetic attribute in the system.*
 859	 * namespace use the generic infrastructure to resolve a handler
 860	 * for it via sb->s_xattr.
 861	 */
 862	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
 863		return generic_setxattr(dentry, name, value, value_len, flags);
 864
 865	if ((rc = can_set_xattr(inode, name, value, value_len)))
 866		return rc;
 867
 868	if (value == NULL) {	/* empty EA, do not remove */
 869		value = "";
 870		value_len = 0;
 871	}
 872
 873	tid = txBegin(inode->i_sb, 0);
 874	mutex_lock(&ji->commit_mutex);
 875	rc = __jfs_setxattr(tid, dentry->d_inode, name, value, value_len,
 876			    flags);
 877	if (!rc)
 878		rc = txCommit(tid, 1, &inode, 0);
 879	txEnd(tid);
 880	mutex_unlock(&ji->commit_mutex);
 881
 882	return rc;
 883}
 884
 885ssize_t __jfs_getxattr(struct inode *inode, const char *name, void *data,
 886		       size_t buf_size)
 887{
 888	struct jfs_ea_list *ealist;
 889	struct jfs_ea *ea;
 890	struct ea_buffer ea_buf;
 891	int xattr_size;
 892	ssize_t size;
 893	int namelen = strlen(name);
 894	char *value;
 895
 896	down_read(&JFS_IP(inode)->xattr_sem);
 897
 898	xattr_size = ea_get(inode, &ea_buf, 0);
 899
 900	if (xattr_size < 0) {
 901		size = xattr_size;
 902		goto out;
 903	}
 904
 905	if (xattr_size == 0)
 906		goto not_found;
 907
 908	ealist = (struct jfs_ea_list *) ea_buf.xattr;
 909
 910	/* Find the named attribute */
 911	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea))
 912		if ((namelen == ea->namelen) &&
 913		    memcmp(name, ea->name, namelen) == 0) {
 914			/* Found it */
 915			size = le16_to_cpu(ea->valuelen);
 916			if (!data)
 917				goto release;
 918			else if (size > buf_size) {
 919				size = -ERANGE;
 920				goto release;
 921			}
 922			value = ((char *) &ea->name) + ea->namelen + 1;
 923			memcpy(data, value, size);
 924			goto release;
 925		}
 926      not_found:
 927	size = -ENODATA;
 928      release:
 929	ea_release(inode, &ea_buf);
 930      out:
 931	up_read(&JFS_IP(inode)->xattr_sem);
 932
 933	return size;
 934}
 935
 936ssize_t jfs_getxattr(struct dentry *dentry, const char *name, void *data,
 937		     size_t buf_size)
 938{
 939	int err;
 940
 941	/*
 942	 * If this is a request for a synthetic attribute in the system.*
 943	 * namespace use the generic infrastructure to resolve a handler
 944	 * for it via sb->s_xattr.
 945	 */
 946	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
 947		return generic_getxattr(dentry, name, data, buf_size);
 948
 949	if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
 950		/*
 951		 * skip past "os2." prefix
 952		 */
 953		name += XATTR_OS2_PREFIX_LEN;
 954		/*
 955		 * Don't allow retrieving properly prefixed attributes
 956		 * by prepending them with "os2."
 957		 */
 958		if (is_known_namespace(name))
 959			return -EOPNOTSUPP;
 960	}
 961
 962	err = __jfs_getxattr(dentry->d_inode, name, data, buf_size);
 963
 964	return err;
 965}
 966
 967/*
 968 * No special permissions are needed to list attributes except for trusted.*
 969 */
 970static inline int can_list(struct jfs_ea *ea)
 971{
 972	return (strncmp(ea->name, XATTR_TRUSTED_PREFIX,
 973			    XATTR_TRUSTED_PREFIX_LEN) ||
 974		capable(CAP_SYS_ADMIN));
 975}
 976
 977ssize_t jfs_listxattr(struct dentry * dentry, char *data, size_t buf_size)
 978{
 979	struct inode *inode = dentry->d_inode;
 980	char *buffer;
 981	ssize_t size = 0;
 982	int xattr_size;
 983	struct jfs_ea_list *ealist;
 984	struct jfs_ea *ea;
 985	struct ea_buffer ea_buf;
 986
 987	down_read(&JFS_IP(inode)->xattr_sem);
 988
 989	xattr_size = ea_get(inode, &ea_buf, 0);
 990	if (xattr_size < 0) {
 991		size = xattr_size;
 992		goto out;
 993	}
 994
 995	if (xattr_size == 0)
 996		goto release;
 997
 998	ealist = (struct jfs_ea_list *) ea_buf.xattr;
 999
1000	/* compute required size of list */
1001	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
1002		if (can_list(ea))
1003			size += name_size(ea) + 1;
1004	}
1005
1006	if (!data)
1007		goto release;
1008
1009	if (size > buf_size) {
1010		size = -ERANGE;
1011		goto release;
1012	}
1013
1014	/* Copy attribute names to buffer */
1015	buffer = data;
1016	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
1017		if (can_list(ea)) {
1018			int namelen = copy_name(buffer, ea);
1019			buffer += namelen + 1;
1020		}
1021	}
1022
1023      release:
1024	ea_release(inode, &ea_buf);
1025      out:
1026	up_read(&JFS_IP(inode)->xattr_sem);
1027	return size;
1028}
1029
1030int jfs_removexattr(struct dentry *dentry, const char *name)
1031{
1032	struct inode *inode = dentry->d_inode;
1033	struct jfs_inode_info *ji = JFS_IP(inode);
1034	int rc;
1035	tid_t tid;
1036
1037	/*
1038	 * If this is a request for a synthetic attribute in the system.*
1039	 * namespace use the generic infrastructure to resolve a handler
1040	 * for it via sb->s_xattr.
1041	 */
1042	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
1043		return generic_removexattr(dentry, name);
1044
1045	if ((rc = can_set_xattr(inode, name, NULL, 0)))
1046		return rc;
1047
1048	tid = txBegin(inode->i_sb, 0);
1049	mutex_lock(&ji->commit_mutex);
1050	rc = __jfs_setxattr(tid, dentry->d_inode, name, NULL, 0, XATTR_REPLACE);
1051	if (!rc)
1052		rc = txCommit(tid, 1, &inode, 0);
1053	txEnd(tid);
1054	mutex_unlock(&ji->commit_mutex);
1055
1056	return rc;
1057}
1058
/*
 * List of handlers for synthetic system.* attributes.  All real ondisk
 * attributes are handled directly.
 *
 * The POSIX ACL handlers are listed only when CONFIG_JFS_POSIX_ACL is
 * set; the array is terminated by a NULL entry.
 */
const struct xattr_handler *jfs_xattr_handlers[] = {
#ifdef CONFIG_JFS_POSIX_ACL
	&posix_acl_access_xattr_handler,
	&posix_acl_default_xattr_handler,
#endif
	NULL,
};
1070
1071
1072#ifdef CONFIG_JFS_SECURITY
1073static int jfs_initxattrs(struct inode *inode, const struct xattr *xattr_array,
1074			  void *fs_info)
1075{
1076	const struct xattr *xattr;
1077	tid_t *tid = fs_info;
1078	char *name;
1079	int err = 0;
1080
1081	for (xattr = xattr_array; xattr->name != NULL; xattr++) {
1082		name = kmalloc(XATTR_SECURITY_PREFIX_LEN +
1083			       strlen(xattr->name) + 1, GFP_NOFS);
1084		if (!name) {
1085			err = -ENOMEM;
1086			break;
1087		}
1088		strcpy(name, XATTR_SECURITY_PREFIX);
1089		strcpy(name + XATTR_SECURITY_PREFIX_LEN, xattr->name);
1090
1091		err = __jfs_setxattr(*tid, inode, name,
1092				     xattr->value, xattr->value_len, 0);
1093		kfree(name);
1094		if (err < 0)
1095			break;
1096	}
1097	return err;
1098}
1099
1100int jfs_init_security(tid_t tid, struct inode *inode, struct inode *dir,
1101		      const struct qstr *qstr)
1102{
1103	return security_inode_init_security(inode, dir, qstr,
1104					    &jfs_initxattrs, &tid);
1105}
1106#endif
v4.6
   1/*
   2 *   Copyright (C) International Business Machines  Corp., 2000-2004
   3 *   Copyright (C) Christoph Hellwig, 2002
   4 *
   5 *   This program is free software;  you can redistribute it and/or modify
   6 *   it under the terms of the GNU General Public License as published by
   7 *   the Free Software Foundation; either version 2 of the License, or
   8 *   (at your option) any later version.
   9 *
  10 *   This program is distributed in the hope that it will be useful,
  11 *   but WITHOUT ANY WARRANTY;  without even the implied warranty of
  12 *   MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See
  13 *   the GNU General Public License for more details.
  14 *
  15 *   You should have received a copy of the GNU General Public License
  16 *   along with this program;  if not, write to the Free Software
  17 *   Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
  18 */
  19
  20#include <linux/capability.h>
  21#include <linux/fs.h>
  22#include <linux/xattr.h>
  23#include <linux/posix_acl_xattr.h>
  24#include <linux/slab.h>
  25#include <linux/quotaops.h>
  26#include <linux/security.h>
  27#include "jfs_incore.h"
  28#include "jfs_superblock.h"
  29#include "jfs_dmap.h"
  30#include "jfs_debug.h"
  31#include "jfs_dinode.h"
  32#include "jfs_extent.h"
  33#include "jfs_metapage.h"
  34#include "jfs_xattr.h"
  35#include "jfs_acl.h"
  36
  37/*
  38 *	jfs_xattr.c: extended attribute service
  39 *
  40 * Overall design --
  41 *
  42 * Format:
  43 *
  44 *   Extended attribute lists (jfs_ea_list) consist of an overall size (32 bit
  45 *   value) and a variable (0 or more) number of extended attribute
  46 *   entries.  Each extended attribute entry (jfs_ea) is a <name,value> double
  47 *   where <name> is constructed from a null-terminated ascii string
  48 *   (1 ... 255 bytes in the name) and <value> is arbitrary 8 bit data
  49 *   (1 ... 65535 bytes).  The in-memory format is
  50 *
  51 *   0       1        2        4                4 + namelen + 1
  52 *   +-------+--------+--------+----------------+-------------------+
  53 *   | Flags | Name   | Value  | Name String \0 | Data . . . .      |
  54 *   |       | Length | Length |                |                   |
  55 *   +-------+--------+--------+----------------+-------------------+
  56 *
  57 *   A jfs_ea_list then is structured as
  58 *
  59 *   0            4                   4 + EA_SIZE(ea1)
  60 *   +------------+-------------------+--------------------+-----
  61 *   | Overall EA | First FEA Element | Second FEA Element | .....
  62 *   | List Size  |                   |                    |
  63 *   +------------+-------------------+--------------------+-----
  64 *
  65 *   On-disk:
  66 *
  67 *	FEALISTs are stored on disk using blocks allocated by dbAlloc() and
  68 *	written directly. An EA list may be in-lined in the inode if there is
  69 *	sufficient room available.
  70 */
  71
  72struct ea_buffer {
	/*
	 * Working state for one access to an inode's EA list: ea_get()
	 * fills it in, ea_release() and ea_put() consume it.  mp is only
	 * assigned by ea_get() on the paths that set EA_EXTENT.
	 */
  73	int flag;		/* Indicates what storage xattr points to */
  74	int max_size;		/* largest xattr that fits in current buffer */
  75	dxd_t new_ea;		/* dxd to replace ea when modifying xattr */
  76	struct metapage *mp;	/* metapage containing ea list */
  77	struct jfs_ea_list *xattr;	/* buffer containing ea list */
  78};
  79
  80/*
  81 * ea_buffer.flag values
  82 */
  83#define EA_INLINE	0x0001	/* xattr points at the inode's i_inline_ea */
  84#define EA_EXTENT	0x0002	/* xattr points at the data of metapage mp */
  85#define EA_NEW		0x0004	/* new_ea was set up by ea_get() */
  86#define EA_MALLOC	0x0008	/* xattr is a kmalloc()ed buffer */
  87
  88
  89static int is_known_namespace(const char *name)
  90{
  91	if (strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN) &&
  92	    strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN) &&
  93	    strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
  94	    strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN))
  95		return false;
  96
  97	return true;
  98}
  99
 100/*
 101 * These three routines are used to recognize on-disk extended attributes
 102 * that are in a recognized namespace.  If the attribute is not recognized,
 103 * "os2." is prepended to the name
 104 */
 105static int is_os2_xattr(struct jfs_ea *ea)
 106{
 107	return !is_known_namespace(ea->name);
 108}
 109
 110static inline int name_size(struct jfs_ea *ea)
 111{
 112	if (is_os2_xattr(ea))
 113		return ea->namelen + XATTR_OS2_PREFIX_LEN;
 114	else
 115		return ea->namelen;
 116}
 117
 118static inline int copy_name(char *buffer, struct jfs_ea *ea)
 119{
 120	int len = ea->namelen;
 121
 122	if (is_os2_xattr(ea)) {
 123		memcpy(buffer, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN);
 124		buffer += XATTR_OS2_PREFIX_LEN;
 125		len += XATTR_OS2_PREFIX_LEN;
 126	}
 127	memcpy(buffer, ea->name, ea->namelen);
 128	buffer[ea->namelen] = 0;
 129
 130	return len;
 131}
 132
 133/* Forward references */
 134static void ea_release(struct inode *inode, struct ea_buffer *ea_buf);
 135
 136/*
 137 * NAME: ea_write_inline
 138 *
 139 * FUNCTION: Attempt to write an EA inline if area is available
 140 *
 141 * PRE CONDITIONS:
 142 *	Already verified that the specified EA is small enough to fit inline
 143 *
 144 * PARAMETERS:
 145 *	ip	- Inode pointer
 146 *	ealist	- EA list pointer
 147 *	size	- size of ealist in bytes
 148 *	ea	- dxd_t structure to be filled in with necessary EA information
 149 *		  if we successfully copy the EA inline
 150 *
 151 * NOTES:
 152 *	Checks if the inode's inline area is available.  If so, copies EA inline
 153 *	and sets <ea> fields appropriately.  Otherwise, returns failure, EA will
 154 *	have to be put into an extent.
 155 *
 156 * RETURNS: 0 for successful copy to inline area; -1 if area not available
 157 */
 158static int ea_write_inline(struct inode *ip, struct jfs_ea_list *ealist,
 159			   int size, dxd_t * ea)
 160{
 161	struct jfs_inode_info *ji = JFS_IP(ip);
 162
 163	/*
 164	 * Make sure we have an EA -- the NULL EA list is valid, but you
 165	 * can't copy it!
 166	 */
 167	if (ealist && size > sizeof (struct jfs_ea_list)) {
 168		assert(size <= sizeof (ji->i_inline_ea));
 169
 170		/*
 171		 * See if the space is available or if it is already being
 172		 * used for an inline EA.
 173		 */
 174		if (!(ji->mode2 & INLINEEA) && !(ji->ea.flag & DXD_INLINE))
 175			return -EPERM;
 176
 177		DXDsize(ea, size);
 178		DXDlength(ea, 0);
 179		DXDaddress(ea, 0);
 180		memcpy(ji->i_inline_ea, ealist, size);
 181		ea->flag = DXD_INLINE;
 182		ji->mode2 &= ~INLINEEA;
 183	} else {
 184		ea->flag = 0;
 185		DXDsize(ea, 0);
 186		DXDlength(ea, 0);
 187		DXDaddress(ea, 0);
 188
 189		/* Free up INLINE area */
 190		if (ji->ea.flag & DXD_INLINE)
 191			ji->mode2 |= INLINEEA;
 192	}
 193
 194	return 0;
 195}
 196
 197/*
 198 * NAME: ea_write
 199 *
 200 * FUNCTION: Write an EA for an inode
 201 *
 202 * PRE CONDITIONS: EA has been verified
 203 *
 204 * PARAMETERS:
 205 *	ip	- Inode pointer
 206 *	ealist	- EA list pointer
 207 *	size	- size of ealist in bytes
 208 *	ea	- dxd_t structure to be filled in appropriately with where the
 209 *		  EA was copied
 210 *
 211 * NOTES: Will write EA inline if able to, otherwise allocates blocks for an
 212 *	extent and synchronously writes it to those blocks.
 213 *
 214 * RETURNS: 0 for success; Anything else indicates failure
 215 */
 216static int ea_write(struct inode *ip, struct jfs_ea_list *ealist, int size,
 217		       dxd_t * ea)
 218{
 219	struct super_block *sb = ip->i_sb;
 220	struct jfs_inode_info *ji = JFS_IP(ip);
 221	struct jfs_sb_info *sbi = JFS_SBI(sb);
 222	int nblocks;
 223	s64 blkno;
 224	int rc = 0, i;
 225	char *cp;
 226	s32 nbytes, nb;
 227	s32 bytes_to_write;
 228	struct metapage *mp;
 229
 230	/*
 231	 * Quick check to see if this is an in-linable EA.  Short EAs
 232	 * and empty EAs are all in-linable, provided the space exists.
 233	 */
 234	if (!ealist || size <= sizeof (ji->i_inline_ea)) {
 235		if (!ea_write_inline(ip, ealist, size, ea))
 236			return 0;
 237	}
 238
 239	/* figure out how many blocks we need */
 240	nblocks = (size + (sb->s_blocksize - 1)) >> sb->s_blocksize_bits;
 241
 242	/* Allocate new blocks to quota. */
 243	rc = dquot_alloc_block(ip, nblocks);
 244	if (rc)
 245		return rc;
 246
 247	rc = dbAlloc(ip, INOHINT(ip), nblocks, &blkno);
 248	if (rc) {
 249		/*Rollback quota allocation. */
 250		dquot_free_block(ip, nblocks);
 251		return rc;
 252	}
 253
 254	/*
 255	 * Now have nblocks worth of storage to stuff into the FEALIST.
 256	 * loop over the FEALIST copying data into the buffer one page at
 257	 * a time.
 258	 */
 259	cp = (char *) ealist;
 260	nbytes = size;
 261	for (i = 0; i < nblocks; i += sbi->nbperpage) {
 262		/*
 263		 * Determine how many bytes for this request, and round up to
 264		 * the nearest aggregate block size
 265		 */
 266		nb = min(PSIZE, nbytes);
 267		bytes_to_write =
 268		    ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
 269		    << sb->s_blocksize_bits;
 270
 271		if (!(mp = get_metapage(ip, blkno + i, bytes_to_write, 1))) {
 272			rc = -EIO;
 273			goto failed;
 274		}
 275
 276		memcpy(mp->data, cp, nb);
 277
 278		/*
 279		 * We really need a way to propagate errors for
 280		 * forced writes like this one.  --hch
 281		 *
 282		 * (__write_metapage => release_metapage => flush_metapage)
 283		 */
 284#ifdef _JFS_FIXME
 285		if ((rc = flush_metapage(mp))) {
 286			/*
 287			 * the write failed -- this means that the buffer
 288			 * is still assigned and the blocks are not being
 289			 * used.  this seems like the best error recovery
 290			 * we can get ...
 291			 */
 292			goto failed;
 293		}
 294#else
 295		flush_metapage(mp);
 296#endif
 297
 298		cp += PSIZE;
 299		nbytes -= nb;
 300	}
 301
 302	ea->flag = DXD_EXTENT;
 303	DXDsize(ea, le32_to_cpu(ealist->size));
 304	DXDlength(ea, nblocks);
 305	DXDaddress(ea, blkno);
 306
 307	/* Free up INLINE area */
 308	if (ji->ea.flag & DXD_INLINE)
 309		ji->mode2 |= INLINEEA;
 310
 311	return 0;
 312
 313      failed:
 314	/* Rollback quota allocation. */
 315	dquot_free_block(ip, nblocks);
 316
 317	dbFree(ip, blkno, nblocks);
 318	return rc;
 319}
 320
 321/*
 322 * NAME: ea_read_inline
 323 *
 324 * FUNCTION: Read an inlined EA into user's buffer
 325 *
 326 * PARAMETERS:
 327 *	ip	- Inode pointer
 328 *	ealist	- Pointer to buffer to fill in with EA
 329 *
 330 * RETURNS: 0
 331 */
 332static int ea_read_inline(struct inode *ip, struct jfs_ea_list *ealist)
 333{
 334	struct jfs_inode_info *ji = JFS_IP(ip);
 335	int ea_size = sizeDXD(&ji->ea);
 336
 337	if (ea_size == 0) {
 338		ealist->size = 0;
 339		return 0;
 340	}
 341
 342	/* Sanity Check */
 343	if ((sizeDXD(&ji->ea) > sizeof (ji->i_inline_ea)))
 344		return -EIO;
 345	if (le32_to_cpu(((struct jfs_ea_list *) &ji->i_inline_ea)->size)
 346	    != ea_size)
 347		return -EIO;
 348
 349	memcpy(ealist, ji->i_inline_ea, ea_size);
 350	return 0;
 351}
 352
 353/*
 354 * NAME: ea_read
 355 *
 356 * FUNCTION: copy EA data into user's buffer
 357 *
 358 * PARAMETERS:
 359 *	ip	- Inode pointer
 360 *	ealist	- Pointer to buffer to fill in with EA
 361 *
 362 * NOTES:  If EA is inline calls ea_read_inline() to copy EA.
 363 *
 364 * RETURNS: 0 for success; other indicates failure
 365 */
 366static int ea_read(struct inode *ip, struct jfs_ea_list *ealist)
 367{
 368	struct super_block *sb = ip->i_sb;
 369	struct jfs_inode_info *ji = JFS_IP(ip);
 370	struct jfs_sb_info *sbi = JFS_SBI(sb);
 371	int nblocks;
 372	s64 blkno;
 373	char *cp = (char *) ealist;
 374	int i;
 375	int nbytes, nb;
 376	s32 bytes_to_read;
 377	struct metapage *mp;
 378
 379	/* quick check for in-line EA */
 380	if (ji->ea.flag & DXD_INLINE)
 381		return ea_read_inline(ip, ealist);
 382
 383	nbytes = sizeDXD(&ji->ea);
 384	if (!nbytes) {
 385		jfs_error(sb, "nbytes is 0\n");
 386		return -EIO;
 387	}
 388
 389	/*
 390	 * Figure out how many blocks were allocated when this EA list was
 391	 * originally written to disk.
 392	 */
 393	nblocks = lengthDXD(&ji->ea) << sbi->l2nbperpage;
 394	blkno = addressDXD(&ji->ea) << sbi->l2nbperpage;
 395
 396	/*
 397	 * I have found the disk blocks which were originally used to store
 398	 * the FEALIST.  now i loop over each contiguous block copying the
 399	 * data into the buffer.
 400	 */
 401	for (i = 0; i < nblocks; i += sbi->nbperpage) {
 402		/*
 403		 * Determine how many bytes for this request, and round up to
 404		 * the nearest aggregate block size
 405		 */
 406		nb = min(PSIZE, nbytes);
 407		bytes_to_read =
 408		    ((((nb + sb->s_blocksize - 1)) >> sb->s_blocksize_bits))
 409		    << sb->s_blocksize_bits;
 410
 411		if (!(mp = read_metapage(ip, blkno + i, bytes_to_read, 1)))
 412			return -EIO;
 413
 414		memcpy(cp, mp->data, nb);
 415		release_metapage(mp);
 416
 417		cp += PSIZE;
 418		nbytes -= nb;
 419	}
 420
 421	return 0;
 422}
 423
 424/*
 425 * NAME: ea_get
 426 *
 427 * FUNCTION: Returns buffer containing existing extended attributes.
 428 *	     The size of the buffer will be the larger of the existing
 429 *	     attributes size, or min_size.
 430 *
 431 *	     The buffer, which may be inlined in the inode or in the
 432 *	     page cache must be release by calling ea_release or ea_put
 433 *
 434 * PARAMETERS:
 435 *	inode	- Inode pointer
 436 *	ea_buf	- Structure to be populated with ealist and its metadata
 437 *	min_size- minimum size of buffer to be returned
 438 *
 439 * RETURNS: 0 for success; Other indicates failure
 440 */
 441static int ea_get(struct inode *inode, struct ea_buffer *ea_buf, int min_size)
 442{
 443	struct jfs_inode_info *ji = JFS_IP(inode);
 444	struct super_block *sb = inode->i_sb;
 445	int size;
 446	int ea_size = sizeDXD(&ji->ea);
 447	int blocks_needed, current_blocks;
 448	s64 blkno;
 449	int rc;
 450	int quota_allocation = 0;
 451
 452	/* When fsck.jfs clears a bad ea, it doesn't clear the size */
 453	if (ji->ea.flag == 0)
 454		ea_size = 0;
 455
 456	if (ea_size == 0) {
 457		if (min_size == 0) {
 458			ea_buf->flag = 0;
 459			ea_buf->max_size = 0;
 460			ea_buf->xattr = NULL;
 461			return 0;
 462		}
 463		if ((min_size <= sizeof (ji->i_inline_ea)) &&
 464		    (ji->mode2 & INLINEEA)) {
 465			ea_buf->flag = EA_INLINE | EA_NEW;
 466			ea_buf->max_size = sizeof (ji->i_inline_ea);
 467			ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
 468			DXDlength(&ea_buf->new_ea, 0);
 469			DXDaddress(&ea_buf->new_ea, 0);
 470			ea_buf->new_ea.flag = DXD_INLINE;
 471			DXDsize(&ea_buf->new_ea, min_size);
 472			return 0;
 473		}
 474		current_blocks = 0;
 475	} else if (ji->ea.flag & DXD_INLINE) {
 476		if (min_size <= sizeof (ji->i_inline_ea)) {
 477			ea_buf->flag = EA_INLINE;
 478			ea_buf->max_size = sizeof (ji->i_inline_ea);
 479			ea_buf->xattr = (struct jfs_ea_list *) ji->i_inline_ea;
 480			goto size_check;
 481		}
 482		current_blocks = 0;
 483	} else {
 484		if (!(ji->ea.flag & DXD_EXTENT)) {
 485			jfs_error(sb, "invalid ea.flag\n");
 486			return -EIO;
 487		}
 488		current_blocks = (ea_size + sb->s_blocksize - 1) >>
 489		    sb->s_blocksize_bits;
 490	}
 491	size = max(min_size, ea_size);
 492
 493	if (size > PSIZE) {
 494		/*
 495		 * To keep the rest of the code simple.  Allocate a
 496		 * contiguous buffer to work with
 497		 */
 498		ea_buf->xattr = kmalloc(size, GFP_KERNEL);
 499		if (ea_buf->xattr == NULL)
 500			return -ENOMEM;
 501
 502		ea_buf->flag = EA_MALLOC;
 503		ea_buf->max_size = (size + sb->s_blocksize - 1) &
 504		    ~(sb->s_blocksize - 1);
 505
 506		if (ea_size == 0)
 507			return 0;
 508
 509		if ((rc = ea_read(inode, ea_buf->xattr))) {
 510			kfree(ea_buf->xattr);
 511			ea_buf->xattr = NULL;
 512			return rc;
 513		}
 514		goto size_check;
 515	}
 516	blocks_needed = (min_size + sb->s_blocksize - 1) >>
 517	    sb->s_blocksize_bits;
 518
 519	if (blocks_needed > current_blocks) {
 520		/* Allocate new blocks to quota. */
 521		rc = dquot_alloc_block(inode, blocks_needed);
 522		if (rc)
 523			return -EDQUOT;
 524
 525		quota_allocation = blocks_needed;
 526
 527		rc = dbAlloc(inode, INOHINT(inode), (s64) blocks_needed,
 528			     &blkno);
 529		if (rc)
 530			goto clean_up;
 531
 532		DXDlength(&ea_buf->new_ea, blocks_needed);
 533		DXDaddress(&ea_buf->new_ea, blkno);
 534		ea_buf->new_ea.flag = DXD_EXTENT;
 535		DXDsize(&ea_buf->new_ea, min_size);
 536
 537		ea_buf->flag = EA_EXTENT | EA_NEW;
 538
 539		ea_buf->mp = get_metapage(inode, blkno,
 540					  blocks_needed << sb->s_blocksize_bits,
 541					  1);
 542		if (ea_buf->mp == NULL) {
 543			dbFree(inode, blkno, (s64) blocks_needed);
 544			rc = -EIO;
 545			goto clean_up;
 546		}
 547		ea_buf->xattr = ea_buf->mp->data;
 548		ea_buf->max_size = (min_size + sb->s_blocksize - 1) &
 549		    ~(sb->s_blocksize - 1);
 550		if (ea_size == 0)
 551			return 0;
 552		if ((rc = ea_read(inode, ea_buf->xattr))) {
 553			discard_metapage(ea_buf->mp);
 554			dbFree(inode, blkno, (s64) blocks_needed);
 555			goto clean_up;
 556		}
 557		goto size_check;
 558	}
 559	ea_buf->flag = EA_EXTENT;
 560	ea_buf->mp = read_metapage(inode, addressDXD(&ji->ea),
 561				   lengthDXD(&ji->ea) << sb->s_blocksize_bits,
 562				   1);
 563	if (ea_buf->mp == NULL) {
 564		rc = -EIO;
 565		goto clean_up;
 566	}
 567	ea_buf->xattr = ea_buf->mp->data;
 568	ea_buf->max_size = (ea_size + sb->s_blocksize - 1) &
 569	    ~(sb->s_blocksize - 1);
 570
 571      size_check:
 572	if (EALIST_SIZE(ea_buf->xattr) != ea_size) {
 573		printk(KERN_ERR "ea_get: invalid extended attribute\n");
 574		print_hex_dump(KERN_ERR, "", DUMP_PREFIX_ADDRESS, 16, 1,
 575				     ea_buf->xattr, ea_size, 1);
 576		ea_release(inode, ea_buf);
 577		rc = -EIO;
 578		goto clean_up;
 579	}
 580
 581	return ea_size;
 582
 583      clean_up:
 584	/* Rollback quota allocation */
 585	if (quota_allocation)
 586		dquot_free_block(inode, quota_allocation);
 587
 588	return (rc);
 589}
 590
 591static void ea_release(struct inode *inode, struct ea_buffer *ea_buf)
 592{
 593	if (ea_buf->flag & EA_MALLOC)
 594		kfree(ea_buf->xattr);
 595	else if (ea_buf->flag & EA_EXTENT) {
 596		assert(ea_buf->mp);
 597		release_metapage(ea_buf->mp);
 598
 599		if (ea_buf->flag & EA_NEW)
 600			dbFree(inode, addressDXD(&ea_buf->new_ea),
 601			       lengthDXD(&ea_buf->new_ea));
 602	}
 603}
 604
 605static int ea_put(tid_t tid, struct inode *inode, struct ea_buffer *ea_buf,
 606		  int new_size)
 607{
 608	struct jfs_inode_info *ji = JFS_IP(inode);
 609	unsigned long old_blocks, new_blocks;
 610	int rc = 0;
 611
 612	if (new_size == 0) {
 613		ea_release(inode, ea_buf);
 614		ea_buf = NULL;
 615	} else if (ea_buf->flag & EA_INLINE) {
 616		assert(new_size <= sizeof (ji->i_inline_ea));
 617		ji->mode2 &= ~INLINEEA;
 618		ea_buf->new_ea.flag = DXD_INLINE;
 619		DXDsize(&ea_buf->new_ea, new_size);
 620		DXDaddress(&ea_buf->new_ea, 0);
 621		DXDlength(&ea_buf->new_ea, 0);
 622	} else if (ea_buf->flag & EA_MALLOC) {
 623		rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
 624		kfree(ea_buf->xattr);
 625	} else if (ea_buf->flag & EA_NEW) {
 626		/* We have already allocated a new dxd */
 627		flush_metapage(ea_buf->mp);
 628	} else {
 629		/* ->xattr must point to original ea's metapage */
 630		rc = ea_write(inode, ea_buf->xattr, new_size, &ea_buf->new_ea);
 631		discard_metapage(ea_buf->mp);
 632	}
 633	if (rc)
 634		return rc;
 635
 636	old_blocks = new_blocks = 0;
 637
 638	if (ji->ea.flag & DXD_EXTENT) {
 639		invalidate_dxd_metapages(inode, ji->ea);
 640		old_blocks = lengthDXD(&ji->ea);
 641	}
 642
 643	if (ea_buf) {
 644		txEA(tid, inode, &ji->ea, &ea_buf->new_ea);
 645		if (ea_buf->new_ea.flag & DXD_EXTENT) {
 646			new_blocks = lengthDXD(&ea_buf->new_ea);
 647			if (ji->ea.flag & DXD_INLINE)
 648				ji->mode2 |= INLINEEA;
 649		}
 650		ji->ea = ea_buf->new_ea;
 651	} else {
 652		txEA(tid, inode, &ji->ea, NULL);
 653		if (ji->ea.flag & DXD_INLINE)
 654			ji->mode2 |= INLINEEA;
 655		ji->ea.flag = 0;
 656		ji->ea.size = 0;
 657	}
 658
 659	/* If old blocks exist, they must be removed from quota allocation. */
 660	if (old_blocks)
 661		dquot_free_block(inode, old_blocks);
 662
 663	inode->i_ctime = CURRENT_TIME;
 664
 665	return 0;
 666}
 667
 668/*
 669 * Most of the permission checking is done by xattr_permission in the vfs.
 670 * We also need to verify that this is a namespace that we recognize.
 671 */
 672static int can_set_xattr(struct inode *inode, const char *name,
 673			 const void *value, size_t value_len)
 674{
 675	if (!strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN)) {
 676		/*
 677		 * This makes sure that we aren't trying to set an
 678		 * attribute in a different namespace by prefixing it
 679		 * with "os2."
 680		 */
 681		if (is_known_namespace(name + XATTR_OS2_PREFIX_LEN))
 682			return -EOPNOTSUPP;
 683		return 0;
 684	}
 685
 686	/*
 687	 * Don't allow setting an attribute in an unknown namespace.
 688	 */
 689	if (strncmp(name, XATTR_TRUSTED_PREFIX, XATTR_TRUSTED_PREFIX_LEN) &&
 690	    strncmp(name, XATTR_SECURITY_PREFIX, XATTR_SECURITY_PREFIX_LEN) &&
 691	    strncmp(name, XATTR_USER_PREFIX, XATTR_USER_PREFIX_LEN))
 692		return -EOPNOTSUPP;
 693
 694	return 0;
 695}
 696
 697int __jfs_setxattr(tid_t tid, struct inode *inode, const char *name,
 698		   const void *value, size_t value_len, int flags)
 699{
 700	struct jfs_ea_list *ealist;
 701	struct jfs_ea *ea, *old_ea = NULL, *next_ea = NULL;
 702	struct ea_buffer ea_buf;
 703	int old_ea_size = 0;
 704	int xattr_size;
 705	int new_size;
 706	int namelen = strlen(name);
 707	char *os2name = NULL;
 708	int found = 0;
 709	int rc;
 710	int length;
 711
 712	if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
 713		os2name = kmalloc(namelen - XATTR_OS2_PREFIX_LEN + 1,
 714				  GFP_KERNEL);
 715		if (!os2name)
 716			return -ENOMEM;
 717		strcpy(os2name, name + XATTR_OS2_PREFIX_LEN);
 718		name = os2name;
 719		namelen -= XATTR_OS2_PREFIX_LEN;
 720	}
 721
 722	down_write(&JFS_IP(inode)->xattr_sem);
 723
 724	xattr_size = ea_get(inode, &ea_buf, 0);
 725	if (xattr_size < 0) {
 726		rc = xattr_size;
 727		goto out;
 728	}
 729
 730      again:
 731	ealist = (struct jfs_ea_list *) ea_buf.xattr;
 732	new_size = sizeof (struct jfs_ea_list);
 733
 734	if (xattr_size) {
 735		for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist);
 736		     ea = NEXT_EA(ea)) {
 737			if ((namelen == ea->namelen) &&
 738			    (memcmp(name, ea->name, namelen) == 0)) {
 739				found = 1;
 740				if (flags & XATTR_CREATE) {
 741					rc = -EEXIST;
 742					goto release;
 743				}
 744				old_ea = ea;
 745				old_ea_size = EA_SIZE(ea);
 746				next_ea = NEXT_EA(ea);
 747			} else
 748				new_size += EA_SIZE(ea);
 749		}
 750	}
 751
 752	if (!found) {
 753		if (flags & XATTR_REPLACE) {
 754			rc = -ENODATA;
 755			goto release;
 756		}
 757		if (value == NULL) {
 758			rc = 0;
 759			goto release;
 760		}
 761	}
 762	if (value)
 763		new_size += sizeof (struct jfs_ea) + namelen + 1 + value_len;
 764
 765	if (new_size > ea_buf.max_size) {
 766		/*
 767		 * We need to allocate more space for merged ea list.
 768		 * We should only have loop to again: once.
 769		 */
 770		ea_release(inode, &ea_buf);
 771		xattr_size = ea_get(inode, &ea_buf, new_size);
 772		if (xattr_size < 0) {
 773			rc = xattr_size;
 774			goto out;
 775		}
 776		goto again;
 777	}
 778
 779	/* Remove old ea of the same name */
 780	if (found) {
 781		/* number of bytes following target EA */
 782		length = (char *) END_EALIST(ealist) - (char *) next_ea;
 783		if (length > 0)
 784			memmove(old_ea, next_ea, length);
 785		xattr_size -= old_ea_size;
 786	}
 787
 788	/* Add new entry to the end */
 789	if (value) {
 790		if (xattr_size == 0)
 791			/* Completely new ea list */
 792			xattr_size = sizeof (struct jfs_ea_list);
 793
 794		/*
 795		 * The size of EA value is limitted by on-disk format up to
 796		 *  __le16, there would be an overflow if the size is equal
 797		 * to XATTR_SIZE_MAX (65536).  In order to avoid this issue,
 798		 * we can pre-checkup the value size against USHRT_MAX, and
 799		 * return -E2BIG in this case, which is consistent with the
 800		 * VFS setxattr interface.
 801		 */
 802		if (value_len >= USHRT_MAX) {
 803			rc = -E2BIG;
 804			goto release;
 805		}
 806
 807		ea = (struct jfs_ea *) ((char *) ealist + xattr_size);
 808		ea->flag = 0;
 809		ea->namelen = namelen;
 810		ea->valuelen = (cpu_to_le16(value_len));
 811		memcpy(ea->name, name, namelen);
 812		ea->name[namelen] = 0;
 813		if (value_len)
 814			memcpy(&ea->name[namelen + 1], value, value_len);
 815		xattr_size += EA_SIZE(ea);
 816	}
 817
 818	/* DEBUG - If we did this right, these number match */
 819	if (xattr_size != new_size) {
 820		printk(KERN_ERR
 821		       "__jfs_setxattr: xattr_size = %d, new_size = %d\n",
 822		       xattr_size, new_size);
 823
 824		rc = -EINVAL;
 825		goto release;
 826	}
 827
 828	/*
 829	 * If we're left with an empty list, there's no ea
 830	 */
 831	if (new_size == sizeof (struct jfs_ea_list))
 832		new_size = 0;
 833
 834	ealist->size = cpu_to_le32(new_size);
 835
 836	rc = ea_put(tid, inode, &ea_buf, new_size);
 837
 838	goto out;
 839      release:
 840	ea_release(inode, &ea_buf);
 841      out:
 842	up_write(&JFS_IP(inode)->xattr_sem);
 843
 844	kfree(os2name);
 845
 846	return rc;
 847}
 848
 849int jfs_setxattr(struct dentry *dentry, const char *name, const void *value,
 850		 size_t value_len, int flags)
 851{
 852	struct inode *inode = d_inode(dentry);
 853	struct jfs_inode_info *ji = JFS_IP(inode);
 854	int rc;
 855	tid_t tid;
 856
 857	/*
 858	 * If this is a request for a synthetic attribute in the system.*
 859	 * namespace use the generic infrastructure to resolve a handler
 860	 * for it via sb->s_xattr.
 861	 */
 862	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
 863		return generic_setxattr(dentry, name, value, value_len, flags);
 864
 865	if ((rc = can_set_xattr(inode, name, value, value_len)))
 866		return rc;
 867
 868	if (value == NULL) {	/* empty EA, do not remove */
 869		value = "";
 870		value_len = 0;
 871	}
 872
 873	tid = txBegin(inode->i_sb, 0);
 874	mutex_lock(&ji->commit_mutex);
 875	rc = __jfs_setxattr(tid, d_inode(dentry), name, value, value_len,
 876			    flags);
 877	if (!rc)
 878		rc = txCommit(tid, 1, &inode, 0);
 879	txEnd(tid);
 880	mutex_unlock(&ji->commit_mutex);
 881
 882	return rc;
 883}
 884
 885ssize_t __jfs_getxattr(struct inode *inode, const char *name, void *data,
 886		       size_t buf_size)
 887{
 888	struct jfs_ea_list *ealist;
 889	struct jfs_ea *ea;
 890	struct ea_buffer ea_buf;
 891	int xattr_size;
 892	ssize_t size;
 893	int namelen = strlen(name);
 894	char *value;
 895
 896	down_read(&JFS_IP(inode)->xattr_sem);
 897
 898	xattr_size = ea_get(inode, &ea_buf, 0);
 899
 900	if (xattr_size < 0) {
 901		size = xattr_size;
 902		goto out;
 903	}
 904
 905	if (xattr_size == 0)
 906		goto not_found;
 907
 908	ealist = (struct jfs_ea_list *) ea_buf.xattr;
 909
 910	/* Find the named attribute */
 911	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea))
 912		if ((namelen == ea->namelen) &&
 913		    memcmp(name, ea->name, namelen) == 0) {
 914			/* Found it */
 915			size = le16_to_cpu(ea->valuelen);
 916			if (!data)
 917				goto release;
 918			else if (size > buf_size) {
 919				size = -ERANGE;
 920				goto release;
 921			}
 922			value = ((char *) &ea->name) + ea->namelen + 1;
 923			memcpy(data, value, size);
 924			goto release;
 925		}
 926      not_found:
 927	size = -ENODATA;
 928      release:
 929	ea_release(inode, &ea_buf);
 930      out:
 931	up_read(&JFS_IP(inode)->xattr_sem);
 932
 933	return size;
 934}
 935
 936ssize_t jfs_getxattr(struct dentry *dentry, const char *name, void *data,
 937		     size_t buf_size)
 938{
 939	int err;
 940
 941	/*
 942	 * If this is a request for a synthetic attribute in the system.*
 943	 * namespace use the generic infrastructure to resolve a handler
 944	 * for it via sb->s_xattr.
 945	 */
 946	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
 947		return generic_getxattr(dentry, name, data, buf_size);
 948
 949	if (strncmp(name, XATTR_OS2_PREFIX, XATTR_OS2_PREFIX_LEN) == 0) {
 950		/*
 951		 * skip past "os2." prefix
 952		 */
 953		name += XATTR_OS2_PREFIX_LEN;
 954		/*
 955		 * Don't allow retrieving properly prefixed attributes
 956		 * by prepending them with "os2."
 957		 */
 958		if (is_known_namespace(name))
 959			return -EOPNOTSUPP;
 960	}
 961
 962	err = __jfs_getxattr(d_inode(dentry), name, data, buf_size);
 963
 964	return err;
 965}
 966
 967/*
 968 * No special permissions are needed to list attributes except for trusted.*
 969 */
 970static inline int can_list(struct jfs_ea *ea)
 971{
 972	return (strncmp(ea->name, XATTR_TRUSTED_PREFIX,
 973			    XATTR_TRUSTED_PREFIX_LEN) ||
 974		capable(CAP_SYS_ADMIN));
 975}
 976
 977ssize_t jfs_listxattr(struct dentry * dentry, char *data, size_t buf_size)
 978{
 979	struct inode *inode = d_inode(dentry);
 980	char *buffer;
 981	ssize_t size = 0;
 982	int xattr_size;
 983	struct jfs_ea_list *ealist;
 984	struct jfs_ea *ea;
 985	struct ea_buffer ea_buf;
 986
 987	down_read(&JFS_IP(inode)->xattr_sem);
 988
 989	xattr_size = ea_get(inode, &ea_buf, 0);
 990	if (xattr_size < 0) {
 991		size = xattr_size;
 992		goto out;
 993	}
 994
 995	if (xattr_size == 0)
 996		goto release;
 997
 998	ealist = (struct jfs_ea_list *) ea_buf.xattr;
 999
1000	/* compute required size of list */
1001	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
1002		if (can_list(ea))
1003			size += name_size(ea) + 1;
1004	}
1005
1006	if (!data)
1007		goto release;
1008
1009	if (size > buf_size) {
1010		size = -ERANGE;
1011		goto release;
1012	}
1013
1014	/* Copy attribute names to buffer */
1015	buffer = data;
1016	for (ea = FIRST_EA(ealist); ea < END_EALIST(ealist); ea = NEXT_EA(ea)) {
1017		if (can_list(ea)) {
1018			int namelen = copy_name(buffer, ea);
1019			buffer += namelen + 1;
1020		}
1021	}
1022
1023      release:
1024	ea_release(inode, &ea_buf);
1025      out:
1026	up_read(&JFS_IP(inode)->xattr_sem);
1027	return size;
1028}
1029
1030int jfs_removexattr(struct dentry *dentry, const char *name)
1031{
1032	struct inode *inode = d_inode(dentry);
1033	struct jfs_inode_info *ji = JFS_IP(inode);
1034	int rc;
1035	tid_t tid;
1036
1037	/*
1038	 * If this is a request for a synthetic attribute in the system.*
1039	 * namespace use the generic infrastructure to resolve a handler
1040	 * for it via sb->s_xattr.
1041	 */
1042	if (!strncmp(name, XATTR_SYSTEM_PREFIX, XATTR_SYSTEM_PREFIX_LEN))
1043		return generic_removexattr(dentry, name);
1044
1045	if ((rc = can_set_xattr(inode, name, NULL, 0)))
1046		return rc;
1047
1048	tid = txBegin(inode->i_sb, 0);
1049	mutex_lock(&ji->commit_mutex);
1050	rc = __jfs_setxattr(tid, d_inode(dentry), name, NULL, 0, XATTR_REPLACE);
1051	if (!rc)
1052		rc = txCommit(tid, 1, &inode, 0);
1053	txEnd(tid);
1054	mutex_unlock(&ji->commit_mutex);
1055
1056	return rc;
1057}
1058
1059/*
1060 * List of handlers for synthetic system.* attributes.  All real ondisk
1061 * attributes are handled directly.
1062 */
1063const struct xattr_handler *jfs_xattr_handlers[] = {
	/* The ACL handlers are only present when POSIX ACL support is built */
1064#ifdef CONFIG_JFS_POSIX_ACL
1065	&posix_acl_access_xattr_handler,
1066	&posix_acl_default_xattr_handler,
1067#endif
	/* The table always ends with a NULL entry */
1068	NULL,
1069};
1070
1071
1072#ifdef CONFIG_JFS_SECURITY
1073static int jfs_initxattrs(struct inode *inode, const struct xattr *xattr_array,
1074			  void *fs_info)
1075{
1076	const struct xattr *xattr;
1077	tid_t *tid = fs_info;
1078	char *name;
1079	int err = 0;
1080
1081	for (xattr = xattr_array; xattr->name != NULL; xattr++) {
1082		name = kmalloc(XATTR_SECURITY_PREFIX_LEN +
1083			       strlen(xattr->name) + 1, GFP_NOFS);
1084		if (!name) {
1085			err = -ENOMEM;
1086			break;
1087		}
1088		strcpy(name, XATTR_SECURITY_PREFIX);
1089		strcpy(name + XATTR_SECURITY_PREFIX_LEN, xattr->name);
1090
1091		err = __jfs_setxattr(*tid, inode, name,
1092				     xattr->value, xattr->value_len, 0);
1093		kfree(name);
1094		if (err < 0)
1095			break;
1096	}
1097	return err;
1098}
1099
1100int jfs_init_security(tid_t tid, struct inode *inode, struct inode *dir,
1101		      const struct qstr *qstr)
1102{
1103	return security_inode_init_security(inode, dir, qstr,
1104					    &jfs_initxattrs, &tid);
1105}
1106#endif