/*
 * linux/fs/ext4/xattr.c
 *
 * Copyright (C) 2001-2003 Andreas Gruenbacher, <agruen@suse.de>
 *
 * Fix by Harrison Xing <harrison@mountainviewdata.com>.
 * Ext4 code with a lot of help from Eric Jarman <ejarman@acm.org>.
 * Extended attributes for symlinks and special files added per
 *  suggestion of Luka Renko <luka.renko@hermes.si>.
 * xattr consolidation Copyright (c) 2004 James Morris <jmorris@redhat.com>,
 *  Red Hat Inc.
 * ea-in-inode support by Alex Tomas <alex@clusterfs.com> aka bzzz
 *  and Andreas Gruenbacher <agruen@suse.de>.
 */

/*
 * Extended attributes are stored directly in inodes (on file systems with
 * inodes bigger than 128 bytes) and on additional disk blocks. The i_file_acl
 * field contains the block number if an inode uses an additional block. All
 * attributes must fit in the inode and one additional block. Blocks that
 * contain the identical set of attributes may be shared among several inodes.
 * Identical blocks are detected by keeping a cache of blocks that have
 * recently been accessed.
 *
 * The attributes in inodes and on blocks have a different header; the entries
 * are stored in the same format:
 *
 *   +------------------+
 *   | header           |
 *   | entry 1          | |
 *   | entry 2          | | growing downwards
 *   | entry 3          | v
 *   | four null bytes  |
 *   | . . .            |
 *   | value 1          | ^
 *   | value 3          | | growing upwards
 *   | value 2          | |
 *   +------------------+
 *
 * The header is followed by multiple entry descriptors. In disk blocks, the
 * entry descriptors are kept sorted. In inodes, they are unsorted. The
 * attribute values are aligned to the end of the block in no specific order.
 *
 * Locking strategy
 * ----------------
 * EXT4_I(inode)->i_file_acl is protected by EXT4_I(inode)->xattr_sem.
 * EA blocks are only changed if they are exclusive to an inode, so
 * holding xattr_sem also means that nothing but the EA block's reference
 * count can change. Multiple writers to the same block are synchronized
 * by the buffer lock.
 */
#include <linux/init.h>
#include <linux/fs.h>
#include <linux/slab.h>
#include <linux/mbcache.h>
#include <linux/quotaops.h>
#include "ext4_jbd2.h"
#include "ext4.h"
#include "xattr.h"
#include "acl.h"
/*
 * Debug helpers.  With EXT4_XATTR_DEBUG defined, each message is prefixed
 * with the inode (or buffer) it refers to; otherwise the calls compile to
 * no_printk() so the format strings are still type-checked.
 */
#ifdef EXT4_XATTR_DEBUG
# define ea_idebug(inode, f...) do { \
		printk(KERN_DEBUG "inode %s:%lu: ", \
			(inode)->i_sb->s_id, (inode)->i_ino); \
		printk(f); \
		printk("\n"); \
	} while (0)
# define ea_bdebug(bh, f...) do { \
		printk(KERN_DEBUG "block %pg:%lu: ", \
			(bh)->b_bdev, (unsigned long) (bh)->b_blocknr); \
		printk(f); \
		printk("\n"); \
	} while (0)
#else
# define ea_idebug(inode, fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
# define ea_bdebug(bh, fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
#endif
81 static void ext4_xattr_cache_insert(struct mb_cache
*, struct buffer_head
*);
82 static struct buffer_head
*ext4_xattr_cache_find(struct inode
*,
83 struct ext4_xattr_header
*,
84 struct mb_cache_entry
**);
85 static void ext4_xattr_rehash(struct ext4_xattr_header
*,
86 struct ext4_xattr_entry
*);
87 static int ext4_xattr_list(struct dentry
*dentry
, char *buffer
,
90 static const struct xattr_handler
*ext4_xattr_handler_map
[] = {
91 [EXT4_XATTR_INDEX_USER
] = &ext4_xattr_user_handler
,
92 #ifdef CONFIG_EXT4_FS_POSIX_ACL
93 [EXT4_XATTR_INDEX_POSIX_ACL_ACCESS
] = &posix_acl_access_xattr_handler
,
94 [EXT4_XATTR_INDEX_POSIX_ACL_DEFAULT
] = &posix_acl_default_xattr_handler
,
96 [EXT4_XATTR_INDEX_TRUSTED
] = &ext4_xattr_trusted_handler
,
97 #ifdef CONFIG_EXT4_FS_SECURITY
98 [EXT4_XATTR_INDEX_SECURITY
] = &ext4_xattr_security_handler
,
102 const struct xattr_handler
*ext4_xattr_handlers
[] = {
103 &ext4_xattr_user_handler
,
104 &ext4_xattr_trusted_handler
,
105 #ifdef CONFIG_EXT4_FS_POSIX_ACL
106 &posix_acl_access_xattr_handler
,
107 &posix_acl_default_xattr_handler
,
109 #ifdef CONFIG_EXT4_FS_SECURITY
110 &ext4_xattr_security_handler
,
/* The mbcache instance of the super block that owns @inode. */
#define EXT4_GET_MB_CACHE(inode)	(((struct ext4_sb_info *) \
				(inode)->i_sb->s_fs_info)->s_mb_cache)
118 static __le32
ext4_xattr_block_csum(struct inode
*inode
,
120 struct ext4_xattr_header
*hdr
)
122 struct ext4_sb_info
*sbi
= EXT4_SB(inode
->i_sb
);
125 __le64 dsk_block_nr
= cpu_to_le64(block_nr
);
127 save_csum
= hdr
->h_checksum
;
129 csum
= ext4_chksum(sbi
, sbi
->s_csum_seed
, (__u8
*)&dsk_block_nr
,
130 sizeof(dsk_block_nr
));
131 csum
= ext4_chksum(sbi
, csum
, (__u8
*)hdr
,
132 EXT4_BLOCK_SIZE(inode
->i_sb
));
134 hdr
->h_checksum
= save_csum
;
135 return cpu_to_le32(csum
);
138 static int ext4_xattr_block_csum_verify(struct inode
*inode
,
140 struct ext4_xattr_header
*hdr
)
142 if (ext4_has_metadata_csum(inode
->i_sb
) &&
143 (hdr
->h_checksum
!= ext4_xattr_block_csum(inode
, block_nr
, hdr
)))
148 static void ext4_xattr_block_csum_set(struct inode
*inode
,
150 struct ext4_xattr_header
*hdr
)
152 if (!ext4_has_metadata_csum(inode
->i_sb
))
155 hdr
->h_checksum
= ext4_xattr_block_csum(inode
, block_nr
, hdr
);
158 static inline int ext4_handle_dirty_xattr_block(handle_t
*handle
,
160 struct buffer_head
*bh
)
162 ext4_xattr_block_csum_set(inode
, bh
->b_blocknr
, BHDR(bh
));
163 return ext4_handle_dirty_metadata(handle
, inode
, bh
);
166 static inline const struct xattr_handler
*
167 ext4_xattr_handler(int name_index
)
169 const struct xattr_handler
*handler
= NULL
;
171 if (name_index
> 0 && name_index
< ARRAY_SIZE(ext4_xattr_handler_map
))
172 handler
= ext4_xattr_handler_map
[name_index
];
177 * Inode operation listxattr()
179 * d_inode(dentry)->i_mutex: don't care
182 ext4_listxattr(struct dentry
*dentry
, char *buffer
, size_t size
)
184 return ext4_xattr_list(dentry
, buffer
, size
);
188 ext4_xattr_check_names(struct ext4_xattr_entry
*entry
, void *end
,
191 struct ext4_xattr_entry
*e
= entry
;
193 while (!IS_LAST_ENTRY(e
)) {
194 struct ext4_xattr_entry
*next
= EXT4_XATTR_NEXT(e
);
195 if ((void *)next
>= end
)
196 return -EFSCORRUPTED
;
200 while (!IS_LAST_ENTRY(entry
)) {
201 if (entry
->e_value_size
!= 0 &&
202 (value_start
+ le16_to_cpu(entry
->e_value_offs
) <
203 (void *)e
+ sizeof(__u32
) ||
204 value_start
+ le16_to_cpu(entry
->e_value_offs
) +
205 le32_to_cpu(entry
->e_value_size
) > end
))
206 return -EFSCORRUPTED
;
207 entry
= EXT4_XATTR_NEXT(entry
);
214 ext4_xattr_check_block(struct inode
*inode
, struct buffer_head
*bh
)
218 if (buffer_verified(bh
))
221 if (BHDR(bh
)->h_magic
!= cpu_to_le32(EXT4_XATTR_MAGIC
) ||
222 BHDR(bh
)->h_blocks
!= cpu_to_le32(1))
223 return -EFSCORRUPTED
;
224 if (!ext4_xattr_block_csum_verify(inode
, bh
->b_blocknr
, BHDR(bh
)))
226 error
= ext4_xattr_check_names(BFIRST(bh
), bh
->b_data
+ bh
->b_size
,
229 set_buffer_verified(bh
);
234 __xattr_check_inode(struct inode
*inode
, struct ext4_xattr_ibody_header
*header
,
235 void *end
, const char *function
, unsigned int line
)
237 struct ext4_xattr_entry
*entry
= IFIRST(header
);
238 int error
= -EFSCORRUPTED
;
240 if (((void *) header
>= end
) ||
241 (header
->h_magic
!= le32_to_cpu(EXT4_XATTR_MAGIC
)))
243 error
= ext4_xattr_check_names(entry
, end
, entry
);
246 __ext4_error_inode(inode
, function
, line
, 0,
247 "corrupted in-inode xattr");
251 #define xattr_check_inode(inode, header, end) \
252 __xattr_check_inode((inode), (header), (end), __func__, __LINE__)
255 ext4_xattr_check_entry(struct ext4_xattr_entry
*entry
, size_t size
)
257 size_t value_size
= le32_to_cpu(entry
->e_value_size
);
259 if (entry
->e_value_block
!= 0 || value_size
> size
||
260 le16_to_cpu(entry
->e_value_offs
) + value_size
> size
)
261 return -EFSCORRUPTED
;
266 ext4_xattr_find_entry(struct ext4_xattr_entry
**pentry
, int name_index
,
267 const char *name
, size_t size
, int sorted
)
269 struct ext4_xattr_entry
*entry
;
275 name_len
= strlen(name
);
277 for (; !IS_LAST_ENTRY(entry
); entry
= EXT4_XATTR_NEXT(entry
)) {
278 cmp
= name_index
- entry
->e_name_index
;
280 cmp
= name_len
- entry
->e_name_len
;
282 cmp
= memcmp(name
, entry
->e_name
, name_len
);
283 if (cmp
<= 0 && (sorted
|| cmp
== 0))
287 if (!cmp
&& ext4_xattr_check_entry(entry
, size
))
288 return -EFSCORRUPTED
;
289 return cmp
? -ENODATA
: 0;
293 ext4_xattr_block_get(struct inode
*inode
, int name_index
, const char *name
,
294 void *buffer
, size_t buffer_size
)
296 struct buffer_head
*bh
= NULL
;
297 struct ext4_xattr_entry
*entry
;
300 struct mb_cache
*ext4_mb_cache
= EXT4_GET_MB_CACHE(inode
);
302 ea_idebug(inode
, "name=%d.%s, buffer=%p, buffer_size=%ld",
303 name_index
, name
, buffer
, (long)buffer_size
);
306 if (!EXT4_I(inode
)->i_file_acl
)
308 ea_idebug(inode
, "reading block %llu",
309 (unsigned long long)EXT4_I(inode
)->i_file_acl
);
310 bh
= sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
);
313 ea_bdebug(bh
, "b_count=%d, refcount=%d",
314 atomic_read(&(bh
->b_count
)), le32_to_cpu(BHDR(bh
)->h_refcount
));
315 if (ext4_xattr_check_block(inode
, bh
)) {
317 EXT4_ERROR_INODE(inode
, "bad block %llu",
318 EXT4_I(inode
)->i_file_acl
);
319 error
= -EFSCORRUPTED
;
322 ext4_xattr_cache_insert(ext4_mb_cache
, bh
);
324 error
= ext4_xattr_find_entry(&entry
, name_index
, name
, bh
->b_size
, 1);
325 if (error
== -EFSCORRUPTED
)
329 size
= le32_to_cpu(entry
->e_value_size
);
332 if (size
> buffer_size
)
334 memcpy(buffer
, bh
->b_data
+ le16_to_cpu(entry
->e_value_offs
),
345 ext4_xattr_ibody_get(struct inode
*inode
, int name_index
, const char *name
,
346 void *buffer
, size_t buffer_size
)
348 struct ext4_xattr_ibody_header
*header
;
349 struct ext4_xattr_entry
*entry
;
350 struct ext4_inode
*raw_inode
;
351 struct ext4_iloc iloc
;
356 if (!ext4_test_inode_state(inode
, EXT4_STATE_XATTR
))
358 error
= ext4_get_inode_loc(inode
, &iloc
);
361 raw_inode
= ext4_raw_inode(&iloc
);
362 header
= IHDR(inode
, raw_inode
);
363 entry
= IFIRST(header
);
364 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
365 error
= xattr_check_inode(inode
, header
, end
);
368 error
= ext4_xattr_find_entry(&entry
, name_index
, name
,
369 end
- (void *)entry
, 0);
372 size
= le32_to_cpu(entry
->e_value_size
);
375 if (size
> buffer_size
)
377 memcpy(buffer
, (void *)IFIRST(header
) +
378 le16_to_cpu(entry
->e_value_offs
), size
);
390 * Copy an extended attribute into the buffer
391 * provided, or compute the buffer size required.
392 * Buffer is NULL to compute the size of the buffer required.
394 * Returns a negative error number on failure, or the number of bytes
395 * used / required on success.
398 ext4_xattr_get(struct inode
*inode
, int name_index
, const char *name
,
399 void *buffer
, size_t buffer_size
)
403 if (strlen(name
) > 255)
406 down_read(&EXT4_I(inode
)->xattr_sem
);
407 error
= ext4_xattr_ibody_get(inode
, name_index
, name
, buffer
,
409 if (error
== -ENODATA
)
410 error
= ext4_xattr_block_get(inode
, name_index
, name
, buffer
,
412 up_read(&EXT4_I(inode
)->xattr_sem
);
417 ext4_xattr_list_entries(struct dentry
*dentry
, struct ext4_xattr_entry
*entry
,
418 char *buffer
, size_t buffer_size
)
420 size_t rest
= buffer_size
;
422 for (; !IS_LAST_ENTRY(entry
); entry
= EXT4_XATTR_NEXT(entry
)) {
423 const struct xattr_handler
*handler
=
424 ext4_xattr_handler(entry
->e_name_index
);
426 if (handler
&& (!handler
->list
|| handler
->list(dentry
))) {
427 const char *prefix
= handler
->prefix
?: handler
->name
;
428 size_t prefix_len
= strlen(prefix
);
429 size_t size
= prefix_len
+ entry
->e_name_len
+ 1;
434 memcpy(buffer
, prefix
, prefix_len
);
435 buffer
+= prefix_len
;
436 memcpy(buffer
, entry
->e_name
, entry
->e_name_len
);
437 buffer
+= entry
->e_name_len
;
443 return buffer_size
- rest
; /* total size */
447 ext4_xattr_block_list(struct dentry
*dentry
, char *buffer
, size_t buffer_size
)
449 struct inode
*inode
= d_inode(dentry
);
450 struct buffer_head
*bh
= NULL
;
452 struct mb_cache
*ext4_mb_cache
= EXT4_GET_MB_CACHE(inode
);
454 ea_idebug(inode
, "buffer=%p, buffer_size=%ld",
455 buffer
, (long)buffer_size
);
458 if (!EXT4_I(inode
)->i_file_acl
)
460 ea_idebug(inode
, "reading block %llu",
461 (unsigned long long)EXT4_I(inode
)->i_file_acl
);
462 bh
= sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
);
466 ea_bdebug(bh
, "b_count=%d, refcount=%d",
467 atomic_read(&(bh
->b_count
)), le32_to_cpu(BHDR(bh
)->h_refcount
));
468 if (ext4_xattr_check_block(inode
, bh
)) {
469 EXT4_ERROR_INODE(inode
, "bad block %llu",
470 EXT4_I(inode
)->i_file_acl
);
471 error
= -EFSCORRUPTED
;
474 ext4_xattr_cache_insert(ext4_mb_cache
, bh
);
475 error
= ext4_xattr_list_entries(dentry
, BFIRST(bh
), buffer
, buffer_size
);
484 ext4_xattr_ibody_list(struct dentry
*dentry
, char *buffer
, size_t buffer_size
)
486 struct inode
*inode
= d_inode(dentry
);
487 struct ext4_xattr_ibody_header
*header
;
488 struct ext4_inode
*raw_inode
;
489 struct ext4_iloc iloc
;
493 if (!ext4_test_inode_state(inode
, EXT4_STATE_XATTR
))
495 error
= ext4_get_inode_loc(inode
, &iloc
);
498 raw_inode
= ext4_raw_inode(&iloc
);
499 header
= IHDR(inode
, raw_inode
);
500 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
501 error
= xattr_check_inode(inode
, header
, end
);
504 error
= ext4_xattr_list_entries(dentry
, IFIRST(header
),
505 buffer
, buffer_size
);
515 * Copy a list of attribute names into the buffer
516 * provided, or compute the buffer size required.
517 * Buffer is NULL to compute the size of the buffer required.
519 * Returns a negative error number on failure, or the number of bytes
520 * used / required on success.
523 ext4_xattr_list(struct dentry
*dentry
, char *buffer
, size_t buffer_size
)
527 down_read(&EXT4_I(d_inode(dentry
))->xattr_sem
);
528 ret
= ret2
= ext4_xattr_ibody_list(dentry
, buffer
, buffer_size
);
535 ret
= ext4_xattr_block_list(dentry
, buffer
, buffer_size
);
540 up_read(&EXT4_I(d_inode(dentry
))->xattr_sem
);
545 * If the EXT4_FEATURE_COMPAT_EXT_ATTR feature of this file system is
548 static void ext4_xattr_update_super_block(handle_t
*handle
,
549 struct super_block
*sb
)
551 if (ext4_has_feature_xattr(sb
))
554 BUFFER_TRACE(EXT4_SB(sb
)->s_sbh
, "get_write_access");
555 if (ext4_journal_get_write_access(handle
, EXT4_SB(sb
)->s_sbh
) == 0) {
556 ext4_set_feature_xattr(sb
);
557 ext4_handle_dirty_super(handle
, sb
);
562 * Release the xattr block BH: If the reference count is > 1, decrement it;
563 * otherwise free the block.
566 ext4_xattr_release_block(handle_t
*handle
, struct inode
*inode
,
567 struct buffer_head
*bh
)
569 struct mb_cache
*ext4_mb_cache
= EXT4_GET_MB_CACHE(inode
);
573 BUFFER_TRACE(bh
, "get_write_access");
574 error
= ext4_journal_get_write_access(handle
, bh
);
579 hash
= le32_to_cpu(BHDR(bh
)->h_hash
);
580 ref
= le32_to_cpu(BHDR(bh
)->h_refcount
);
582 ea_bdebug(bh
, "refcount now=0; freeing");
584 * This must happen under buffer lock for
585 * ext4_xattr_block_set() to reliably detect freed block
587 mb_cache_entry_delete_block(ext4_mb_cache
, hash
, bh
->b_blocknr
);
590 ext4_free_blocks(handle
, inode
, bh
, 0, 1,
591 EXT4_FREE_BLOCKS_METADATA
|
592 EXT4_FREE_BLOCKS_FORGET
);
595 BHDR(bh
)->h_refcount
= cpu_to_le32(ref
);
596 if (ref
== EXT4_XATTR_REFCOUNT_MAX
- 1) {
597 struct mb_cache_entry
*ce
;
599 ce
= mb_cache_entry_get(ext4_mb_cache
, hash
,
603 mb_cache_entry_put(ext4_mb_cache
, ce
);
608 * Beware of this ugliness: Releasing of xattr block references
609 * from different inodes can race and so we have to protect
610 * from a race where someone else frees the block (and releases
611 * its journal_head) before we are done dirtying the buffer. In
612 * nojournal mode this race is harmless and we actually cannot
613 * call ext4_handle_dirty_xattr_block() with locked buffer as
614 * that function can call sync_dirty_buffer() so for that case
615 * we handle the dirtying after unlocking the buffer.
617 if (ext4_handle_valid(handle
))
618 error
= ext4_handle_dirty_xattr_block(handle
, inode
,
621 if (!ext4_handle_valid(handle
))
622 error
= ext4_handle_dirty_xattr_block(handle
, inode
,
625 ext4_handle_sync(handle
);
626 dquot_free_block(inode
, EXT4_C2B(EXT4_SB(inode
->i_sb
), 1));
627 ea_bdebug(bh
, "refcount now=%d; releasing",
628 le32_to_cpu(BHDR(bh
)->h_refcount
));
631 ext4_std_error(inode
->i_sb
, error
);
636 * Find the available free space for EAs. This also returns the total number of
637 * bytes used by EA entries.
639 static size_t ext4_xattr_free_space(struct ext4_xattr_entry
*last
,
640 size_t *min_offs
, void *base
, int *total
)
642 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
643 if (!last
->e_value_block
&& last
->e_value_size
) {
644 size_t offs
= le16_to_cpu(last
->e_value_offs
);
645 if (offs
< *min_offs
)
649 *total
+= EXT4_XATTR_LEN(last
->e_name_len
);
651 return (*min_offs
- ((void *)last
- base
) - sizeof(__u32
));
655 ext4_xattr_set_entry(struct ext4_xattr_info
*i
, struct ext4_xattr_search
*s
)
657 struct ext4_xattr_entry
*last
;
658 size_t free
, min_offs
= s
->end
- s
->base
, name_len
= strlen(i
->name
);
660 /* Compute min_offs and last. */
662 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
663 if (!last
->e_value_block
&& last
->e_value_size
) {
664 size_t offs
= le16_to_cpu(last
->e_value_offs
);
669 free
= min_offs
- ((void *)last
- s
->base
) - sizeof(__u32
);
671 if (!s
->here
->e_value_block
&& s
->here
->e_value_size
) {
672 size_t size
= le32_to_cpu(s
->here
->e_value_size
);
673 free
+= EXT4_XATTR_SIZE(size
);
675 free
+= EXT4_XATTR_LEN(name_len
);
678 if (free
< EXT4_XATTR_LEN(name_len
) +
679 EXT4_XATTR_SIZE(i
->value_len
))
683 if (i
->value
&& s
->not_found
) {
684 /* Insert the new name. */
685 size_t size
= EXT4_XATTR_LEN(name_len
);
686 size_t rest
= (void *)last
- (void *)s
->here
+ sizeof(__u32
);
687 memmove((void *)s
->here
+ size
, s
->here
, rest
);
688 memset(s
->here
, 0, size
);
689 s
->here
->e_name_index
= i
->name_index
;
690 s
->here
->e_name_len
= name_len
;
691 memcpy(s
->here
->e_name
, i
->name
, name_len
);
693 if (!s
->here
->e_value_block
&& s
->here
->e_value_size
) {
694 void *first_val
= s
->base
+ min_offs
;
695 size_t offs
= le16_to_cpu(s
->here
->e_value_offs
);
696 void *val
= s
->base
+ offs
;
697 size_t size
= EXT4_XATTR_SIZE(
698 le32_to_cpu(s
->here
->e_value_size
));
700 if (i
->value
&& size
== EXT4_XATTR_SIZE(i
->value_len
)) {
701 /* The old and the new value have the same
702 size. Just replace. */
703 s
->here
->e_value_size
=
704 cpu_to_le32(i
->value_len
);
705 if (i
->value
== EXT4_ZERO_XATTR_VALUE
) {
706 memset(val
, 0, size
);
708 /* Clear pad bytes first. */
709 memset(val
+ size
- EXT4_XATTR_PAD
, 0,
711 memcpy(val
, i
->value
, i
->value_len
);
716 /* Remove the old value. */
717 memmove(first_val
+ size
, first_val
, val
- first_val
);
718 memset(first_val
, 0, size
);
719 s
->here
->e_value_size
= 0;
720 s
->here
->e_value_offs
= 0;
723 /* Adjust all value offsets. */
725 while (!IS_LAST_ENTRY(last
)) {
726 size_t o
= le16_to_cpu(last
->e_value_offs
);
727 if (!last
->e_value_block
&&
728 last
->e_value_size
&& o
< offs
)
730 cpu_to_le16(o
+ size
);
731 last
= EXT4_XATTR_NEXT(last
);
735 /* Remove the old name. */
736 size_t size
= EXT4_XATTR_LEN(name_len
);
737 last
= ENTRY((void *)last
- size
);
738 memmove(s
->here
, (void *)s
->here
+ size
,
739 (void *)last
- (void *)s
->here
+ sizeof(__u32
));
740 memset(last
, 0, size
);
745 /* Insert the new value. */
746 s
->here
->e_value_size
= cpu_to_le32(i
->value_len
);
748 size_t size
= EXT4_XATTR_SIZE(i
->value_len
);
749 void *val
= s
->base
+ min_offs
- size
;
750 s
->here
->e_value_offs
= cpu_to_le16(min_offs
- size
);
751 if (i
->value
== EXT4_ZERO_XATTR_VALUE
) {
752 memset(val
, 0, size
);
754 /* Clear the pad bytes first. */
755 memset(val
+ size
- EXT4_XATTR_PAD
, 0,
757 memcpy(val
, i
->value
, i
->value_len
);
764 struct ext4_xattr_block_find
{
765 struct ext4_xattr_search s
;
766 struct buffer_head
*bh
;
770 ext4_xattr_block_find(struct inode
*inode
, struct ext4_xattr_info
*i
,
771 struct ext4_xattr_block_find
*bs
)
773 struct super_block
*sb
= inode
->i_sb
;
776 ea_idebug(inode
, "name=%d.%s, value=%p, value_len=%ld",
777 i
->name_index
, i
->name
, i
->value
, (long)i
->value_len
);
779 if (EXT4_I(inode
)->i_file_acl
) {
780 /* The inode already has an extended attribute block. */
781 bs
->bh
= sb_bread(sb
, EXT4_I(inode
)->i_file_acl
);
785 ea_bdebug(bs
->bh
, "b_count=%d, refcount=%d",
786 atomic_read(&(bs
->bh
->b_count
)),
787 le32_to_cpu(BHDR(bs
->bh
)->h_refcount
));
788 if (ext4_xattr_check_block(inode
, bs
->bh
)) {
789 EXT4_ERROR_INODE(inode
, "bad block %llu",
790 EXT4_I(inode
)->i_file_acl
);
791 error
= -EFSCORRUPTED
;
794 /* Find the named attribute. */
795 bs
->s
.base
= BHDR(bs
->bh
);
796 bs
->s
.first
= BFIRST(bs
->bh
);
797 bs
->s
.end
= bs
->bh
->b_data
+ bs
->bh
->b_size
;
798 bs
->s
.here
= bs
->s
.first
;
799 error
= ext4_xattr_find_entry(&bs
->s
.here
, i
->name_index
,
800 i
->name
, bs
->bh
->b_size
, 1);
801 if (error
&& error
!= -ENODATA
)
803 bs
->s
.not_found
= error
;
812 ext4_xattr_block_set(handle_t
*handle
, struct inode
*inode
,
813 struct ext4_xattr_info
*i
,
814 struct ext4_xattr_block_find
*bs
)
816 struct super_block
*sb
= inode
->i_sb
;
817 struct buffer_head
*new_bh
= NULL
;
818 struct ext4_xattr_search
*s
= &bs
->s
;
819 struct mb_cache_entry
*ce
= NULL
;
821 struct mb_cache
*ext4_mb_cache
= EXT4_GET_MB_CACHE(inode
);
823 #define header(x) ((struct ext4_xattr_header *)(x))
825 if (i
->value
&& i
->value_len
> sb
->s_blocksize
)
828 BUFFER_TRACE(bs
->bh
, "get_write_access");
829 error
= ext4_journal_get_write_access(handle
, bs
->bh
);
834 if (header(s
->base
)->h_refcount
== cpu_to_le32(1)) {
835 __u32 hash
= le32_to_cpu(BHDR(bs
->bh
)->h_hash
);
838 * This must happen under buffer lock for
839 * ext4_xattr_block_set() to reliably detect modified
842 mb_cache_entry_delete_block(ext4_mb_cache
, hash
,
844 ea_bdebug(bs
->bh
, "modifying in-place");
845 error
= ext4_xattr_set_entry(i
, s
);
847 if (!IS_LAST_ENTRY(s
->first
))
848 ext4_xattr_rehash(header(s
->base
),
850 ext4_xattr_cache_insert(ext4_mb_cache
,
853 unlock_buffer(bs
->bh
);
854 if (error
== -EFSCORRUPTED
)
857 error
= ext4_handle_dirty_xattr_block(handle
,
864 int offset
= (char *)s
->here
- bs
->bh
->b_data
;
866 unlock_buffer(bs
->bh
);
867 ea_bdebug(bs
->bh
, "cloning");
868 s
->base
= kmalloc(bs
->bh
->b_size
, GFP_NOFS
);
872 memcpy(s
->base
, BHDR(bs
->bh
), bs
->bh
->b_size
);
873 s
->first
= ENTRY(header(s
->base
)+1);
874 header(s
->base
)->h_refcount
= cpu_to_le32(1);
875 s
->here
= ENTRY(s
->base
+ offset
);
876 s
->end
= s
->base
+ bs
->bh
->b_size
;
879 /* Allocate a buffer where we construct the new block. */
880 s
->base
= kzalloc(sb
->s_blocksize
, GFP_NOFS
);
881 /* assert(header == s->base) */
885 header(s
->base
)->h_magic
= cpu_to_le32(EXT4_XATTR_MAGIC
);
886 header(s
->base
)->h_blocks
= cpu_to_le32(1);
887 header(s
->base
)->h_refcount
= cpu_to_le32(1);
888 s
->first
= ENTRY(header(s
->base
)+1);
889 s
->here
= ENTRY(header(s
->base
)+1);
890 s
->end
= s
->base
+ sb
->s_blocksize
;
893 error
= ext4_xattr_set_entry(i
, s
);
894 if (error
== -EFSCORRUPTED
)
898 if (!IS_LAST_ENTRY(s
->first
))
899 ext4_xattr_rehash(header(s
->base
), s
->here
);
902 if (!IS_LAST_ENTRY(s
->first
)) {
903 new_bh
= ext4_xattr_cache_find(inode
, header(s
->base
), &ce
);
905 /* We found an identical block in the cache. */
906 if (new_bh
== bs
->bh
)
907 ea_bdebug(new_bh
, "keeping");
911 /* The old block is released after updating
913 error
= dquot_alloc_block(inode
,
914 EXT4_C2B(EXT4_SB(sb
), 1));
917 BUFFER_TRACE(new_bh
, "get_write_access");
918 error
= ext4_journal_get_write_access(handle
,
924 * We have to be careful about races with
925 * freeing, rehashing or adding references to
926 * xattr block. Once we hold buffer lock xattr
927 * block's state is stable so we can check
928 * whether the block got freed / rehashed or
929 * not. Since we unhash mbcache entry under
930 * buffer lock when freeing / rehashing xattr
931 * block, checking whether entry is still
932 * hashed is reliable. Same rules hold for
933 * e_reusable handling.
935 if (hlist_bl_unhashed(&ce
->e_hash_list
) ||
938 * Undo everything and check mbcache
941 unlock_buffer(new_bh
);
942 dquot_free_block(inode
,
943 EXT4_C2B(EXT4_SB(sb
),
946 mb_cache_entry_put(ext4_mb_cache
, ce
);
951 ref
= le32_to_cpu(BHDR(new_bh
)->h_refcount
) + 1;
952 BHDR(new_bh
)->h_refcount
= cpu_to_le32(ref
);
953 if (ref
>= EXT4_XATTR_REFCOUNT_MAX
)
955 ea_bdebug(new_bh
, "reusing; refcount now=%d",
957 unlock_buffer(new_bh
);
958 error
= ext4_handle_dirty_xattr_block(handle
,
964 mb_cache_entry_touch(ext4_mb_cache
, ce
);
965 mb_cache_entry_put(ext4_mb_cache
, ce
);
967 } else if (bs
->bh
&& s
->base
== bs
->bh
->b_data
) {
968 /* We were modifying this block in-place. */
969 ea_bdebug(bs
->bh
, "keeping this block");
973 /* We need to allocate a new block */
974 ext4_fsblk_t goal
, block
;
976 goal
= ext4_group_first_block_no(sb
,
977 EXT4_I(inode
)->i_block_group
);
979 /* non-extent files can't have physical blocks past 2^32 */
980 if (!(ext4_test_inode_flag(inode
, EXT4_INODE_EXTENTS
)))
981 goal
= goal
& EXT4_MAX_BLOCK_FILE_PHYS
;
983 block
= ext4_new_meta_blocks(handle
, inode
, goal
, 0,
988 if (!(ext4_test_inode_flag(inode
, EXT4_INODE_EXTENTS
)))
989 BUG_ON(block
> EXT4_MAX_BLOCK_FILE_PHYS
);
991 ea_idebug(inode
, "creating block %llu",
992 (unsigned long long)block
);
994 new_bh
= sb_getblk(sb
, block
);
995 if (unlikely(!new_bh
)) {
998 ext4_free_blocks(handle
, inode
, NULL
, block
, 1,
999 EXT4_FREE_BLOCKS_METADATA
);
1002 lock_buffer(new_bh
);
1003 error
= ext4_journal_get_create_access(handle
, new_bh
);
1005 unlock_buffer(new_bh
);
1009 memcpy(new_bh
->b_data
, s
->base
, new_bh
->b_size
);
1010 set_buffer_uptodate(new_bh
);
1011 unlock_buffer(new_bh
);
1012 ext4_xattr_cache_insert(ext4_mb_cache
, new_bh
);
1013 error
= ext4_handle_dirty_xattr_block(handle
,
1020 /* Update the inode. */
1021 EXT4_I(inode
)->i_file_acl
= new_bh
? new_bh
->b_blocknr
: 0;
1023 /* Drop the previous xattr block. */
1024 if (bs
->bh
&& bs
->bh
!= new_bh
)
1025 ext4_xattr_release_block(handle
, inode
, bs
->bh
);
1030 mb_cache_entry_put(ext4_mb_cache
, ce
);
1032 if (!(bs
->bh
&& s
->base
== bs
->bh
->b_data
))
1038 dquot_free_block(inode
, EXT4_C2B(EXT4_SB(sb
), 1));
1042 EXT4_ERROR_INODE(inode
, "bad block %llu",
1043 EXT4_I(inode
)->i_file_acl
);
1049 int ext4_xattr_ibody_find(struct inode
*inode
, struct ext4_xattr_info
*i
,
1050 struct ext4_xattr_ibody_find
*is
)
1052 struct ext4_xattr_ibody_header
*header
;
1053 struct ext4_inode
*raw_inode
;
1056 if (EXT4_I(inode
)->i_extra_isize
== 0)
1058 raw_inode
= ext4_raw_inode(&is
->iloc
);
1059 header
= IHDR(inode
, raw_inode
);
1060 is
->s
.base
= is
->s
.first
= IFIRST(header
);
1061 is
->s
.here
= is
->s
.first
;
1062 is
->s
.end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
1063 if (ext4_test_inode_state(inode
, EXT4_STATE_XATTR
)) {
1064 error
= xattr_check_inode(inode
, header
, is
->s
.end
);
1067 /* Find the named attribute. */
1068 error
= ext4_xattr_find_entry(&is
->s
.here
, i
->name_index
,
1069 i
->name
, is
->s
.end
-
1070 (void *)is
->s
.base
, 0);
1071 if (error
&& error
!= -ENODATA
)
1073 is
->s
.not_found
= error
;
1078 int ext4_xattr_ibody_inline_set(handle_t
*handle
, struct inode
*inode
,
1079 struct ext4_xattr_info
*i
,
1080 struct ext4_xattr_ibody_find
*is
)
1082 struct ext4_xattr_ibody_header
*header
;
1083 struct ext4_xattr_search
*s
= &is
->s
;
1086 if (EXT4_I(inode
)->i_extra_isize
== 0)
1088 error
= ext4_xattr_set_entry(i
, s
);
1090 if (error
== -ENOSPC
&&
1091 ext4_has_inline_data(inode
)) {
1092 error
= ext4_try_to_evict_inline_data(handle
, inode
,
1093 EXT4_XATTR_LEN(strlen(i
->name
) +
1094 EXT4_XATTR_SIZE(i
->value_len
)));
1097 error
= ext4_xattr_ibody_find(inode
, i
, is
);
1100 error
= ext4_xattr_set_entry(i
, s
);
1105 header
= IHDR(inode
, ext4_raw_inode(&is
->iloc
));
1106 if (!IS_LAST_ENTRY(s
->first
)) {
1107 header
->h_magic
= cpu_to_le32(EXT4_XATTR_MAGIC
);
1108 ext4_set_inode_state(inode
, EXT4_STATE_XATTR
);
1110 header
->h_magic
= cpu_to_le32(0);
1111 ext4_clear_inode_state(inode
, EXT4_STATE_XATTR
);
1116 static int ext4_xattr_ibody_set(handle_t
*handle
, struct inode
*inode
,
1117 struct ext4_xattr_info
*i
,
1118 struct ext4_xattr_ibody_find
*is
)
1120 struct ext4_xattr_ibody_header
*header
;
1121 struct ext4_xattr_search
*s
= &is
->s
;
1124 if (EXT4_I(inode
)->i_extra_isize
== 0)
1126 error
= ext4_xattr_set_entry(i
, s
);
1129 header
= IHDR(inode
, ext4_raw_inode(&is
->iloc
));
1130 if (!IS_LAST_ENTRY(s
->first
)) {
1131 header
->h_magic
= cpu_to_le32(EXT4_XATTR_MAGIC
);
1132 ext4_set_inode_state(inode
, EXT4_STATE_XATTR
);
1134 header
->h_magic
= cpu_to_le32(0);
1135 ext4_clear_inode_state(inode
, EXT4_STATE_XATTR
);
1140 static int ext4_xattr_value_same(struct ext4_xattr_search
*s
,
1141 struct ext4_xattr_info
*i
)
1145 if (le32_to_cpu(s
->here
->e_value_size
) != i
->value_len
)
1147 value
= ((void *)s
->base
) + le16_to_cpu(s
->here
->e_value_offs
);
1148 return !memcmp(value
, i
->value
, i
->value_len
);
1152 * ext4_xattr_set_handle()
1154 * Create, replace or remove an extended attribute for this inode. Value
1155 * is NULL to remove an existing extended attribute, and non-NULL to
1156 * either replace an existing extended attribute, or create a new extended
1157 * attribute. The flags XATTR_REPLACE and XATTR_CREATE
1158 * specify that an extended attribute must exist and must not exist
1159 * previous to the call, respectively.
1161 * Returns 0, or a negative error number on failure.
1164 ext4_xattr_set_handle(handle_t
*handle
, struct inode
*inode
, int name_index
,
1165 const char *name
, const void *value
, size_t value_len
,
1168 struct ext4_xattr_info i
= {
1169 .name_index
= name_index
,
1172 .value_len
= value_len
,
1175 struct ext4_xattr_ibody_find is
= {
1176 .s
= { .not_found
= -ENODATA
, },
1178 struct ext4_xattr_block_find bs
= {
1179 .s
= { .not_found
= -ENODATA
, },
1181 unsigned long no_expand
;
1186 if (strlen(name
) > 255)
1188 down_write(&EXT4_I(inode
)->xattr_sem
);
1189 no_expand
= ext4_test_inode_state(inode
, EXT4_STATE_NO_EXPAND
);
1190 ext4_set_inode_state(inode
, EXT4_STATE_NO_EXPAND
);
1192 error
= ext4_reserve_inode_write(handle
, inode
, &is
.iloc
);
1196 if (ext4_test_inode_state(inode
, EXT4_STATE_NEW
)) {
1197 struct ext4_inode
*raw_inode
= ext4_raw_inode(&is
.iloc
);
1198 memset(raw_inode
, 0, EXT4_SB(inode
->i_sb
)->s_inode_size
);
1199 ext4_clear_inode_state(inode
, EXT4_STATE_NEW
);
1202 error
= ext4_xattr_ibody_find(inode
, &i
, &is
);
1206 error
= ext4_xattr_block_find(inode
, &i
, &bs
);
1209 if (is
.s
.not_found
&& bs
.s
.not_found
) {
1211 if (flags
& XATTR_REPLACE
)
1218 if (flags
& XATTR_CREATE
)
1222 if (!is
.s
.not_found
)
1223 error
= ext4_xattr_ibody_set(handle
, inode
, &i
, &is
);
1224 else if (!bs
.s
.not_found
)
1225 error
= ext4_xattr_block_set(handle
, inode
, &i
, &bs
);
1228 /* Xattr value did not change? Save us some work and bail out */
1229 if (!is
.s
.not_found
&& ext4_xattr_value_same(&is
.s
, &i
))
1231 if (!bs
.s
.not_found
&& ext4_xattr_value_same(&bs
.s
, &i
))
1234 error
= ext4_xattr_ibody_set(handle
, inode
, &i
, &is
);
1235 if (!error
&& !bs
.s
.not_found
) {
1237 error
= ext4_xattr_block_set(handle
, inode
, &i
, &bs
);
1238 } else if (error
== -ENOSPC
) {
1239 if (EXT4_I(inode
)->i_file_acl
&& !bs
.s
.base
) {
1240 error
= ext4_xattr_block_find(inode
, &i
, &bs
);
1244 error
= ext4_xattr_block_set(handle
, inode
, &i
, &bs
);
1247 if (!is
.s
.not_found
) {
1249 error
= ext4_xattr_ibody_set(handle
, inode
, &i
,
1255 ext4_xattr_update_super_block(handle
, inode
->i_sb
);
1256 inode
->i_ctime
= ext4_current_time(inode
);
1258 ext4_clear_inode_state(inode
, EXT4_STATE_NO_EXPAND
);
1259 error
= ext4_mark_iloc_dirty(handle
, inode
, &is
.iloc
);
1261 * The bh is consumed by ext4_mark_iloc_dirty, even with
1266 ext4_handle_sync(handle
);
1273 ext4_clear_inode_state(inode
, EXT4_STATE_NO_EXPAND
);
1274 up_write(&EXT4_I(inode
)->xattr_sem
);
1281 * Like ext4_xattr_set_handle, but start from an inode. This extended
1282 * attribute modification is a filesystem transaction by itself.
1284 * Returns 0, or a negative error number on failure.
/*
 * ext4_xattr_set() - set an extended attribute inside its own journal
 * transaction.
 *
 * @inode:      inode whose attribute is modified
 * @name_index: attribute namespace index, passed through unchanged
 * @name:       attribute name, passed through unchanged
 * @value:      new value buffer, passed through unchanged
 * @value_len:  length of @value, passed through unchanged
 * @flags:      passed through unchanged to ext4_xattr_set_handle()
 *
 * The transaction is sized with ext4_jbd2_credits_xattr(), started with
 * ext4_journal_start() using handle type EXT4_HT_XATTR, and stopped with
 * ext4_journal_stop() after ext4_xattr_set_handle() has done the work.
 *
 * NOTE(review): this listing omits several original lines (the return
 * statements, the body of the -ENOSPC branch and the closing braces), so
 * the exact return value and retry flow cannot be confirmed from here.
 */
1287 ext4_xattr_set(struct inode
*inode
, int name_index
, const char *name
,
1288 const void *value
, size_t value_len
, int flags
)
1291 int error
, retries
= 0;
1292 int credits
= ext4_jbd2_credits_xattr(inode
);
1295 handle
= ext4_journal_start(inode
, EXT4_HT_XATTR
, credits
);
/* A failed journal start is reported as an error pointer; turn it into an errno. */
1296 if (IS_ERR(handle
)) {
1297 error
= PTR_ERR(handle
);
1301 error
= ext4_xattr_set_handle(handle
, inode
, name_index
, name
,
1302 value
, value_len
, flags
);
/* The result of stopping the handle is kept in a separate variable (error2). */
1303 error2
= ext4_journal_stop(handle
);
/*
 * On -ENOSPC, ext4_should_retry_alloc() is consulted with the running
 * retries counter; presumably a true result restarts the operation, but
 * the branch body is not visible in this listing.
 */
1304 if (error
== -ENOSPC
&&
1305 ext4_should_retry_alloc(inode
->i_sb
, &retries
))
1315 * Shift the EA entries in the inode to create space for the increased
 * i_extra_isize.
/*
 * ext4_xattr_shift_entries() - fix up value offsets, then move the entry
 * table.
 *
 * @entry:            first entry of the table to walk
 * @value_offs_shift: presumably the amount added to each e_value_offs; the
 *                    line that applies it is omitted from this listing
 * @to:               destination address for the memmove()
 * @from:             source address for the memmove()
 * @n:                number of bytes moved
 * @blocksize:        presumably the upper bound checked by the BUG_ON();
 *                    the comparison operand is not visible here
 *
 * Walks the entries from @entry until IS_LAST_ENTRY(). For each entry with
 * e_value_block == 0 and a non-zero e_value_size, a new offset is derived
 * from e_value_offs and written back in little-endian form. Afterwards @n
 * bytes are moved from @from to @to with memmove().
 */
1318 static void ext4_xattr_shift_entries(struct ext4_xattr_entry
*entry
,
1319 int value_offs_shift
, void *to
,
1320 void *from
, size_t n
, int blocksize
)
1322 struct ext4_xattr_entry
*last
= entry
;
1325 /* Adjust the value offsets of the entries */
1326 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
/* Only entries that carry an in-place, non-empty value have an offset to fix. */
1327 if (!last
->e_value_block
&& last
->e_value_size
) {
1328 new_offs
= le16_to_cpu(last
->e_value_offs
) +
1330 BUG_ON(new_offs
+ le32_to_cpu(last
->e_value_size
)
1332 last
->e_value_offs
= cpu_to_le16(new_offs
);
1335 /* Shift the entries by n bytes */
1336 memmove(to
, from
, n
);
1340 * Expand an inode by new_extra_isize bytes when EAs are present.
1341 * Returns 0 on success or negative error number on failure.
/*
 * ext4_expand_extra_isize_ea() - grow i_extra_isize of an inode that
 * already holds in-inode extended attributes.
 *
 * @inode:           inode being expanded
 * @new_extra_isize: requested i_extra_isize
 * @raw_inode:       on-disk inode image that holds the in-inode EA area
 * @handle:          journal handle passed to the ibody/block set helpers
 *
 * Visible flow, all under EXT4_I(inode)->xattr_sem held for writing:
 *  1. If i_extra_isize is already >= @new_extra_isize the lock is dropped
 *     (presumably followed by an early return, which is not visible).
 *  2. The in-inode EA area is checked with xattr_check_inode() and its free
 *     space computed; if that suffices, the entries are shifted in place
 *     and i_extra_isize is set to @new_extra_isize.
 *  3. Otherwise, if the inode has an EA block (i_file_acl), the block is
 *     read and validated and its free space computed. When that is too
 *     small, the request is lowered once to the superblock's
 *     s_min_extra_isize.
 *  4. A loop then runs while new_extra_isize > 0. Each pass picks an
 *     in-inode entry, saves its name and value, removes it from the inode
 *     with ext4_xattr_ibody_set(), shifts the remaining entries, and adds
 *     the saved entry to the EA block with ext4_xattr_block_set().
 *
 * NOTE(review): this listing omits many original lines (gotos, labels,
 * returns, some declarations and assignments, closing braces). The two
 * trailing kfree()/brelse()/up_write() sequences look like a success exit
 * and an error-cleanup exit, but that cannot be confirmed from here.
 */
1343 int ext4_expand_extra_isize_ea(struct inode
*inode
, int new_extra_isize
,
1344 struct ext4_inode
*raw_inode
, handle_t
*handle
)
1346 struct ext4_xattr_ibody_header
*header
;
1347 struct ext4_xattr_entry
*entry
, *last
, *first
;
1348 struct buffer_head
*bh
= NULL
;
1349 struct ext4_xattr_ibody_find
*is
= NULL
;
1350 struct ext4_xattr_block_find
*bs
= NULL
;
1351 char *buffer
= NULL
, *b_entry_name
= NULL
;
1352 size_t min_offs
, free
;
1354 void *base
, *start
, *end
;
1355 int extra_isize
= 0, error
= 0, tried_min_extra_isize
= 0;
1356 int s_min_extra_isize
= le16_to_cpu(EXT4_SB(inode
->i_sb
)->s_es
->s_min_extra_isize
);
/* Everything below runs with the inode's xattr_sem held for writing. */
1358 down_write(&EXT4_I(inode
)->xattr_sem
);
/* Already large enough: drop the lock on this path. */
1360 if (EXT4_I(inode
)->i_extra_isize
>= new_extra_isize
) {
1361 up_write(&EXT4_I(inode
)->xattr_sem
);
1365 header
= IHDR(inode
, raw_inode
);
1366 entry
= IFIRST(header
);
1369 * Check if enough free space is available in the inode to shift the
1370 * entries ahead by new_extra_isize.
1373 base
= start
= entry
;
1374 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
1375 min_offs
= end
- base
;
1377 total_ino
= sizeof(struct ext4_xattr_ibody_header
);
1379 error
= xattr_check_inode(inode
, header
, end
);
1383 free
= ext4_xattr_free_space(last
, &min_offs
, base
, &total_ino
);
/* Enough slack inside the inode: shift the entries and record the new size. */
1384 if (free
>= new_extra_isize
) {
1385 entry
= IFIRST(header
);
1386 ext4_xattr_shift_entries(entry
, EXT4_I(inode
)->i_extra_isize
1387 - new_extra_isize
, (void *)raw_inode
+
1388 EXT4_GOOD_OLD_INODE_SIZE
+ new_extra_isize
,
1389 (void *)header
, total_ino
,
1390 inode
->i_sb
->s_blocksize
);
1391 EXT4_I(inode
)->i_extra_isize
= new_extra_isize
;
1397 * Enough free space isn't available in the inode, check if
1398 * EA block can hold new_extra_isize bytes.
1400 if (EXT4_I(inode
)->i_file_acl
) {
1401 bh
= sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
);
/* A block that fails validation is reported and treated as corruption. */
1405 if (ext4_xattr_check_block(inode
, bh
)) {
1406 EXT4_ERROR_INODE(inode
, "bad block %llu",
1407 EXT4_I(inode
)->i_file_acl
);
1408 error
= -EFSCORRUPTED
;
1413 end
= bh
->b_data
+ bh
->b_size
;
1414 min_offs
= end
- base
;
1415 free
= ext4_xattr_free_space(first
, &min_offs
, base
, NULL
);
/* EA block too full: fall back, at most once, to s_min_extra_isize. */
1416 if (free
< new_extra_isize
) {
1417 if (!tried_min_extra_isize
&& s_min_extra_isize
) {
1418 tried_min_extra_isize
++;
1419 new_extra_isize
= s_min_extra_isize
;
/* Presumably the no-EA-block case: a whole block counts as free - TODO confirm. */
1427 free
= inode
->i_sb
->s_blocksize
;
/* Keep moving entries out of the inode until the requested space is freed. */
1430 while (new_extra_isize
> 0) {
1431 size_t offs
, size
, entry_size
;
1432 struct ext4_xattr_entry
*small_entry
= NULL
;
1433 struct ext4_xattr_info i
= {
1437 unsigned int total_size
; /* EA entry size + value size */
1438 unsigned int shift_bytes
; /* No. of bytes to shift EAs by? */
1439 unsigned int min_total_size
= ~0U;
1441 is
= kzalloc(sizeof(struct ext4_xattr_ibody_find
), GFP_NOFS
);
1442 bs
= kzalloc(sizeof(struct ext4_xattr_block_find
), GFP_NOFS
);
1448 is
->s
.not_found
= -ENODATA
;
1449 bs
->s
.not_found
= -ENODATA
;
1453 last
= IFIRST(header
);
1454 /* Find the entry best suited to be pushed into EA block */
1456 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
1458 EXT4_XATTR_SIZE(le32_to_cpu(last
->e_value_size
)) +
1459 EXT4_XATTR_LEN(last
->e_name_len
);
/* Candidates must fit in the free space and beat the best size seen so far. */
1460 if (total_size
<= free
&& total_size
< min_total_size
) {
1461 if (total_size
< new_extra_isize
) {
1465 min_total_size
= total_size
;
/* No preferred candidate: use small_entry, or retry once with s_min_extra_isize. */
1470 if (entry
== NULL
) {
1472 entry
= small_entry
;
1474 if (!tried_min_extra_isize
&&
1475 s_min_extra_isize
) {
1476 tried_min_extra_isize
++;
1477 new_extra_isize
= s_min_extra_isize
;
1478 kfree(is
); is
= NULL
;
1479 kfree(bs
); bs
= NULL
;
1487 offs
= le16_to_cpu(entry
->e_value_offs
);
1488 size
= le32_to_cpu(entry
->e_value_size
);
1489 entry_size
= EXT4_XATTR_LEN(entry
->e_name_len
);
/*
 * NOTE(review): the next statement ends with ',' rather than ';', so it is
 * joined to the following assignment by the comma operator. The result is
 * the same, but ';' was probably intended.
 */
1490 i
.name_index
= entry
->e_name_index
,
1491 buffer
= kmalloc(EXT4_XATTR_SIZE(size
), GFP_NOFS
);
1492 b_entry_name
= kmalloc(entry
->e_name_len
+ 1, GFP_NOFS
);
1493 if (!buffer
|| !b_entry_name
) {
1497 /* Save the entry name and the entry value */
1498 memcpy(buffer
, (void *)IFIRST(header
) + offs
,
1499 EXT4_XATTR_SIZE(size
));
1500 memcpy(b_entry_name
, entry
->e_name
, entry
->e_name_len
);
1501 b_entry_name
[entry
->e_name_len
] = '\0';
1502 i
.name
= b_entry_name
;
1504 error
= ext4_get_inode_loc(inode
, &is
->iloc
);
1508 error
= ext4_xattr_ibody_find(inode
, &i
, is
);
1512 /* Remove the chosen entry from the inode */
1513 error
= ext4_xattr_ibody_set(handle
, inode
, &i
, is
);
1517 entry
= IFIRST(header
);
1518 if (entry_size
+ EXT4_XATTR_SIZE(size
) >= new_extra_isize
)
1519 shift_bytes
= new_extra_isize
;
/*
 * NOTE(review): the comparison above uses the padded EXT4_XATTR_SIZE(size)
 * while the assignment below uses the raw size - confirm this is intended.
 */
1521 shift_bytes
= entry_size
+ size
;
1522 /* Adjust the offsets and shift the remaining entries ahead */
1523 ext4_xattr_shift_entries(entry
, EXT4_I(inode
)->i_extra_isize
-
1524 shift_bytes
, (void *)raw_inode
+
1525 EXT4_GOOD_OLD_INODE_SIZE
+ extra_isize
+ shift_bytes
,
1526 (void *)header
, total_ino
- entry_size
,
1527 inode
->i_sb
->s_blocksize
);
/* Account for the space gained in this pass. */
1529 extra_isize
+= shift_bytes
;
1530 new_extra_isize
-= shift_bytes
;
1531 EXT4_I(inode
)->i_extra_isize
= extra_isize
;
1533 i
.name
= b_entry_name
;
1536 error
= ext4_xattr_block_find(inode
, &i
, bs
);
1540 /* Add entry which was removed from the inode into the block */
1541 error
= ext4_xattr_block_set(handle
, inode
, &i
, bs
);
1544 kfree(b_entry_name
);
1546 b_entry_name
= NULL
;
1548 brelse(is
->iloc
.bh
);
1553 up_write(&EXT4_I(inode
)->xattr_sem
);
1557 kfree(b_entry_name
);
1560 brelse(is
->iloc
.bh
);
1564 up_write(&EXT4_I(inode
)->xattr_sem
);
1571 * ext4_xattr_delete_inode()
1573 * Free extended attribute resources associated with this inode. This
1574 * is called immediately before an inode is freed. We have exclusive
1575 * access to the inode.
/*
 * ext4_xattr_delete_inode() - release the EA block attached to an inode.
 *
 * @handle: journal handle passed to ext4_xattr_release_block()
 * @inode:  inode whose EA block (i_file_acl) is released
 *
 * When i_file_acl is set, the block is read with sb_bread(). A read
 * failure is reported as "block %llu read error". A header whose h_magic
 * is not EXT4_XATTR_MAGIC or whose h_blocks is not 1 is reported as
 * "bad block %llu". The block is then handed to ext4_xattr_release_block()
 * and i_file_acl is cleared.
 *
 * NOTE(review): the conditions and jumps that separate the error paths
 * from the release path are on lines omitted from this listing.
 */
1578 ext4_xattr_delete_inode(handle_t
*handle
, struct inode
*inode
)
1580 struct buffer_head
*bh
= NULL
;
/* No EA block attached to this inode. */
1582 if (!EXT4_I(inode
)->i_file_acl
)
1584 bh
= sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
);
1586 EXT4_ERROR_INODE(inode
, "block %llu read error",
1587 EXT4_I(inode
)->i_file_acl
);
/* Sanity-check the block header before touching its reference count. */
1590 if (BHDR(bh
)->h_magic
!= cpu_to_le32(EXT4_XATTR_MAGIC
) ||
1591 BHDR(bh
)->h_blocks
!= cpu_to_le32(1)) {
1592 EXT4_ERROR_INODE(inode
, "bad block %llu",
1593 EXT4_I(inode
)->i_file_acl
);
1596 ext4_xattr_release_block(handle
, inode
, bh
);
1597 EXT4_I(inode
)->i_file_acl
= 0;
1604 * ext4_xattr_cache_insert()
1606 * Create a new entry in the extended attribute cache, and insert
1607 * it unless such an entry is already in the cache.
1609 * Returns 0, or a negative error number on failure.
/*
 * ext4_xattr_cache_insert() - register an EA block in the mbcache.
 *
 * @ext4_mb_cache: cache the entry is created in
 * @bh:            buffer holding the EA block; its header supplies the hash
 *                 and reference count, and its b_blocknr the block number
 *
 * The entry is created with mb_cache_entry_create() using GFP_NOFS, keyed
 * by the header's h_hash. The "reusable" argument is true while h_refcount
 * is below EXT4_XATTR_REFCOUNT_MAX. An -EBUSY result is only logged as
 * "already in cache".
 *
 * NOTE(review): the return type and any return statement are on lines
 * omitted from this listing.
 */
1612 ext4_xattr_cache_insert(struct mb_cache
*ext4_mb_cache
, struct buffer_head
*bh
)
1614 struct ext4_xattr_header
*header
= BHDR(bh
);
1615 __u32 hash
= le32_to_cpu(header
->h_hash
);
/* True while the block's reference count is below the maximum. */
1616 int reusable
= le32_to_cpu(header
->h_refcount
) <
1617 EXT4_XATTR_REFCOUNT_MAX
;
1620 error
= mb_cache_entry_create(ext4_mb_cache
, GFP_NOFS
, hash
,
1621 bh
->b_blocknr
, reusable
);
1623 if (error
== -EBUSY
)
1624 ea_bdebug(bh
, "already in cache");
1626 ea_bdebug(bh
, "inserting [%x]", (int)hash
);
1632 * Compare two extended attribute blocks for equality.
1634 * Returns 0 if the blocks are equal, 1 if they differ, and
1635 * a negative error number on errors.
/*
 * ext4_xattr_cmp() - compare two EA blocks entry by entry.
 *
 * @header1: header of the first block
 * @header2: header of the second block
 *
 * Both entry tables start right after their header and are walked in
 * lock step. For each pair, e_hash, e_name_index, e_name_len, e_value_size
 * and the name bytes are compared. An entry with a non-zero e_value_block
 * on either side yields -EFSCORRUPTED. Finally the value bytes, located at
 * e_value_offs from the respective header, are compared over e_value_size
 * bytes. The checks before and after the loop cover tables of different
 * lengths.
 *
 * NOTE(review): apart from -EFSCORRUPTED, the return statements are on
 * lines omitted from this listing.
 */
1638 ext4_xattr_cmp(struct ext4_xattr_header
*header1
,
1639 struct ext4_xattr_header
*header2
)
1641 struct ext4_xattr_entry
*entry1
, *entry2
;
1643 entry1
= ENTRY(header1
+1);
1644 entry2
= ENTRY(header2
+1);
1645 while (!IS_LAST_ENTRY(entry1
)) {
/* Second table ended before the first one. */
1646 if (IS_LAST_ENTRY(entry2
))
/* Compare the entry descriptors and names. */
1648 if (entry1
->e_hash
!= entry2
->e_hash
||
1649 entry1
->e_name_index
!= entry2
->e_name_index
||
1650 entry1
->e_name_len
!= entry2
->e_name_len
||
1651 entry1
->e_value_size
!= entry2
->e_value_size
||
1652 memcmp(entry1
->e_name
, entry2
->e_name
, entry1
->e_name_len
))
1654 if (entry1
->e_value_block
!= 0 || entry2
->e_value_block
!= 0)
1655 return -EFSCORRUPTED
;
/* Compare the value bytes themselves. */
1656 if (memcmp((char *)header1
+ le16_to_cpu(entry1
->e_value_offs
),
1657 (char *)header2
+ le16_to_cpu(entry2
->e_value_offs
),
1658 le32_to_cpu(entry1
->e_value_size
)))
1661 entry1
= EXT4_XATTR_NEXT(entry1
);
1662 entry2
= EXT4_XATTR_NEXT(entry2
);
/* First table ended; the second must end here too. */
1664 if (!IS_LAST_ENTRY(entry2
))
1670 * ext4_xattr_cache_find()
1672 * Find an identical extended attribute block.
1674 * Returns a pointer to the block found, or NULL if such a block was
1675 * not found or an error occurred.
/*
 * ext4_xattr_cache_find() - look up a cached EA block identical to @header.
 *
 * @inode:  inode used to reach the superblock and the mbcache
 * @header: header of the EA block to match
 * @pce:    presumably receives the matching cache entry; the store is on a
 *          line omitted from this listing
 *
 * A header with h_hash == 0 is never shared, so NULL is returned at once.
 * Otherwise the cache entries with the same hash are visited through
 * mb_cache_entry_find_first()/mb_cache_entry_find_next(). Each candidate
 * block is read with sb_bread() and compared with ext4_xattr_cmp(). A read
 * failure is reported as "block %lu read error".
 *
 * NOTE(review): the loop statement, the body of the "blocks are equal"
 * branch and the final return are on lines omitted from this listing.
 */
1677 static struct buffer_head
*
1678 ext4_xattr_cache_find(struct inode
*inode
, struct ext4_xattr_header
*header
,
1679 struct mb_cache_entry
**pce
)
1681 __u32 hash
= le32_to_cpu(header
->h_hash
);
1682 struct mb_cache_entry
*ce
;
1683 struct mb_cache
*ext4_mb_cache
= EXT4_GET_MB_CACHE(inode
);
1685 if (!header
->h_hash
)
1686 return NULL
; /* never share */
1687 ea_idebug(inode
, "looking for cached blocks [%x]", (int)hash
);
1688 ce
= mb_cache_entry_find_first(ext4_mb_cache
, hash
);
1690 struct buffer_head
*bh
;
/* Read the candidate block named by the cache entry. */
1692 bh
= sb_bread(inode
->i_sb
, ce
->e_block
);
1694 EXT4_ERROR_INODE(inode
, "block %lu read error",
1695 (unsigned long) ce
->e_block
);
/* ext4_xattr_cmp() == 0 means the candidate has identical contents. */
1696 } else if (ext4_xattr_cmp(header
, BHDR(bh
)) == 0) {
/* Move on to the next cache entry with the same hash. */
1701 ce
= mb_cache_entry_find_next(ext4_mb_cache
, ce
);
/*
 * Rotation amounts used by ext4_xattr_hash_entry(): one for mixing in name
 * bytes, one for mixing in 32-bit value words. Both are #undef'd right
 * after the function.
 */
1706 #define NAME_HASH_SHIFT 5
1707 #define VALUE_HASH_SHIFT 16
1710 * ext4_xattr_hash_entry()
1712 * Compute the hash of an extended attribute.
/*
 * @header: block header; value offsets are taken relative to it
 * @entry:  entry whose e_hash field is recomputed and stored
 *
 * The hash is built by rotating the running value left by NAME_HASH_SHIFT
 * for each of the e_name_len name bytes. If the entry has an in-place,
 * non-empty value (e_value_block == 0 and e_value_size != 0), the running
 * value is then rotated left by VALUE_HASH_SHIFT and XORed with each
 * little-endian 32-bit word of the value. The word count is
 * (e_value_size + EXT4_XATTR_ROUND) >> EXT4_XATTR_PAD_BITS. The result is
 * stored in entry->e_hash in little-endian form.
 *
 * NOTE(review): the declarations of hash and n, and the operand XORed in
 * per name byte, are on lines omitted from this listing.
 */
1714 static inline void ext4_xattr_hash_entry(struct ext4_xattr_header
*header
,
1715 struct ext4_xattr_entry
*entry
)
1718 char *name
= entry
->e_name
;
/* Mix in the name, one step per byte. */
1721 for (n
= 0; n
< entry
->e_name_len
; n
++) {
1722 hash
= (hash
<< NAME_HASH_SHIFT
) ^
1723 (hash
>> (8*sizeof(hash
) - NAME_HASH_SHIFT
)) ^
/* Mix in the value only when it is stored in place and is non-empty. */
1727 if (entry
->e_value_block
== 0 && entry
->e_value_size
!= 0) {
1728 __le32
*value
= (__le32
*)((char *)header
+
1729 le16_to_cpu(entry
->e_value_offs
));
1730 for (n
= (le32_to_cpu(entry
->e_value_size
) +
1731 EXT4_XATTR_ROUND
) >> EXT4_XATTR_PAD_BITS
; n
; n
--) {
1732 hash
= (hash
<< VALUE_HASH_SHIFT
) ^
1733 (hash
>> (8*sizeof(hash
) - VALUE_HASH_SHIFT
)) ^
1734 le32_to_cpu(*value
++);
1737 entry
->e_hash
= cpu_to_le32(hash
);
1740 #undef NAME_HASH_SHIFT
1741 #undef VALUE_HASH_SHIFT
/* Rotation amount used when folding entry hashes into the block hash. */
1743 #define BLOCK_HASH_SHIFT 16
1746 * ext4_xattr_rehash()
1748 * Re-compute the extended attribute hash value after an entry has changed.
/*
 * @header: block header whose h_hash is recomputed and stored
 * @entry:  the changed entry; its own hash is refreshed first through
 *          ext4_xattr_hash_entry()
 *
 * All entries after the header are then walked. Each e_hash is folded
 * into the running block hash by rotating left by BLOCK_HASH_SHIFT and
 * XORing. An entry with e_hash == 0 marks the block as not shareable. The
 * result is stored in header->h_hash in little-endian form.
 *
 * NOTE(review): the declaration of hash and the statements inside the
 * e_hash == 0 branch are on lines omitted from this listing.
 */
1750 static void ext4_xattr_rehash(struct ext4_xattr_header
*header
,
1751 struct ext4_xattr_entry
*entry
)
1753 struct ext4_xattr_entry
*here
;
1756 ext4_xattr_hash_entry(header
, entry
);
1757 here
= ENTRY(header
+1);
1758 while (!IS_LAST_ENTRY(here
)) {
1759 if (!here
->e_hash
) {
1760 /* Block is not shared if an entry's hash value == 0 */
/* Fold this entry's hash into the block hash. */
1764 hash
= (hash
<< BLOCK_HASH_SHIFT
) ^
1765 (hash
>> (8*sizeof(hash
) - BLOCK_HASH_SHIFT
)) ^
1766 le32_to_cpu(here
->e_hash
);
1767 here
= EXT4_XATTR_NEXT(here
);
1769 header
->h_hash
= cpu_to_le32(hash
);
1772 #undef BLOCK_HASH_SHIFT
/* Value handed to mb_cache_create() below; presumably log2 of the bucket count - TODO confirm. */
1774 #define HASH_BUCKET_BITS 10
/*
 * ext4_xattr_create_cache() - create the mbcache used for sharing EA
 * blocks. Returns whatever mb_cache_create(HASH_BUCKET_BITS) returns.
 */
1777 ext4_xattr_create_cache(void)
1779 return mb_cache_create(HASH_BUCKET_BITS
);
/*
 * ext4_xattr_destroy_cache() - tear down a cache made by
 * ext4_xattr_create_cache().
 *
 * @cache: cache handed to mb_cache_destroy()
 *
 * NOTE(review): one original line between the signature and the call is
 * missing from this listing, so any guard on @cache cannot be confirmed.
 */
1782 void ext4_xattr_destroy_cache(struct mb_cache
*cache
)
1785 mb_cache_destroy(cache
);