// SPDX-License-Identifier: GPL-2.0
/*
 * linux/fs/ext4/xattr.c
 *
 * Copyright (C) 2001-2003 Andreas Gruenbacher, <agruen@suse.de>
 *
 * Fix by Harrison Xing <harrison@mountainviewdata.com>.
 * Ext4 code with a lot of help from Eric Jarman <ejarman@acm.org>.
 * Extended attributes for symlinks and special files added per
 *  suggestion of Luka Renko <luka.renko@hermes.si>.
 * xattr consolidation Copyright (c) 2004 James Morris <jmorris@redhat.com>,
 * ea-in-inode support by Alex Tomas <alex@clusterfs.com> aka bzzz
 *  and Andreas Gruenbacher <agruen@suse.de>.
 */
/*
 * Extended attributes are stored directly in inodes (on file systems with
 * inodes bigger than 128 bytes) and on additional disk blocks. The i_file_acl
 * field contains the block number if an inode uses an additional block. All
 * attributes must fit in the inode and one additional block. Blocks that
 * contain the identical set of attributes may be shared among several inodes.
 * Identical blocks are detected by keeping a cache of blocks that have
 * recently been accessed.
 *
 * The attributes in inodes and on blocks have a different header; the entries
 * are stored in the same format:
 *
 *   +------------------+
 *   | header           |
 *   | entry 1          | |
 *   | entry 2          | | growing downwards
 *   | entry 3          | v
 *   | four null bytes  |
 *   | . . .            |
 *   | value 1          | ^
 *   | value 3          | | growing upwards
 *   | value 2          | |
 *   +------------------+
 *
 * The header is followed by multiple entry descriptors. In disk blocks, the
 * entry descriptors are kept sorted. In inodes, they are unsorted. The
 * attribute values are aligned to the end of the block in no specific order.
 */
/*
 * Locking strategy
 * ----------------
 * EXT4_I(inode)->i_file_acl is protected by EXT4_I(inode)->xattr_sem.
 * EA blocks are only changed if they are exclusive to an inode, so
 * holding xattr_sem also means that nothing but the EA block's reference
 * count can change. Multiple writers to the same block are synchronized
 * by the buffer lock.
 */
54 #include <linux/init.h>
56 #include <linux/slab.h>
57 #include <linux/mbcache.h>
58 #include <linux/quotaops.h>
59 #include <linux/iversion.h>
60 #include "ext4_jbd2.h"
/*
 * Debug tracing helpers.
 *
 * With EXT4_XATTR_DEBUG defined, ea_idebug() prints a KERN_DEBUG message
 * tagged with the inode's superblock id and inode number, and ea_bdebug()
 * prints one tagged with the buffer's block device and block number.
 * Without it, both expand to no_printk() with the same format/arguments.
 */
#ifdef EXT4_XATTR_DEBUG
# define ea_idebug(inode, fmt, ...)					\
	printk(KERN_DEBUG "inode %s:%lu: " fmt "\n",			\
	       (inode)->i_sb->s_id, (inode)->i_ino, ##__VA_ARGS__)
# define ea_bdebug(bh, fmt, ...)					\
	printk(KERN_DEBUG "block %pg:%lu: " fmt "\n",			\
	       (bh)->b_bdev, (unsigned long)(bh)->b_blocknr, ##__VA_ARGS__)
#else
# define ea_idebug(inode, fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
# define ea_bdebug(bh, fmt, ...)	no_printk(fmt, ##__VA_ARGS__)
#endif
77 static void ext4_xattr_block_cache_insert(struct mb_cache
*,
78 struct buffer_head
*);
79 static struct buffer_head
*
80 ext4_xattr_block_cache_find(struct inode
*, struct ext4_xattr_header
*,
81 struct mb_cache_entry
**);
82 static __le32
ext4_xattr_hash_entry(char *name
, size_t name_len
, __le32
*value
,
84 static __le32
ext4_xattr_hash_entry_signed(char *name
, size_t name_len
, __le32
*value
,
86 static void ext4_xattr_rehash(struct ext4_xattr_header
*);
88 static const struct xattr_handler
* const ext4_xattr_handler_map
[] = {
89 [EXT4_XATTR_INDEX_USER
] = &ext4_xattr_user_handler
,
90 #ifdef CONFIG_EXT4_FS_POSIX_ACL
91 [EXT4_XATTR_INDEX_POSIX_ACL_ACCESS
] = &nop_posix_acl_access
,
92 [EXT4_XATTR_INDEX_POSIX_ACL_DEFAULT
] = &nop_posix_acl_default
,
94 [EXT4_XATTR_INDEX_TRUSTED
] = &ext4_xattr_trusted_handler
,
95 #ifdef CONFIG_EXT4_FS_SECURITY
96 [EXT4_XATTR_INDEX_SECURITY
] = &ext4_xattr_security_handler
,
98 [EXT4_XATTR_INDEX_HURD
] = &ext4_xattr_hurd_handler
,
101 const struct xattr_handler
* const ext4_xattr_handlers
[] = {
102 &ext4_xattr_user_handler
,
103 &ext4_xattr_trusted_handler
,
104 #ifdef CONFIG_EXT4_FS_SECURITY
105 &ext4_xattr_security_handler
,
107 &ext4_xattr_hurd_handler
,
/*
 * s_ea_block_cache of the ext4_sb_info reached through
 * inode->i_sb->s_fs_info. The argument is parenthesized so that any pointer
 * expression (e.g. &some_inode) can be passed.
 */
#define EA_BLOCK_CACHE(inode)	(((struct ext4_sb_info *) \
				(inode)->i_sb->s_fs_info)->s_ea_block_cache)
/*
 * s_ea_inode_cache of the ext4_sb_info reached through
 * inode->i_sb->s_fs_info. The argument is parenthesized so that any pointer
 * expression (e.g. &some_inode) can be passed.
 */
#define EA_INODE_CACHE(inode)	(((struct ext4_sb_info *) \
				(inode)->i_sb->s_fs_info)->s_ea_inode_cache)
118 ext4_expand_inode_array(struct ext4_xattr_inode_array
**ea_inode_array
,
119 struct inode
*inode
);
#ifdef CONFIG_LOCKDEP
/*
 * Assign lockdep subclasses to the locks of an EA inode: subclass 1 for
 * its i_rwsem and I_DATA_SEM_EA for its i_data_sem.
 *
 * @ea_inode: the EA inode whose locks are being classified.
 */
void ext4_xattr_inode_set_class(struct inode *ea_inode)
{
	struct ext4_inode_info *ei = EXT4_I(ea_inode);

	lockdep_set_subclass(&ea_inode->i_rwsem, 1);
	(void) ei;	/* shut up clang warning if !CONFIG_LOCKDEP */
	lockdep_set_subclass(&ei->i_data_sem, I_DATA_SEM_EA);
}
#endif
132 static __le32
ext4_xattr_block_csum(struct inode
*inode
,
134 struct ext4_xattr_header
*hdr
)
136 struct ext4_sb_info
*sbi
= EXT4_SB(inode
->i_sb
);
138 __le64 dsk_block_nr
= cpu_to_le64(block_nr
);
139 __u32 dummy_csum
= 0;
140 int offset
= offsetof(struct ext4_xattr_header
, h_checksum
);
142 csum
= ext4_chksum(sbi
, sbi
->s_csum_seed
, (__u8
*)&dsk_block_nr
,
143 sizeof(dsk_block_nr
));
144 csum
= ext4_chksum(sbi
, csum
, (__u8
*)hdr
, offset
);
145 csum
= ext4_chksum(sbi
, csum
, (__u8
*)&dummy_csum
, sizeof(dummy_csum
));
146 offset
+= sizeof(dummy_csum
);
147 csum
= ext4_chksum(sbi
, csum
, (__u8
*)hdr
+ offset
,
148 EXT4_BLOCK_SIZE(inode
->i_sb
) - offset
);
150 return cpu_to_le32(csum
);
153 static int ext4_xattr_block_csum_verify(struct inode
*inode
,
154 struct buffer_head
*bh
)
156 struct ext4_xattr_header
*hdr
= BHDR(bh
);
159 if (ext4_has_metadata_csum(inode
->i_sb
)) {
161 ret
= (hdr
->h_checksum
== ext4_xattr_block_csum(inode
,
162 bh
->b_blocknr
, hdr
));
168 static void ext4_xattr_block_csum_set(struct inode
*inode
,
169 struct buffer_head
*bh
)
171 if (ext4_has_metadata_csum(inode
->i_sb
))
172 BHDR(bh
)->h_checksum
= ext4_xattr_block_csum(inode
,
173 bh
->b_blocknr
, BHDR(bh
));
176 static inline const char *ext4_xattr_prefix(int name_index
,
177 struct dentry
*dentry
)
179 const struct xattr_handler
*handler
= NULL
;
181 if (name_index
> 0 && name_index
< ARRAY_SIZE(ext4_xattr_handler_map
))
182 handler
= ext4_xattr_handler_map
[name_index
];
184 if (!xattr_handler_can_list(handler
, dentry
))
187 return xattr_prefix(handler
);
191 check_xattrs(struct inode
*inode
, struct buffer_head
*bh
,
192 struct ext4_xattr_entry
*entry
, void *end
, void *value_start
,
193 const char *function
, unsigned int line
)
195 struct ext4_xattr_entry
*e
= entry
;
196 int err
= -EFSCORRUPTED
;
200 if (BHDR(bh
)->h_magic
!= cpu_to_le32(EXT4_XATTR_MAGIC
) ||
201 BHDR(bh
)->h_blocks
!= cpu_to_le32(1)) {
202 err_str
= "invalid header";
205 if (buffer_verified(bh
))
207 if (!ext4_xattr_block_csum_verify(inode
, bh
)) {
209 err_str
= "invalid checksum";
213 struct ext4_xattr_ibody_header
*header
= value_start
;
216 if (end
- (void *)header
< sizeof(*header
) + sizeof(u32
)) {
217 err_str
= "in-inode xattr block too small";
220 if (header
->h_magic
!= cpu_to_le32(EXT4_XATTR_MAGIC
)) {
221 err_str
= "bad magic number in in-inode xattr";
226 /* Find the end of the names list */
227 while (!IS_LAST_ENTRY(e
)) {
228 struct ext4_xattr_entry
*next
= EXT4_XATTR_NEXT(e
);
229 if ((void *)next
>= end
) {
230 err_str
= "e_name out of bounds";
233 if (strnlen(e
->e_name
, e
->e_name_len
) != e
->e_name_len
) {
234 err_str
= "bad e_name length";
240 /* Check the values */
241 while (!IS_LAST_ENTRY(entry
)) {
242 u32 size
= le32_to_cpu(entry
->e_value_size
);
243 unsigned long ea_ino
= le32_to_cpu(entry
->e_value_inum
);
245 if (!ext4_has_feature_ea_inode(inode
->i_sb
) && ea_ino
) {
246 err_str
= "ea_inode specified without ea_inode feature enabled";
249 if (ea_ino
&& ((ea_ino
== EXT4_ROOT_INO
) ||
250 !ext4_valid_inum(inode
->i_sb
, ea_ino
))) {
251 err_str
= "invalid ea_ino";
254 if (size
> EXT4_XATTR_SIZE_MAX
) {
255 err_str
= "e_value size too large";
259 if (size
!= 0 && entry
->e_value_inum
== 0) {
260 u16 offs
= le16_to_cpu(entry
->e_value_offs
);
264 * The value cannot overlap the names, and the value
265 * with padding cannot extend beyond 'end'. Check both
266 * the padded and unpadded sizes, since the size may
267 * overflow to 0 when adding padding.
269 if (offs
> end
- value_start
) {
270 err_str
= "e_value out of bounds";
273 value
= value_start
+ offs
;
274 if (value
< (void *)e
+ sizeof(u32
) ||
275 size
> end
- value
||
276 EXT4_XATTR_SIZE(size
) > end
- value
) {
277 err_str
= "overlapping e_value ";
281 entry
= EXT4_XATTR_NEXT(entry
);
284 set_buffer_verified(bh
);
289 __ext4_error_inode(inode
, function
, line
, 0, -err
,
290 "corrupted xattr block %llu: %s",
291 (unsigned long long) bh
->b_blocknr
,
294 __ext4_error_inode(inode
, function
, line
, 0, -err
,
295 "corrupted in-inode xattr: %s", err_str
);
300 __ext4_xattr_check_block(struct inode
*inode
, struct buffer_head
*bh
,
301 const char *function
, unsigned int line
)
303 return check_xattrs(inode
, bh
, BFIRST(bh
), bh
->b_data
+ bh
->b_size
,
304 bh
->b_data
, function
, line
);
/*
 * Convenience wrapper: validate an xattr block, recording the calling
 * function and line for error reporting.
 */
#define ext4_xattr_check_block(inode, bh) \
	__ext4_xattr_check_block((inode), (bh), __func__, __LINE__)
312 __xattr_check_inode(struct inode
*inode
, struct ext4_xattr_ibody_header
*header
,
313 void *end
, const char *function
, unsigned int line
)
315 return check_xattrs(inode
, NULL
, IFIRST(header
), end
, IFIRST(header
),
/*
 * Convenience wrapper: validate the in-inode xattr area, recording the
 * calling function and line for error reporting.
 */
#define xattr_check_inode(inode, header, end) \
	__xattr_check_inode((inode), (header), (end), __func__, __LINE__)
323 xattr_find_entry(struct inode
*inode
, struct ext4_xattr_entry
**pentry
,
324 void *end
, int name_index
, const char *name
, int sorted
)
326 struct ext4_xattr_entry
*entry
, *next
;
332 name_len
= strlen(name
);
333 for (entry
= *pentry
; !IS_LAST_ENTRY(entry
); entry
= next
) {
334 next
= EXT4_XATTR_NEXT(entry
);
335 if ((void *) next
>= end
) {
336 EXT4_ERROR_INODE(inode
, "corrupted xattr entries");
337 return -EFSCORRUPTED
;
339 cmp
= name_index
- entry
->e_name_index
;
341 cmp
= name_len
- entry
->e_name_len
;
343 cmp
= memcmp(name
, entry
->e_name
, name_len
);
344 if (cmp
<= 0 && (sorted
|| cmp
== 0))
348 return cmp
? -ENODATA
: 0;
352 ext4_xattr_inode_hash(struct ext4_sb_info
*sbi
, const void *buffer
, size_t size
)
354 return ext4_chksum(sbi
, sbi
->s_csum_seed
, buffer
, size
);
357 static u64
ext4_xattr_inode_get_ref(struct inode
*ea_inode
)
359 return ((u64
) inode_get_ctime_sec(ea_inode
) << 32) |
360 (u32
) inode_peek_iversion_raw(ea_inode
);
363 static void ext4_xattr_inode_set_ref(struct inode
*ea_inode
, u64 ref_count
)
365 inode_set_ctime(ea_inode
, (u32
)(ref_count
>> 32), 0);
366 inode_set_iversion_raw(ea_inode
, ref_count
& 0xffffffff);
369 static u32
ext4_xattr_inode_get_hash(struct inode
*ea_inode
)
371 return (u32
) inode_get_atime_sec(ea_inode
);
374 static void ext4_xattr_inode_set_hash(struct inode
*ea_inode
, u32 hash
)
376 inode_set_atime(ea_inode
, hash
, 0);
380 * Read the EA value from an inode.
382 static int ext4_xattr_inode_read(struct inode
*ea_inode
, void *buf
, size_t size
)
384 int blocksize
= 1 << ea_inode
->i_blkbits
;
385 int bh_count
= (size
+ blocksize
- 1) >> ea_inode
->i_blkbits
;
386 int tail_size
= (size
% blocksize
) ?: blocksize
;
387 struct buffer_head
*bhs_inline
[8];
388 struct buffer_head
**bhs
= bhs_inline
;
391 if (bh_count
> ARRAY_SIZE(bhs_inline
)) {
392 bhs
= kmalloc_array(bh_count
, sizeof(*bhs
), GFP_NOFS
);
397 ret
= ext4_bread_batch(ea_inode
, 0 /* block */, bh_count
,
398 true /* wait */, bhs
);
402 for (i
= 0; i
< bh_count
; i
++) {
403 /* There shouldn't be any holes in ea_inode. */
408 memcpy((char *)buf
+ blocksize
* i
, bhs
[i
]->b_data
,
409 i
< bh_count
- 1 ? blocksize
: tail_size
);
413 for (i
= 0; i
< bh_count
; i
++)
416 if (bhs
!= bhs_inline
)
/*
 * Parent back-pointer of an EA inode: the mtime seconds truncated to
 * 32 bits (compared against the parent's i_ino by the caller).
 */
#define EXT4_XATTR_INODE_GET_PARENT(inode) ((__u32)(inode_get_mtime_sec((inode))))
423 static int ext4_xattr_inode_iget(struct inode
*parent
, unsigned long ea_ino
,
424 u32 ea_inode_hash
, struct inode
**ea_inode
)
430 * We have to check for this corruption early as otherwise
431 * iget_locked() could wait indefinitely for the state of our
434 if (parent
->i_ino
== ea_ino
) {
435 ext4_error(parent
->i_sb
,
436 "Parent and EA inode have the same ino %lu", ea_ino
);
437 return -EFSCORRUPTED
;
440 inode
= ext4_iget(parent
->i_sb
, ea_ino
, EXT4_IGET_EA_INODE
);
442 err
= PTR_ERR(inode
);
443 ext4_error(parent
->i_sb
,
444 "error while reading EA inode %lu err=%d", ea_ino
,
448 ext4_xattr_inode_set_class(inode
);
451 * Check whether this is an old Lustre-style xattr inode. Lustre
452 * implementation does not have hash validation, rather it has a
453 * backpointer from ea_inode to the parent inode.
455 if (ea_inode_hash
!= ext4_xattr_inode_get_hash(inode
) &&
456 EXT4_XATTR_INODE_GET_PARENT(inode
) == parent
->i_ino
&&
457 inode
->i_generation
== parent
->i_generation
) {
458 ext4_set_inode_state(inode
, EXT4_STATE_LUSTRE_EA_INODE
);
459 ext4_xattr_inode_set_ref(inode
, 1);
461 inode_lock_nested(inode
, I_MUTEX_XATTR
);
462 inode
->i_flags
|= S_NOQUOTA
;
470 /* Remove entry from mbcache when EA inode is getting evicted */
471 void ext4_evict_ea_inode(struct inode
*inode
)
473 struct mb_cache_entry
*oe
;
475 if (!EA_INODE_CACHE(inode
))
477 /* Wait for entry to get unused so that we can remove it */
478 while ((oe
= mb_cache_entry_delete_or_get(EA_INODE_CACHE(inode
),
479 ext4_xattr_inode_get_hash(inode
), inode
->i_ino
))) {
480 mb_cache_entry_wait_unused(oe
);
481 mb_cache_entry_put(EA_INODE_CACHE(inode
), oe
);
486 ext4_xattr_inode_verify_hashes(struct inode
*ea_inode
,
487 struct ext4_xattr_entry
*entry
, void *buffer
,
492 /* Verify stored hash matches calculated hash. */
493 hash
= ext4_xattr_inode_hash(EXT4_SB(ea_inode
->i_sb
), buffer
, size
);
494 if (hash
!= ext4_xattr_inode_get_hash(ea_inode
))
495 return -EFSCORRUPTED
;
498 __le32 e_hash
, tmp_data
;
500 /* Verify entry hash. */
501 tmp_data
= cpu_to_le32(hash
);
502 e_hash
= ext4_xattr_hash_entry(entry
->e_name
, entry
->e_name_len
,
505 if (e_hash
== entry
->e_hash
)
509 * Not good. Maybe the entry hash was calculated
510 * using the buggy signed char version?
512 e_hash
= ext4_xattr_hash_entry_signed(entry
->e_name
, entry
->e_name_len
,
514 /* Still no match - bad */
515 if (e_hash
!= entry
->e_hash
)
516 return -EFSCORRUPTED
;
518 /* Let people know about old hash */
519 pr_warn_once("ext4: filesystem with signed xattr name hash");
525 * Read xattr value from the EA inode.
528 ext4_xattr_inode_get(struct inode
*inode
, struct ext4_xattr_entry
*entry
,
529 void *buffer
, size_t size
)
531 struct mb_cache
*ea_inode_cache
= EA_INODE_CACHE(inode
);
532 struct inode
*ea_inode
;
535 err
= ext4_xattr_inode_iget(inode
, le32_to_cpu(entry
->e_value_inum
),
536 le32_to_cpu(entry
->e_hash
), &ea_inode
);
542 if (i_size_read(ea_inode
) != size
) {
543 ext4_warning_inode(ea_inode
,
544 "ea_inode file size=%llu entry size=%zu",
545 i_size_read(ea_inode
), size
);
550 err
= ext4_xattr_inode_read(ea_inode
, buffer
, size
);
554 if (!ext4_test_inode_state(ea_inode
, EXT4_STATE_LUSTRE_EA_INODE
)) {
555 err
= ext4_xattr_inode_verify_hashes(ea_inode
, entry
, buffer
,
558 ext4_warning_inode(ea_inode
,
559 "EA inode hash validation failed");
564 mb_cache_entry_create(ea_inode_cache
, GFP_NOFS
,
565 ext4_xattr_inode_get_hash(ea_inode
),
566 ea_inode
->i_ino
, true /* reusable */);
574 ext4_xattr_block_get(struct inode
*inode
, int name_index
, const char *name
,
575 void *buffer
, size_t buffer_size
)
577 struct buffer_head
*bh
= NULL
;
578 struct ext4_xattr_entry
*entry
;
582 struct mb_cache
*ea_block_cache
= EA_BLOCK_CACHE(inode
);
584 ea_idebug(inode
, "name=%d.%s, buffer=%p, buffer_size=%ld",
585 name_index
, name
, buffer
, (long)buffer_size
);
587 if (!EXT4_I(inode
)->i_file_acl
)
589 ea_idebug(inode
, "reading block %llu",
590 (unsigned long long)EXT4_I(inode
)->i_file_acl
);
591 bh
= ext4_sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
594 ea_bdebug(bh
, "b_count=%d, refcount=%d",
595 atomic_read(&(bh
->b_count
)), le32_to_cpu(BHDR(bh
)->h_refcount
));
596 error
= ext4_xattr_check_block(inode
, bh
);
599 ext4_xattr_block_cache_insert(ea_block_cache
, bh
);
601 end
= bh
->b_data
+ bh
->b_size
;
602 error
= xattr_find_entry(inode
, &entry
, end
, name_index
, name
, 1);
605 size
= le32_to_cpu(entry
->e_value_size
);
607 if (unlikely(size
> EXT4_XATTR_SIZE_MAX
))
610 if (size
> buffer_size
)
612 if (entry
->e_value_inum
) {
613 error
= ext4_xattr_inode_get(inode
, entry
, buffer
,
618 u16 offset
= le16_to_cpu(entry
->e_value_offs
);
619 void *p
= bh
->b_data
+ offset
;
621 if (unlikely(p
+ size
> end
))
623 memcpy(buffer
, p
, size
);
634 ext4_xattr_ibody_get(struct inode
*inode
, int name_index
, const char *name
,
635 void *buffer
, size_t buffer_size
)
637 struct ext4_xattr_ibody_header
*header
;
638 struct ext4_xattr_entry
*entry
;
639 struct ext4_inode
*raw_inode
;
640 struct ext4_iloc iloc
;
645 if (!ext4_test_inode_state(inode
, EXT4_STATE_XATTR
))
647 error
= ext4_get_inode_loc(inode
, &iloc
);
650 raw_inode
= ext4_raw_inode(&iloc
);
651 header
= IHDR(inode
, raw_inode
);
652 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
653 error
= xattr_check_inode(inode
, header
, end
);
656 entry
= IFIRST(header
);
657 error
= xattr_find_entry(inode
, &entry
, end
, name_index
, name
, 0);
660 size
= le32_to_cpu(entry
->e_value_size
);
662 if (unlikely(size
> EXT4_XATTR_SIZE_MAX
))
665 if (size
> buffer_size
)
667 if (entry
->e_value_inum
) {
668 error
= ext4_xattr_inode_get(inode
, entry
, buffer
,
673 u16 offset
= le16_to_cpu(entry
->e_value_offs
);
674 void *p
= (void *)IFIRST(header
) + offset
;
676 if (unlikely(p
+ size
> end
))
678 memcpy(buffer
, p
, size
);
691 * Copy an extended attribute into the buffer
692 * provided, or compute the buffer size required.
693 * Buffer is NULL to compute the size of the buffer required.
695 * Returns a negative error number on failure, or the number of bytes
696 * used / required on success.
699 ext4_xattr_get(struct inode
*inode
, int name_index
, const char *name
,
700 void *buffer
, size_t buffer_size
)
704 if (unlikely(ext4_forced_shutdown(inode
->i_sb
)))
707 if (strlen(name
) > 255)
710 down_read(&EXT4_I(inode
)->xattr_sem
);
711 error
= ext4_xattr_ibody_get(inode
, name_index
, name
, buffer
,
713 if (error
== -ENODATA
)
714 error
= ext4_xattr_block_get(inode
, name_index
, name
, buffer
,
716 up_read(&EXT4_I(inode
)->xattr_sem
);
721 ext4_xattr_list_entries(struct dentry
*dentry
, struct ext4_xattr_entry
*entry
,
722 char *buffer
, size_t buffer_size
)
724 size_t rest
= buffer_size
;
726 for (; !IS_LAST_ENTRY(entry
); entry
= EXT4_XATTR_NEXT(entry
)) {
729 prefix
= ext4_xattr_prefix(entry
->e_name_index
, dentry
);
731 size_t prefix_len
= strlen(prefix
);
732 size_t size
= prefix_len
+ entry
->e_name_len
+ 1;
737 memcpy(buffer
, prefix
, prefix_len
);
738 buffer
+= prefix_len
;
739 memcpy(buffer
, entry
->e_name
, entry
->e_name_len
);
740 buffer
+= entry
->e_name_len
;
746 return buffer_size
- rest
; /* total size */
750 ext4_xattr_block_list(struct dentry
*dentry
, char *buffer
, size_t buffer_size
)
752 struct inode
*inode
= d_inode(dentry
);
753 struct buffer_head
*bh
= NULL
;
756 ea_idebug(inode
, "buffer=%p, buffer_size=%ld",
757 buffer
, (long)buffer_size
);
759 if (!EXT4_I(inode
)->i_file_acl
)
761 ea_idebug(inode
, "reading block %llu",
762 (unsigned long long)EXT4_I(inode
)->i_file_acl
);
763 bh
= ext4_sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
766 ea_bdebug(bh
, "b_count=%d, refcount=%d",
767 atomic_read(&(bh
->b_count
)), le32_to_cpu(BHDR(bh
)->h_refcount
));
768 error
= ext4_xattr_check_block(inode
, bh
);
771 ext4_xattr_block_cache_insert(EA_BLOCK_CACHE(inode
), bh
);
772 error
= ext4_xattr_list_entries(dentry
, BFIRST(bh
), buffer
,
780 ext4_xattr_ibody_list(struct dentry
*dentry
, char *buffer
, size_t buffer_size
)
782 struct inode
*inode
= d_inode(dentry
);
783 struct ext4_xattr_ibody_header
*header
;
784 struct ext4_inode
*raw_inode
;
785 struct ext4_iloc iloc
;
789 if (!ext4_test_inode_state(inode
, EXT4_STATE_XATTR
))
791 error
= ext4_get_inode_loc(inode
, &iloc
);
794 raw_inode
= ext4_raw_inode(&iloc
);
795 header
= IHDR(inode
, raw_inode
);
796 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
797 error
= xattr_check_inode(inode
, header
, end
);
800 error
= ext4_xattr_list_entries(dentry
, IFIRST(header
),
801 buffer
, buffer_size
);
809 * Inode operation listxattr()
811 * d_inode(dentry)->i_rwsem: don't care
813 * Copy a list of attribute names into the buffer
814 * provided, or compute the buffer size required.
815 * Buffer is NULL to compute the size of the buffer required.
817 * Returns a negative error number on failure, or the number of bytes
818 * used / required on success.
821 ext4_listxattr(struct dentry
*dentry
, char *buffer
, size_t buffer_size
)
825 down_read(&EXT4_I(d_inode(dentry
))->xattr_sem
);
826 ret
= ret2
= ext4_xattr_ibody_list(dentry
, buffer
, buffer_size
);
833 ret
= ext4_xattr_block_list(dentry
, buffer
, buffer_size
);
838 up_read(&EXT4_I(d_inode(dentry
))->xattr_sem
);
843 * If the EXT4_FEATURE_COMPAT_EXT_ATTR feature of this file system is
846 static void ext4_xattr_update_super_block(handle_t
*handle
,
847 struct super_block
*sb
)
849 if (ext4_has_feature_xattr(sb
))
852 BUFFER_TRACE(EXT4_SB(sb
)->s_sbh
, "get_write_access");
853 if (ext4_journal_get_write_access(handle
, sb
, EXT4_SB(sb
)->s_sbh
,
854 EXT4_JTR_NONE
) == 0) {
855 lock_buffer(EXT4_SB(sb
)->s_sbh
);
856 ext4_set_feature_xattr(sb
);
857 ext4_superblock_csum_set(sb
);
858 unlock_buffer(EXT4_SB(sb
)->s_sbh
);
859 ext4_handle_dirty_metadata(handle
, NULL
, EXT4_SB(sb
)->s_sbh
);
863 int ext4_get_inode_usage(struct inode
*inode
, qsize_t
*usage
)
865 struct ext4_iloc iloc
= { .bh
= NULL
};
866 struct buffer_head
*bh
= NULL
;
867 struct ext4_inode
*raw_inode
;
868 struct ext4_xattr_ibody_header
*header
;
869 struct ext4_xattr_entry
*entry
;
870 qsize_t ea_inode_refs
= 0;
874 lockdep_assert_held_read(&EXT4_I(inode
)->xattr_sem
);
876 if (ext4_test_inode_state(inode
, EXT4_STATE_XATTR
)) {
877 ret
= ext4_get_inode_loc(inode
, &iloc
);
880 raw_inode
= ext4_raw_inode(&iloc
);
881 header
= IHDR(inode
, raw_inode
);
882 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
883 ret
= xattr_check_inode(inode
, header
, end
);
887 for (entry
= IFIRST(header
); !IS_LAST_ENTRY(entry
);
888 entry
= EXT4_XATTR_NEXT(entry
))
889 if (entry
->e_value_inum
)
893 if (EXT4_I(inode
)->i_file_acl
) {
894 bh
= ext4_sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
901 ret
= ext4_xattr_check_block(inode
, bh
);
905 for (entry
= BFIRST(bh
); !IS_LAST_ENTRY(entry
);
906 entry
= EXT4_XATTR_NEXT(entry
))
907 if (entry
->e_value_inum
)
910 *usage
= ea_inode_refs
+ 1;
918 static inline size_t round_up_cluster(struct inode
*inode
, size_t length
)
920 struct super_block
*sb
= inode
->i_sb
;
921 size_t cluster_size
= 1 << (EXT4_SB(sb
)->s_cluster_bits
+
923 size_t mask
= ~(cluster_size
- 1);
925 return (length
+ cluster_size
- 1) & mask
;
928 static int ext4_xattr_inode_alloc_quota(struct inode
*inode
, size_t len
)
932 err
= dquot_alloc_inode(inode
);
935 err
= dquot_alloc_space_nodirty(inode
, round_up_cluster(inode
, len
));
937 dquot_free_inode(inode
);
941 static void ext4_xattr_inode_free_quota(struct inode
*parent
,
942 struct inode
*ea_inode
,
946 ext4_test_inode_state(ea_inode
, EXT4_STATE_LUSTRE_EA_INODE
))
948 dquot_free_space_nodirty(parent
, round_up_cluster(parent
, len
));
949 dquot_free_inode(parent
);
952 int __ext4_xattr_set_credits(struct super_block
*sb
, struct inode
*inode
,
953 struct buffer_head
*block_bh
, size_t value_len
,
960 * 1) Owner inode update
961 * 2) Ref count update on old xattr block
963 * 4) block bitmap update for new xattr block
964 * 5) group descriptor for new xattr block
965 * 6) block bitmap update for old xattr block
966 * 7) group descriptor for old block
968 * 6 & 7 can happen if we have two racing threads T_a and T_b
969 * which are each trying to set an xattr on inodes I_a and I_b
970 * which were both initially sharing an xattr block.
975 credits
+= EXT4_MAXQUOTAS_TRANS_BLOCKS(sb
);
978 * In case of inline data, we may push out the data to a block,
979 * so we need to reserve credits for this eventuality
981 if (inode
&& ext4_has_inline_data(inode
))
982 credits
+= ext4_writepage_trans_blocks(inode
) + 1;
984 /* We are done if ea_inode feature is not enabled. */
985 if (!ext4_has_feature_ea_inode(sb
))
988 /* New ea_inode, inode map, block bitmap, group descriptor. */
992 blocks
= (value_len
+ sb
->s_blocksize
- 1) >> sb
->s_blocksize_bits
;
994 /* Indirection block or one level of extent tree. */
997 /* Block bitmap and group descriptor updates for each block. */
998 credits
+= blocks
* 2;
1000 /* Blocks themselves. */
1004 /* Dereference ea_inode holding old xattr value.
1005 * Old ea_inode, inode map, block bitmap, group descriptor.
1009 /* Data blocks for old ea_inode. */
1010 blocks
= XATTR_SIZE_MAX
>> sb
->s_blocksize_bits
;
1012 /* Indirection block or one level of extent tree for old
1017 /* Block bitmap and group descriptor updates for each block. */
1018 credits
+= blocks
* 2;
1021 /* We may need to clone the existing xattr block in which case we need
1022 * to increment ref counts for existing ea_inodes referenced by it.
1025 struct ext4_xattr_entry
*entry
= BFIRST(block_bh
);
1027 for (; !IS_LAST_ENTRY(entry
); entry
= EXT4_XATTR_NEXT(entry
))
1028 if (entry
->e_value_inum
)
1029 /* Ref count update on ea_inode. */
1035 static int ext4_xattr_inode_update_ref(handle_t
*handle
, struct inode
*ea_inode
,
1038 struct ext4_iloc iloc
;
1042 inode_lock_nested(ea_inode
, I_MUTEX_XATTR
);
1044 ret
= ext4_reserve_inode_write(handle
, ea_inode
, &iloc
);
1048 ref_count
= ext4_xattr_inode_get_ref(ea_inode
);
1049 ref_count
+= ref_change
;
1050 ext4_xattr_inode_set_ref(ea_inode
, ref_count
);
1052 if (ref_change
> 0) {
1053 WARN_ONCE(ref_count
<= 0, "EA inode %lu ref_count=%lld",
1054 ea_inode
->i_ino
, ref_count
);
1056 if (ref_count
== 1) {
1057 WARN_ONCE(ea_inode
->i_nlink
, "EA inode %lu i_nlink=%u",
1058 ea_inode
->i_ino
, ea_inode
->i_nlink
);
1060 set_nlink(ea_inode
, 1);
1061 ext4_orphan_del(handle
, ea_inode
);
1064 WARN_ONCE(ref_count
< 0, "EA inode %lu ref_count=%lld",
1065 ea_inode
->i_ino
, ref_count
);
1067 if (ref_count
== 0) {
1068 WARN_ONCE(ea_inode
->i_nlink
!= 1,
1069 "EA inode %lu i_nlink=%u",
1070 ea_inode
->i_ino
, ea_inode
->i_nlink
);
1072 clear_nlink(ea_inode
);
1073 ext4_orphan_add(handle
, ea_inode
);
1077 ret
= ext4_mark_iloc_dirty(handle
, ea_inode
, &iloc
);
1079 ext4_warning_inode(ea_inode
,
1080 "ext4_mark_iloc_dirty() failed ret=%d", ret
);
1082 inode_unlock(ea_inode
);
1086 static int ext4_xattr_inode_inc_ref(handle_t
*handle
, struct inode
*ea_inode
)
1088 return ext4_xattr_inode_update_ref(handle
, ea_inode
, 1);
1091 static int ext4_xattr_inode_dec_ref(handle_t
*handle
, struct inode
*ea_inode
)
1093 return ext4_xattr_inode_update_ref(handle
, ea_inode
, -1);
1096 static int ext4_xattr_inode_inc_ref_all(handle_t
*handle
, struct inode
*parent
,
1097 struct ext4_xattr_entry
*first
)
1099 struct inode
*ea_inode
;
1100 struct ext4_xattr_entry
*entry
;
1101 struct ext4_xattr_entry
*failed_entry
;
1102 unsigned int ea_ino
;
1105 for (entry
= first
; !IS_LAST_ENTRY(entry
);
1106 entry
= EXT4_XATTR_NEXT(entry
)) {
1107 if (!entry
->e_value_inum
)
1109 ea_ino
= le32_to_cpu(entry
->e_value_inum
);
1110 err
= ext4_xattr_inode_iget(parent
, ea_ino
,
1111 le32_to_cpu(entry
->e_hash
),
1115 err
= ext4_xattr_inode_inc_ref(handle
, ea_inode
);
1117 ext4_warning_inode(ea_inode
, "inc ref error %d", err
);
1127 failed_entry
= entry
;
1129 for (entry
= first
; entry
!= failed_entry
;
1130 entry
= EXT4_XATTR_NEXT(entry
)) {
1131 if (!entry
->e_value_inum
)
1133 ea_ino
= le32_to_cpu(entry
->e_value_inum
);
1134 err
= ext4_xattr_inode_iget(parent
, ea_ino
,
1135 le32_to_cpu(entry
->e_hash
),
1138 ext4_warning(parent
->i_sb
,
1139 "cleanup ea_ino %u iget error %d", ea_ino
,
1143 err
= ext4_xattr_inode_dec_ref(handle
, ea_inode
);
1145 ext4_warning_inode(ea_inode
, "cleanup dec ref error %d",
1152 static int ext4_xattr_restart_fn(handle_t
*handle
, struct inode
*inode
,
1153 struct buffer_head
*bh
, bool block_csum
, bool dirty
)
1159 ext4_xattr_block_csum_set(inode
, bh
);
1160 error
= ext4_handle_dirty_metadata(handle
, NULL
, bh
);
1162 ext4_warning(inode
->i_sb
, "Handle metadata (error %d)",
1171 ext4_xattr_inode_dec_ref_all(handle_t
*handle
, struct inode
*parent
,
1172 struct buffer_head
*bh
,
1173 struct ext4_xattr_entry
*first
, bool block_csum
,
1174 struct ext4_xattr_inode_array
**ea_inode_array
,
1175 int extra_credits
, bool skip_quota
)
1177 struct inode
*ea_inode
;
1178 struct ext4_xattr_entry
*entry
;
1180 unsigned int ea_ino
;
1184 /* One credit for dec ref on ea_inode, one for orphan list addition, */
1185 credits
= 2 + extra_credits
;
1187 for (entry
= first
; !IS_LAST_ENTRY(entry
);
1188 entry
= EXT4_XATTR_NEXT(entry
)) {
1189 if (!entry
->e_value_inum
)
1191 ea_ino
= le32_to_cpu(entry
->e_value_inum
);
1192 err
= ext4_xattr_inode_iget(parent
, ea_ino
,
1193 le32_to_cpu(entry
->e_hash
),
1198 err
= ext4_expand_inode_array(ea_inode_array
, ea_inode
);
1200 ext4_warning_inode(ea_inode
,
1201 "Expand inode array err=%d", err
);
1206 err
= ext4_journal_ensure_credits_fn(handle
, credits
, credits
,
1207 ext4_free_metadata_revoke_credits(parent
->i_sb
, 1),
1208 ext4_xattr_restart_fn(handle
, parent
, bh
, block_csum
,
1211 ext4_warning_inode(ea_inode
, "Ensure credits err=%d",
1216 err
= ext4_journal_get_write_access(handle
,
1217 parent
->i_sb
, bh
, EXT4_JTR_NONE
);
1219 ext4_warning_inode(ea_inode
,
1220 "Re-get write access err=%d",
1226 err
= ext4_xattr_inode_dec_ref(handle
, ea_inode
);
1228 ext4_warning_inode(ea_inode
, "ea_inode dec ref err=%d",
1234 ext4_xattr_inode_free_quota(parent
, ea_inode
,
1235 le32_to_cpu(entry
->e_value_size
));
1238 * Forget about ea_inode within the same transaction that
1239 * decrements the ref count. This avoids duplicate decrements in
1240 * case the rest of the work spills over to subsequent
1243 entry
->e_value_inum
= 0;
1244 entry
->e_value_size
= 0;
1251 * Note that we are deliberately skipping csum calculation for
1252 * the final update because we do not expect any journal
1253 * restarts until xattr block is freed.
1256 err
= ext4_handle_dirty_metadata(handle
, NULL
, bh
);
1258 ext4_warning_inode(parent
,
1259 "handle dirty metadata err=%d", err
);
1264 * Release the xattr block BH: If the reference count is > 1, decrement it;
1265 * otherwise free the block.
1268 ext4_xattr_release_block(handle_t
*handle
, struct inode
*inode
,
1269 struct buffer_head
*bh
,
1270 struct ext4_xattr_inode_array
**ea_inode_array
,
1273 struct mb_cache
*ea_block_cache
= EA_BLOCK_CACHE(inode
);
1277 BUFFER_TRACE(bh
, "get_write_access");
1278 error
= ext4_journal_get_write_access(handle
, inode
->i_sb
, bh
,
1285 hash
= le32_to_cpu(BHDR(bh
)->h_hash
);
1286 ref
= le32_to_cpu(BHDR(bh
)->h_refcount
);
1288 ea_bdebug(bh
, "refcount now=0; freeing");
1290 * This must happen under buffer lock for
1291 * ext4_xattr_block_set() to reliably detect freed block
1293 if (ea_block_cache
) {
1294 struct mb_cache_entry
*oe
;
1296 oe
= mb_cache_entry_delete_or_get(ea_block_cache
, hash
,
1300 mb_cache_entry_wait_unused(oe
);
1301 mb_cache_entry_put(ea_block_cache
, oe
);
1308 if (ext4_has_feature_ea_inode(inode
->i_sb
))
1309 ext4_xattr_inode_dec_ref_all(handle
, inode
, bh
,
1311 true /* block_csum */,
1314 true /* skip_quota */);
1315 ext4_free_blocks(handle
, inode
, bh
, 0, 1,
1316 EXT4_FREE_BLOCKS_METADATA
|
1317 EXT4_FREE_BLOCKS_FORGET
);
1320 BHDR(bh
)->h_refcount
= cpu_to_le32(ref
);
1321 if (ref
== EXT4_XATTR_REFCOUNT_MAX
- 1) {
1322 struct mb_cache_entry
*ce
;
1324 if (ea_block_cache
) {
1325 ce
= mb_cache_entry_get(ea_block_cache
, hash
,
1328 set_bit(MBE_REUSABLE_B
, &ce
->e_flags
);
1329 mb_cache_entry_put(ea_block_cache
, ce
);
1334 ext4_xattr_block_csum_set(inode
, bh
);
1336 * Beware of this ugliness: Releasing of xattr block references
1337 * from different inodes can race and so we have to protect
1338 * from a race where someone else frees the block (and releases
1339 * its journal_head) before we are done dirtying the buffer. In
1340 * nojournal mode this race is harmless and we actually cannot
1341 * call ext4_handle_dirty_metadata() with locked buffer as
1342 * that function can call sync_dirty_buffer() so for that case
1343 * we handle the dirtying after unlocking the buffer.
1345 if (ext4_handle_valid(handle
))
1346 error
= ext4_handle_dirty_metadata(handle
, inode
, bh
);
1348 if (!ext4_handle_valid(handle
))
1349 error
= ext4_handle_dirty_metadata(handle
, inode
, bh
);
1351 ext4_handle_sync(handle
);
1352 dquot_free_block(inode
, EXT4_C2B(EXT4_SB(inode
->i_sb
), 1));
1353 ea_bdebug(bh
, "refcount now=%d; releasing",
1354 le32_to_cpu(BHDR(bh
)->h_refcount
));
1357 ext4_std_error(inode
->i_sb
, error
);
1362 * Find the available free space for EAs. This also returns the total number of
1363 * bytes used by EA entries.
1365 static size_t ext4_xattr_free_space(struct ext4_xattr_entry
*last
,
1366 size_t *min_offs
, void *base
, int *total
)
1368 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
1369 if (!last
->e_value_inum
&& last
->e_value_size
) {
1370 size_t offs
= le16_to_cpu(last
->e_value_offs
);
1371 if (offs
< *min_offs
)
1375 *total
+= EXT4_XATTR_LEN(last
->e_name_len
);
1377 return (*min_offs
- ((void *)last
- base
) - sizeof(__u32
));
1381 * Write the value of the EA in an inode.
1383 static int ext4_xattr_inode_write(handle_t
*handle
, struct inode
*ea_inode
,
1384 const void *buf
, int bufsize
)
1386 struct buffer_head
*bh
= NULL
;
1387 unsigned long block
= 0;
1388 int blocksize
= ea_inode
->i_sb
->s_blocksize
;
1389 int max_blocks
= (bufsize
+ blocksize
- 1) >> ea_inode
->i_blkbits
;
1390 int csize
, wsize
= 0;
1391 int ret
= 0, ret2
= 0;
1395 while (ret
>= 0 && ret
< max_blocks
) {
1396 struct ext4_map_blocks map
;
1397 map
.m_lblk
= block
+= ret
;
1398 map
.m_len
= max_blocks
-= ret
;
1400 ret
= ext4_map_blocks(handle
, ea_inode
, &map
,
1401 EXT4_GET_BLOCKS_CREATE
);
1403 ext4_mark_inode_dirty(handle
, ea_inode
);
1404 if (ret
== -ENOSPC
&&
1405 ext4_should_retry_alloc(ea_inode
->i_sb
, &retries
)) {
1417 while (wsize
< bufsize
) {
1419 csize
= (bufsize
- wsize
) > blocksize
? blocksize
:
1421 bh
= ext4_getblk(handle
, ea_inode
, block
, 0);
1426 EXT4_ERROR_INODE(ea_inode
,
1427 "ext4_getblk() return bh = NULL");
1428 return -EFSCORRUPTED
;
1430 ret
= ext4_journal_get_write_access(handle
, ea_inode
->i_sb
, bh
,
1435 memcpy(bh
->b_data
, buf
, csize
);
1437 * Zero out block tail to avoid writing uninitialized memory
1440 if (csize
< blocksize
)
1441 memset(bh
->b_data
+ csize
, 0, blocksize
- csize
);
1442 set_buffer_uptodate(bh
);
1443 ext4_handle_dirty_metadata(handle
, ea_inode
, bh
);
1450 inode_lock(ea_inode
);
1451 i_size_write(ea_inode
, wsize
);
1452 ext4_update_i_disksize(ea_inode
, wsize
);
1453 inode_unlock(ea_inode
);
1455 ret2
= ext4_mark_inode_dirty(handle
, ea_inode
);
1456 if (unlikely(ret2
&& !ret
))
1466 * Create an inode to store the value of a large EA.
1468 static struct inode
*ext4_xattr_inode_create(handle_t
*handle
,
1469 struct inode
*inode
, u32 hash
)
1471 struct inode
*ea_inode
= NULL
;
1472 uid_t owner
[2] = { i_uid_read(inode
), i_gid_read(inode
) };
1475 if (inode
->i_sb
->s_root
== NULL
) {
1476 ext4_warning(inode
->i_sb
,
1477 "refuse to create EA inode when umounting");
1479 return ERR_PTR(-EINVAL
);
1483 * Let the next inode be the goal, so we try and allocate the EA inode
1484 * in the same group, or nearby one.
1486 ea_inode
= ext4_new_inode(handle
, inode
->i_sb
->s_root
->d_inode
,
1487 S_IFREG
| 0600, NULL
, inode
->i_ino
+ 1, owner
,
1489 if (!IS_ERR(ea_inode
)) {
1490 ea_inode
->i_op
= &ext4_file_inode_operations
;
1491 ea_inode
->i_fop
= &ext4_file_operations
;
1492 ext4_set_aops(ea_inode
);
1493 ext4_xattr_inode_set_class(ea_inode
);
1494 unlock_new_inode(ea_inode
);
1495 ext4_xattr_inode_set_ref(ea_inode
, 1);
1496 ext4_xattr_inode_set_hash(ea_inode
, hash
);
1497 err
= ext4_mark_inode_dirty(handle
, ea_inode
);
1499 err
= ext4_inode_attach_jinode(ea_inode
);
1501 if (ext4_xattr_inode_dec_ref(handle
, ea_inode
))
1502 ext4_warning_inode(ea_inode
,
1503 "cleanup dec ref error %d", err
);
1505 return ERR_PTR(err
);
1509 * Xattr inodes are shared therefore quota charging is performed
1510 * at a higher level.
1512 dquot_free_inode(ea_inode
);
1513 dquot_drop(ea_inode
);
1514 inode_lock(ea_inode
);
1515 ea_inode
->i_flags
|= S_NOQUOTA
;
1516 inode_unlock(ea_inode
);
1522 static struct inode
*
1523 ext4_xattr_inode_cache_find(struct inode
*inode
, const void *value
,
1524 size_t value_len
, u32 hash
)
1526 struct inode
*ea_inode
;
1527 struct mb_cache_entry
*ce
;
1528 struct mb_cache
*ea_inode_cache
= EA_INODE_CACHE(inode
);
1531 if (!ea_inode_cache
)
1534 ce
= mb_cache_entry_find_first(ea_inode_cache
, hash
);
1538 WARN_ON_ONCE(ext4_handle_valid(journal_current_handle()) &&
1539 !(current
->flags
& PF_MEMALLOC_NOFS
));
1541 ea_data
= kvmalloc(value_len
, GFP_KERNEL
);
1543 mb_cache_entry_put(ea_inode_cache
, ce
);
1548 ea_inode
= ext4_iget(inode
->i_sb
, ce
->e_value
,
1549 EXT4_IGET_EA_INODE
);
1550 if (IS_ERR(ea_inode
))
1552 ext4_xattr_inode_set_class(ea_inode
);
1553 if (i_size_read(ea_inode
) == value_len
&&
1554 !ext4_xattr_inode_read(ea_inode
, ea_data
, value_len
) &&
1555 !ext4_xattr_inode_verify_hashes(ea_inode
, NULL
, ea_data
,
1557 !memcmp(value
, ea_data
, value_len
)) {
1558 mb_cache_entry_touch(ea_inode_cache
, ce
);
1559 mb_cache_entry_put(ea_inode_cache
, ce
);
1565 ce
= mb_cache_entry_find_next(ea_inode_cache
, ce
);
1572 * Add value of the EA in an inode.
1574 static struct inode
*ext4_xattr_inode_lookup_create(handle_t
*handle
,
1575 struct inode
*inode
, const void *value
, size_t value_len
)
1577 struct inode
*ea_inode
;
1581 /* Account inode & space to quota even if sharing... */
1582 err
= ext4_xattr_inode_alloc_quota(inode
, value_len
);
1584 return ERR_PTR(err
);
1586 hash
= ext4_xattr_inode_hash(EXT4_SB(inode
->i_sb
), value
, value_len
);
1587 ea_inode
= ext4_xattr_inode_cache_find(inode
, value
, value_len
, hash
);
1589 err
= ext4_xattr_inode_inc_ref(handle
, ea_inode
);
1595 /* Create an inode for the EA value */
1596 ea_inode
= ext4_xattr_inode_create(handle
, inode
, hash
);
1597 if (IS_ERR(ea_inode
)) {
1598 ext4_xattr_inode_free_quota(inode
, NULL
, value_len
);
1602 err
= ext4_xattr_inode_write(handle
, ea_inode
, value
, value_len
);
1604 if (ext4_xattr_inode_dec_ref(handle
, ea_inode
))
1605 ext4_warning_inode(ea_inode
, "cleanup dec ref error %d", err
);
1609 if (EA_INODE_CACHE(inode
))
1610 mb_cache_entry_create(EA_INODE_CACHE(inode
), GFP_NOFS
, hash
,
1611 ea_inode
->i_ino
, true /* reusable */);
1615 ext4_xattr_inode_free_quota(inode
, NULL
, value_len
);
1616 return ERR_PTR(err
);
1620 * Reserve min(block_size/8, 1024) bytes for xattr entries/names if ea_inode
1621 * feature is enabled.
1623 #define EXT4_XATTR_BLOCK_RESERVE(inode) min(i_blocksize(inode)/8, 1024U)
1625 static int ext4_xattr_set_entry(struct ext4_xattr_info
*i
,
1626 struct ext4_xattr_search
*s
,
1627 handle_t
*handle
, struct inode
*inode
,
1628 struct inode
*new_ea_inode
,
1631 struct ext4_xattr_entry
*last
, *next
;
1632 struct ext4_xattr_entry
*here
= s
->here
;
1633 size_t min_offs
= s
->end
- s
->base
, name_len
= strlen(i
->name
);
1634 int in_inode
= i
->in_inode
;
1635 struct inode
*old_ea_inode
= NULL
;
1636 size_t old_size
, new_size
;
1639 /* Space used by old and new values. */
1640 old_size
= (!s
->not_found
&& !here
->e_value_inum
) ?
1641 EXT4_XATTR_SIZE(le32_to_cpu(here
->e_value_size
)) : 0;
1642 new_size
= (i
->value
&& !in_inode
) ? EXT4_XATTR_SIZE(i
->value_len
) : 0;
1645 * Optimization for the simple case when old and new values have the
1646 * same padded sizes. Not applicable if external inodes are involved.
1648 if (new_size
&& new_size
== old_size
) {
1649 size_t offs
= le16_to_cpu(here
->e_value_offs
);
1650 void *val
= s
->base
+ offs
;
1652 here
->e_value_size
= cpu_to_le32(i
->value_len
);
1653 if (i
->value
== EXT4_ZERO_XATTR_VALUE
) {
1654 memset(val
, 0, new_size
);
1656 memcpy(val
, i
->value
, i
->value_len
);
1657 /* Clear padding bytes. */
1658 memset(val
+ i
->value_len
, 0, new_size
- i
->value_len
);
1663 /* Compute min_offs and last. */
1665 for (; !IS_LAST_ENTRY(last
); last
= next
) {
1666 next
= EXT4_XATTR_NEXT(last
);
1667 if ((void *)next
>= s
->end
) {
1668 EXT4_ERROR_INODE(inode
, "corrupted xattr entries");
1669 ret
= -EFSCORRUPTED
;
1672 if (!last
->e_value_inum
&& last
->e_value_size
) {
1673 size_t offs
= le16_to_cpu(last
->e_value_offs
);
1674 if (offs
< min_offs
)
1679 /* Check whether we have enough space. */
1683 free
= min_offs
- ((void *)last
- s
->base
) - sizeof(__u32
);
1685 free
+= EXT4_XATTR_LEN(name_len
) + old_size
;
1687 if (free
< EXT4_XATTR_LEN(name_len
) + new_size
) {
1693 * If storing the value in an external inode is an option,
1694 * reserve space for xattr entries/names in the external
1695 * attribute block so that a long value does not occupy the
1696 * whole space and prevent further entries being added.
1698 if (ext4_has_feature_ea_inode(inode
->i_sb
) &&
1699 new_size
&& is_block
&&
1700 (min_offs
+ old_size
- new_size
) <
1701 EXT4_XATTR_BLOCK_RESERVE(inode
)) {
1708 * Getting access to old and new ea inodes is subject to failures.
1709 * Finish that work before doing any modifications to the xattr data.
1711 if (!s
->not_found
&& here
->e_value_inum
) {
1712 ret
= ext4_xattr_inode_iget(inode
,
1713 le32_to_cpu(here
->e_value_inum
),
1714 le32_to_cpu(here
->e_hash
),
1717 old_ea_inode
= NULL
;
1721 /* We are ready to release ref count on the old_ea_inode. */
1722 ret
= ext4_xattr_inode_dec_ref(handle
, old_ea_inode
);
1726 ext4_xattr_inode_free_quota(inode
, old_ea_inode
,
1727 le32_to_cpu(here
->e_value_size
));
1730 /* No failures allowed past this point. */
1732 if (!s
->not_found
&& here
->e_value_size
&& !here
->e_value_inum
) {
1733 /* Remove the old value. */
1734 void *first_val
= s
->base
+ min_offs
;
1735 size_t offs
= le16_to_cpu(here
->e_value_offs
);
1736 void *val
= s
->base
+ offs
;
1738 memmove(first_val
+ old_size
, first_val
, val
- first_val
);
1739 memset(first_val
, 0, old_size
);
1740 min_offs
+= old_size
;
1742 /* Adjust all value offsets. */
1744 while (!IS_LAST_ENTRY(last
)) {
1745 size_t o
= le16_to_cpu(last
->e_value_offs
);
1747 if (!last
->e_value_inum
&&
1748 last
->e_value_size
&& o
< offs
)
1749 last
->e_value_offs
= cpu_to_le16(o
+ old_size
);
1750 last
= EXT4_XATTR_NEXT(last
);
1755 /* Remove old name. */
1756 size_t size
= EXT4_XATTR_LEN(name_len
);
1758 last
= ENTRY((void *)last
- size
);
1759 memmove(here
, (void *)here
+ size
,
1760 (void *)last
- (void *)here
+ sizeof(__u32
));
1761 memset(last
, 0, size
);
1764 * Update i_inline_off - moved ibody region might contain
1765 * system.data attribute. Handling a failure here won't
1766 * cause other complications for setting an xattr.
1768 if (!is_block
&& ext4_has_inline_data(inode
)) {
1769 ret
= ext4_find_inline_data_nolock(inode
);
1771 ext4_warning_inode(inode
,
1772 "unable to update i_inline_off");
1776 } else if (s
->not_found
) {
1777 /* Insert new name. */
1778 size_t size
= EXT4_XATTR_LEN(name_len
);
1779 size_t rest
= (void *)last
- (void *)here
+ sizeof(__u32
);
1781 memmove((void *)here
+ size
, here
, rest
);
1782 memset(here
, 0, size
);
1783 here
->e_name_index
= i
->name_index
;
1784 here
->e_name_len
= name_len
;
1785 memcpy(here
->e_name
, i
->name
, name_len
);
1787 /* This is an update, reset value info. */
1788 here
->e_value_inum
= 0;
1789 here
->e_value_offs
= 0;
1790 here
->e_value_size
= 0;
1794 /* Insert new value. */
1796 here
->e_value_inum
= cpu_to_le32(new_ea_inode
->i_ino
);
1797 } else if (i
->value_len
) {
1798 void *val
= s
->base
+ min_offs
- new_size
;
1800 here
->e_value_offs
= cpu_to_le16(min_offs
- new_size
);
1801 if (i
->value
== EXT4_ZERO_XATTR_VALUE
) {
1802 memset(val
, 0, new_size
);
1804 memcpy(val
, i
->value
, i
->value_len
);
1805 /* Clear padding bytes. */
1806 memset(val
+ i
->value_len
, 0,
1807 new_size
- i
->value_len
);
1810 here
->e_value_size
= cpu_to_le32(i
->value_len
);
1817 /* Entry hash calculation. */
1822 * Feed crc32c hash instead of the raw value for entry
1823 * hash calculation. This is to avoid walking
1824 * potentially long value buffer again.
1826 crc32c_hash
= cpu_to_le32(
1827 ext4_xattr_inode_get_hash(new_ea_inode
));
1828 hash
= ext4_xattr_hash_entry(here
->e_name
,
1831 } else if (is_block
) {
1832 __le32
*value
= s
->base
+ le16_to_cpu(
1833 here
->e_value_offs
);
1835 hash
= ext4_xattr_hash_entry(here
->e_name
,
1836 here
->e_name_len
, value
,
1839 here
->e_hash
= hash
;
1843 ext4_xattr_rehash((struct ext4_xattr_header
*)s
->base
);
1851 struct ext4_xattr_block_find
{
1852 struct ext4_xattr_search s
;
1853 struct buffer_head
*bh
;
1857 ext4_xattr_block_find(struct inode
*inode
, struct ext4_xattr_info
*i
,
1858 struct ext4_xattr_block_find
*bs
)
1860 struct super_block
*sb
= inode
->i_sb
;
1863 ea_idebug(inode
, "name=%d.%s, value=%p, value_len=%ld",
1864 i
->name_index
, i
->name
, i
->value
, (long)i
->value_len
);
1866 if (EXT4_I(inode
)->i_file_acl
) {
1867 /* The inode already has an extended attribute block. */
1868 bs
->bh
= ext4_sb_bread(sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
1869 if (IS_ERR(bs
->bh
)) {
1870 error
= PTR_ERR(bs
->bh
);
1874 ea_bdebug(bs
->bh
, "b_count=%d, refcount=%d",
1875 atomic_read(&(bs
->bh
->b_count
)),
1876 le32_to_cpu(BHDR(bs
->bh
)->h_refcount
));
1877 error
= ext4_xattr_check_block(inode
, bs
->bh
);
1880 /* Find the named attribute. */
1881 bs
->s
.base
= BHDR(bs
->bh
);
1882 bs
->s
.first
= BFIRST(bs
->bh
);
1883 bs
->s
.end
= bs
->bh
->b_data
+ bs
->bh
->b_size
;
1884 bs
->s
.here
= bs
->s
.first
;
1885 error
= xattr_find_entry(inode
, &bs
->s
.here
, bs
->s
.end
,
1886 i
->name_index
, i
->name
, 1);
1887 if (error
&& error
!= -ENODATA
)
1889 bs
->s
.not_found
= error
;
1895 ext4_xattr_block_set(handle_t
*handle
, struct inode
*inode
,
1896 struct ext4_xattr_info
*i
,
1897 struct ext4_xattr_block_find
*bs
)
1899 struct super_block
*sb
= inode
->i_sb
;
1900 struct buffer_head
*new_bh
= NULL
;
1901 struct ext4_xattr_search s_copy
= bs
->s
;
1902 struct ext4_xattr_search
*s
= &s_copy
;
1903 struct mb_cache_entry
*ce
= NULL
;
1905 struct mb_cache
*ea_block_cache
= EA_BLOCK_CACHE(inode
);
1906 struct inode
*ea_inode
= NULL
, *tmp_inode
;
1907 size_t old_ea_inode_quota
= 0;
1908 unsigned int ea_ino
;
1910 #define header(x) ((struct ext4_xattr_header *)(x))
1912 /* If we need EA inode, prepare it before locking the buffer */
1913 if (i
->value
&& i
->in_inode
) {
1914 WARN_ON_ONCE(!i
->value_len
);
1916 ea_inode
= ext4_xattr_inode_lookup_create(handle
, inode
,
1917 i
->value
, i
->value_len
);
1918 if (IS_ERR(ea_inode
)) {
1919 error
= PTR_ERR(ea_inode
);
1926 int offset
= (char *)s
->here
- bs
->bh
->b_data
;
1928 BUFFER_TRACE(bs
->bh
, "get_write_access");
1929 error
= ext4_journal_get_write_access(handle
, sb
, bs
->bh
,
1934 lock_buffer(bs
->bh
);
1936 if (header(s
->base
)->h_refcount
== cpu_to_le32(1)) {
1937 __u32 hash
= le32_to_cpu(BHDR(bs
->bh
)->h_hash
);
1940 * This must happen under buffer lock for
1941 * ext4_xattr_block_set() to reliably detect modified
1944 if (ea_block_cache
) {
1945 struct mb_cache_entry
*oe
;
1947 oe
= mb_cache_entry_delete_or_get(ea_block_cache
,
1948 hash
, bs
->bh
->b_blocknr
);
1951 * Xattr block is getting reused. Leave
1954 mb_cache_entry_put(ea_block_cache
, oe
);
1958 ea_bdebug(bs
->bh
, "modifying in-place");
1959 error
= ext4_xattr_set_entry(i
, s
, handle
, inode
,
1960 ea_inode
, true /* is_block */);
1961 ext4_xattr_block_csum_set(inode
, bs
->bh
);
1962 unlock_buffer(bs
->bh
);
1963 if (error
== -EFSCORRUPTED
)
1966 error
= ext4_handle_dirty_metadata(handle
,
1974 unlock_buffer(bs
->bh
);
1975 ea_bdebug(bs
->bh
, "cloning");
1976 s
->base
= kmemdup(BHDR(bs
->bh
), bs
->bh
->b_size
, GFP_NOFS
);
1978 if (s
->base
== NULL
)
1980 s
->first
= ENTRY(header(s
->base
)+1);
1981 header(s
->base
)->h_refcount
= cpu_to_le32(1);
1982 s
->here
= ENTRY(s
->base
+ offset
);
1983 s
->end
= s
->base
+ bs
->bh
->b_size
;
1986 * If existing entry points to an xattr inode, we need
1987 * to prevent ext4_xattr_set_entry() from decrementing
1988 * ref count on it because the reference belongs to the
1989 * original block. In this case, make the entry look
1990 * like it has an empty value.
1992 if (!s
->not_found
&& s
->here
->e_value_inum
) {
1993 ea_ino
= le32_to_cpu(s
->here
->e_value_inum
);
1994 error
= ext4_xattr_inode_iget(inode
, ea_ino
,
1995 le32_to_cpu(s
->here
->e_hash
),
2000 if (!ext4_test_inode_state(tmp_inode
,
2001 EXT4_STATE_LUSTRE_EA_INODE
)) {
2003 * Defer quota free call for previous
2004 * inode until success is guaranteed.
2006 old_ea_inode_quota
= le32_to_cpu(
2007 s
->here
->e_value_size
);
2011 s
->here
->e_value_inum
= 0;
2012 s
->here
->e_value_size
= 0;
2015 /* Allocate a buffer where we construct the new block. */
2016 s
->base
= kzalloc(sb
->s_blocksize
, GFP_NOFS
);
2018 if (s
->base
== NULL
)
2020 header(s
->base
)->h_magic
= cpu_to_le32(EXT4_XATTR_MAGIC
);
2021 header(s
->base
)->h_blocks
= cpu_to_le32(1);
2022 header(s
->base
)->h_refcount
= cpu_to_le32(1);
2023 s
->first
= ENTRY(header(s
->base
)+1);
2024 s
->here
= ENTRY(header(s
->base
)+1);
2025 s
->end
= s
->base
+ sb
->s_blocksize
;
2028 error
= ext4_xattr_set_entry(i
, s
, handle
, inode
, ea_inode
,
2029 true /* is_block */);
2030 if (error
== -EFSCORRUPTED
)
2036 if (!IS_LAST_ENTRY(s
->first
)) {
2037 new_bh
= ext4_xattr_block_cache_find(inode
, header(s
->base
), &ce
);
2038 if (IS_ERR(new_bh
)) {
2039 error
= PTR_ERR(new_bh
);
2045 /* We found an identical block in the cache. */
2046 if (new_bh
== bs
->bh
)
2047 ea_bdebug(new_bh
, "keeping");
2051 #ifdef EXT4_XATTR_DEBUG
2052 WARN_ON_ONCE(dquot_initialize_needed(inode
));
2054 /* The old block is released after updating
2056 error
= dquot_alloc_block(inode
,
2057 EXT4_C2B(EXT4_SB(sb
), 1));
2060 BUFFER_TRACE(new_bh
, "get_write_access");
2061 error
= ext4_journal_get_write_access(
2066 lock_buffer(new_bh
);
2068 * We have to be careful about races with
2069 * adding references to xattr block. Once we
2070 * hold buffer lock xattr block's state is
2071 * stable so we can check the additional
2074 ref
= le32_to_cpu(BHDR(new_bh
)->h_refcount
) + 1;
2075 if (ref
> EXT4_XATTR_REFCOUNT_MAX
) {
2077 * Undo everything and check mbcache
2080 unlock_buffer(new_bh
);
2081 dquot_free_block(inode
,
2082 EXT4_C2B(EXT4_SB(sb
),
2085 mb_cache_entry_put(ea_block_cache
, ce
);
2090 BHDR(new_bh
)->h_refcount
= cpu_to_le32(ref
);
2091 if (ref
== EXT4_XATTR_REFCOUNT_MAX
)
2092 clear_bit(MBE_REUSABLE_B
, &ce
->e_flags
);
2093 ea_bdebug(new_bh
, "reusing; refcount now=%d",
2095 ext4_xattr_block_csum_set(inode
, new_bh
);
2096 unlock_buffer(new_bh
);
2097 error
= ext4_handle_dirty_metadata(handle
,
2103 mb_cache_entry_touch(ea_block_cache
, ce
);
2104 mb_cache_entry_put(ea_block_cache
, ce
);
2106 } else if (bs
->bh
&& s
->base
== bs
->bh
->b_data
) {
2107 /* We were modifying this block in-place. */
2108 ea_bdebug(bs
->bh
, "keeping this block");
2109 ext4_xattr_block_cache_insert(ea_block_cache
, bs
->bh
);
2113 /* We need to allocate a new block */
2114 ext4_fsblk_t goal
, block
;
2116 #ifdef EXT4_XATTR_DEBUG
2117 WARN_ON_ONCE(dquot_initialize_needed(inode
));
2119 goal
= ext4_group_first_block_no(sb
,
2120 EXT4_I(inode
)->i_block_group
);
2121 block
= ext4_new_meta_blocks(handle
, inode
, goal
, 0,
2126 ea_idebug(inode
, "creating block %llu",
2127 (unsigned long long)block
);
2129 new_bh
= sb_getblk(sb
, block
);
2130 if (unlikely(!new_bh
)) {
2133 ext4_free_blocks(handle
, inode
, NULL
, block
, 1,
2134 EXT4_FREE_BLOCKS_METADATA
);
2137 error
= ext4_xattr_inode_inc_ref_all(handle
, inode
,
2138 ENTRY(header(s
->base
)+1));
2142 /* Drop the extra ref on ea_inode. */
2143 error
= ext4_xattr_inode_dec_ref(handle
,
2146 ext4_warning_inode(ea_inode
,
2153 lock_buffer(new_bh
);
2154 error
= ext4_journal_get_create_access(handle
, sb
,
2155 new_bh
, EXT4_JTR_NONE
);
2157 unlock_buffer(new_bh
);
2161 memcpy(new_bh
->b_data
, s
->base
, new_bh
->b_size
);
2162 ext4_xattr_block_csum_set(inode
, new_bh
);
2163 set_buffer_uptodate(new_bh
);
2164 unlock_buffer(new_bh
);
2165 ext4_xattr_block_cache_insert(ea_block_cache
, new_bh
);
2166 error
= ext4_handle_dirty_metadata(handle
, inode
,
2173 if (old_ea_inode_quota
)
2174 ext4_xattr_inode_free_quota(inode
, NULL
, old_ea_inode_quota
);
2176 /* Update the inode. */
2177 EXT4_I(inode
)->i_file_acl
= new_bh
? new_bh
->b_blocknr
: 0;
2179 /* Drop the previous xattr block. */
2180 if (bs
->bh
&& bs
->bh
!= new_bh
) {
2181 struct ext4_xattr_inode_array
*ea_inode_array
= NULL
;
2183 ext4_xattr_release_block(handle
, inode
, bs
->bh
,
2185 0 /* extra_credits */);
2186 ext4_xattr_inode_array_free(ea_inode_array
);
2195 error2
= ext4_xattr_inode_dec_ref(handle
, ea_inode
);
2197 ext4_warning_inode(ea_inode
, "dec ref error=%d",
2199 ext4_xattr_inode_free_quota(inode
, ea_inode
,
2200 i_size_read(ea_inode
));
2205 mb_cache_entry_put(ea_block_cache
, ce
);
2207 if (!(bs
->bh
&& s
->base
== bs
->bh
->b_data
))
2213 dquot_free_block(inode
, EXT4_C2B(EXT4_SB(sb
), 1));
2217 EXT4_ERROR_INODE(inode
, "bad block %llu",
2218 EXT4_I(inode
)->i_file_acl
);
2224 int ext4_xattr_ibody_find(struct inode
*inode
, struct ext4_xattr_info
*i
,
2225 struct ext4_xattr_ibody_find
*is
)
2227 struct ext4_xattr_ibody_header
*header
;
2228 struct ext4_inode
*raw_inode
;
2231 if (!EXT4_INODE_HAS_XATTR_SPACE(inode
))
2234 raw_inode
= ext4_raw_inode(&is
->iloc
);
2235 header
= IHDR(inode
, raw_inode
);
2236 is
->s
.base
= is
->s
.first
= IFIRST(header
);
2237 is
->s
.here
= is
->s
.first
;
2238 is
->s
.end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
2239 if (ext4_test_inode_state(inode
, EXT4_STATE_XATTR
)) {
2240 error
= xattr_check_inode(inode
, header
, is
->s
.end
);
2243 /* Find the named attribute. */
2244 error
= xattr_find_entry(inode
, &is
->s
.here
, is
->s
.end
,
2245 i
->name_index
, i
->name
, 0);
2246 if (error
&& error
!= -ENODATA
)
2248 is
->s
.not_found
= error
;
2253 int ext4_xattr_ibody_set(handle_t
*handle
, struct inode
*inode
,
2254 struct ext4_xattr_info
*i
,
2255 struct ext4_xattr_ibody_find
*is
)
2257 struct ext4_xattr_ibody_header
*header
;
2258 struct ext4_xattr_search
*s
= &is
->s
;
2259 struct inode
*ea_inode
= NULL
;
2262 if (!EXT4_INODE_HAS_XATTR_SPACE(inode
))
2265 /* If we need EA inode, prepare it before locking the buffer */
2266 if (i
->value
&& i
->in_inode
) {
2267 WARN_ON_ONCE(!i
->value_len
);
2269 ea_inode
= ext4_xattr_inode_lookup_create(handle
, inode
,
2270 i
->value
, i
->value_len
);
2271 if (IS_ERR(ea_inode
))
2272 return PTR_ERR(ea_inode
);
2274 error
= ext4_xattr_set_entry(i
, s
, handle
, inode
, ea_inode
,
2275 false /* is_block */);
2280 error2
= ext4_xattr_inode_dec_ref(handle
, ea_inode
);
2282 ext4_warning_inode(ea_inode
, "dec ref error=%d",
2285 ext4_xattr_inode_free_quota(inode
, ea_inode
,
2286 i_size_read(ea_inode
));
2291 header
= IHDR(inode
, ext4_raw_inode(&is
->iloc
));
2292 if (!IS_LAST_ENTRY(s
->first
)) {
2293 header
->h_magic
= cpu_to_le32(EXT4_XATTR_MAGIC
);
2294 ext4_set_inode_state(inode
, EXT4_STATE_XATTR
);
2296 header
->h_magic
= cpu_to_le32(0);
2297 ext4_clear_inode_state(inode
, EXT4_STATE_XATTR
);
2303 static int ext4_xattr_value_same(struct ext4_xattr_search
*s
,
2304 struct ext4_xattr_info
*i
)
2308 /* When e_value_inum is set the value is stored externally. */
2309 if (s
->here
->e_value_inum
)
2311 if (le32_to_cpu(s
->here
->e_value_size
) != i
->value_len
)
2313 value
= ((void *)s
->base
) + le16_to_cpu(s
->here
->e_value_offs
);
2314 return !memcmp(value
, i
->value
, i
->value_len
);
2317 static struct buffer_head
*ext4_xattr_get_block(struct inode
*inode
)
2319 struct buffer_head
*bh
;
2322 if (!EXT4_I(inode
)->i_file_acl
)
2324 bh
= ext4_sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
2327 error
= ext4_xattr_check_block(inode
, bh
);
2330 return ERR_PTR(error
);
2336 * ext4_xattr_set_handle()
2338 * Create, replace or remove an extended attribute for this inode. Value
2339 * is NULL to remove an existing extended attribute, and non-NULL to
2340 * either replace an existing extended attribute, or create a new extended
2341 * attribute. The flags XATTR_REPLACE and XATTR_CREATE
2342 * specify that an extended attribute must exist and must not exist
2343 * previous to the call, respectively.
2345 * Returns 0, or a negative error number on failure.
2348 ext4_xattr_set_handle(handle_t
*handle
, struct inode
*inode
, int name_index
,
2349 const char *name
, const void *value
, size_t value_len
,
2352 struct ext4_xattr_info i
= {
2353 .name_index
= name_index
,
2356 .value_len
= value_len
,
2359 struct ext4_xattr_ibody_find is
= {
2360 .s
= { .not_found
= -ENODATA
, },
2362 struct ext4_xattr_block_find bs
= {
2363 .s
= { .not_found
= -ENODATA
, },
2370 if (strlen(name
) > 255)
2373 ext4_write_lock_xattr(inode
, &no_expand
);
2375 /* Check journal credits under write lock. */
2376 if (ext4_handle_valid(handle
)) {
2377 struct buffer_head
*bh
;
2380 bh
= ext4_xattr_get_block(inode
);
2382 error
= PTR_ERR(bh
);
2386 credits
= __ext4_xattr_set_credits(inode
->i_sb
, inode
, bh
,
2388 flags
& XATTR_CREATE
);
2391 if (jbd2_handle_buffer_credits(handle
) < credits
) {
2395 WARN_ON_ONCE(!(current
->flags
& PF_MEMALLOC_NOFS
));
2398 error
= ext4_reserve_inode_write(handle
, inode
, &is
.iloc
);
2402 if (ext4_test_inode_state(inode
, EXT4_STATE_NEW
)) {
2403 struct ext4_inode
*raw_inode
= ext4_raw_inode(&is
.iloc
);
2404 memset(raw_inode
, 0, EXT4_SB(inode
->i_sb
)->s_inode_size
);
2405 ext4_clear_inode_state(inode
, EXT4_STATE_NEW
);
2408 error
= ext4_xattr_ibody_find(inode
, &i
, &is
);
2412 error
= ext4_xattr_block_find(inode
, &i
, &bs
);
2415 if (is
.s
.not_found
&& bs
.s
.not_found
) {
2417 if (flags
& XATTR_REPLACE
)
2424 if (flags
& XATTR_CREATE
)
2429 if (!is
.s
.not_found
)
2430 error
= ext4_xattr_ibody_set(handle
, inode
, &i
, &is
);
2431 else if (!bs
.s
.not_found
)
2432 error
= ext4_xattr_block_set(handle
, inode
, &i
, &bs
);
2435 /* Xattr value did not change? Save us some work and bail out */
2436 if (!is
.s
.not_found
&& ext4_xattr_value_same(&is
.s
, &i
))
2438 if (!bs
.s
.not_found
&& ext4_xattr_value_same(&bs
.s
, &i
))
2441 if (ext4_has_feature_ea_inode(inode
->i_sb
) &&
2442 (EXT4_XATTR_SIZE(i
.value_len
) >
2443 EXT4_XATTR_MIN_LARGE_EA_SIZE(inode
->i_sb
->s_blocksize
)))
2446 error
= ext4_xattr_ibody_set(handle
, inode
, &i
, &is
);
2447 if (!error
&& !bs
.s
.not_found
) {
2449 error
= ext4_xattr_block_set(handle
, inode
, &i
, &bs
);
2450 } else if (error
== -ENOSPC
) {
2451 if (EXT4_I(inode
)->i_file_acl
&& !bs
.s
.base
) {
2454 error
= ext4_xattr_block_find(inode
, &i
, &bs
);
2458 error
= ext4_xattr_block_set(handle
, inode
, &i
, &bs
);
2459 if (!error
&& !is
.s
.not_found
) {
2461 error
= ext4_xattr_ibody_set(handle
, inode
, &i
,
2463 } else if (error
== -ENOSPC
) {
2465 * Xattr does not fit in the block, store at
2466 * external inode if possible.
2468 if (ext4_has_feature_ea_inode(inode
->i_sb
) &&
2469 i
.value_len
&& !i
.in_inode
) {
2477 ext4_xattr_update_super_block(handle
, inode
->i_sb
);
2478 inode_set_ctime_current(inode
);
2479 inode_inc_iversion(inode
);
2482 error
= ext4_mark_iloc_dirty(handle
, inode
, &is
.iloc
);
2484 * The bh is consumed by ext4_mark_iloc_dirty, even with
2489 ext4_handle_sync(handle
);
2491 ext4_fc_mark_ineligible(inode
->i_sb
, EXT4_FC_REASON_XATTR
, handle
);
2496 ext4_write_unlock_xattr(inode
, &no_expand
);
2500 int ext4_xattr_set_credits(struct inode
*inode
, size_t value_len
,
2501 bool is_create
, int *credits
)
2503 struct buffer_head
*bh
;
2508 if (!EXT4_SB(inode
->i_sb
)->s_journal
)
2511 down_read(&EXT4_I(inode
)->xattr_sem
);
2513 bh
= ext4_xattr_get_block(inode
);
2517 *credits
= __ext4_xattr_set_credits(inode
->i_sb
, inode
, bh
,
2518 value_len
, is_create
);
2523 up_read(&EXT4_I(inode
)->xattr_sem
);
2530 * Like ext4_xattr_set_handle, but start from an inode. This extended
2531 * attribute modification is a filesystem transaction by itself.
2533 * Returns 0, or a negative error number on failure.
2536 ext4_xattr_set(struct inode
*inode
, int name_index
, const char *name
,
2537 const void *value
, size_t value_len
, int flags
)
2540 struct super_block
*sb
= inode
->i_sb
;
2541 int error
, retries
= 0;
2544 error
= dquot_initialize(inode
);
2549 error
= ext4_xattr_set_credits(inode
, value_len
, flags
& XATTR_CREATE
,
2554 handle
= ext4_journal_start(inode
, EXT4_HT_XATTR
, credits
);
2555 if (IS_ERR(handle
)) {
2556 error
= PTR_ERR(handle
);
2560 error
= ext4_xattr_set_handle(handle
, inode
, name_index
, name
,
2561 value
, value_len
, flags
);
2562 ext4_fc_mark_ineligible(inode
->i_sb
, EXT4_FC_REASON_XATTR
,
2564 error2
= ext4_journal_stop(handle
);
2565 if (error
== -ENOSPC
&&
2566 ext4_should_retry_alloc(sb
, &retries
))
2576 * Shift the EA entries in the inode to create space for the increased
2579 static void ext4_xattr_shift_entries(struct ext4_xattr_entry
*entry
,
2580 int value_offs_shift
, void *to
,
2581 void *from
, size_t n
)
2583 struct ext4_xattr_entry
*last
= entry
;
2586 /* We always shift xattr headers further thus offsets get lower */
2587 BUG_ON(value_offs_shift
> 0);
2589 /* Adjust the value offsets of the entries */
2590 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
2591 if (!last
->e_value_inum
&& last
->e_value_size
) {
2592 new_offs
= le16_to_cpu(last
->e_value_offs
) +
2594 last
->e_value_offs
= cpu_to_le16(new_offs
);
2597 /* Shift the entries by n bytes */
2598 memmove(to
, from
, n
);
2602 * Move xattr pointed to by 'entry' from inode into external xattr block
2604 static int ext4_xattr_move_to_block(handle_t
*handle
, struct inode
*inode
,
2605 struct ext4_inode
*raw_inode
,
2606 struct ext4_xattr_entry
*entry
)
2608 struct ext4_xattr_ibody_find
*is
= NULL
;
2609 struct ext4_xattr_block_find
*bs
= NULL
;
2610 char *buffer
= NULL
, *b_entry_name
= NULL
;
2611 size_t value_size
= le32_to_cpu(entry
->e_value_size
);
2612 struct ext4_xattr_info i
= {
2615 .name_index
= entry
->e_name_index
,
2616 .in_inode
= !!entry
->e_value_inum
,
2618 struct ext4_xattr_ibody_header
*header
= IHDR(inode
, raw_inode
);
2619 int needs_kvfree
= 0;
2622 is
= kzalloc(sizeof(struct ext4_xattr_ibody_find
), GFP_NOFS
);
2623 bs
= kzalloc(sizeof(struct ext4_xattr_block_find
), GFP_NOFS
);
2624 b_entry_name
= kmalloc(entry
->e_name_len
+ 1, GFP_NOFS
);
2625 if (!is
|| !bs
|| !b_entry_name
) {
2630 is
->s
.not_found
= -ENODATA
;
2631 bs
->s
.not_found
= -ENODATA
;
2635 /* Save the entry name and the entry value */
2636 if (entry
->e_value_inum
) {
2637 buffer
= kvmalloc(value_size
, GFP_NOFS
);
2643 error
= ext4_xattr_inode_get(inode
, entry
, buffer
, value_size
);
2647 size_t value_offs
= le16_to_cpu(entry
->e_value_offs
);
2648 buffer
= (void *)IFIRST(header
) + value_offs
;
2651 memcpy(b_entry_name
, entry
->e_name
, entry
->e_name_len
);
2652 b_entry_name
[entry
->e_name_len
] = '\0';
2653 i
.name
= b_entry_name
;
2655 error
= ext4_get_inode_loc(inode
, &is
->iloc
);
2659 error
= ext4_xattr_ibody_find(inode
, &i
, is
);
2664 i
.value_len
= value_size
;
2665 error
= ext4_xattr_block_find(inode
, &i
, bs
);
2669 /* Move ea entry from the inode into the block */
2670 error
= ext4_xattr_block_set(handle
, inode
, &i
, bs
);
2674 /* Remove the chosen entry from the inode */
2677 error
= ext4_xattr_ibody_set(handle
, inode
, &i
, is
);
2680 kfree(b_entry_name
);
2681 if (needs_kvfree
&& buffer
)
2684 brelse(is
->iloc
.bh
);
2693 static int ext4_xattr_make_inode_space(handle_t
*handle
, struct inode
*inode
,
2694 struct ext4_inode
*raw_inode
,
2695 int isize_diff
, size_t ifree
,
2696 size_t bfree
, int *total_ino
)
2698 struct ext4_xattr_ibody_header
*header
= IHDR(inode
, raw_inode
);
2699 struct ext4_xattr_entry
*small_entry
;
2700 struct ext4_xattr_entry
*entry
;
2701 struct ext4_xattr_entry
*last
;
2702 unsigned int entry_size
; /* EA entry size */
2703 unsigned int total_size
; /* EA entry size + value size */
2704 unsigned int min_total_size
;
2707 while (isize_diff
> ifree
) {
2710 min_total_size
= ~0U;
2711 last
= IFIRST(header
);
2712 /* Find the entry best suited to be pushed into EA block */
2713 for (; !IS_LAST_ENTRY(last
); last
= EXT4_XATTR_NEXT(last
)) {
2714 /* never move system.data out of the inode */
2715 if ((last
->e_name_len
== 4) &&
2716 (last
->e_name_index
== EXT4_XATTR_INDEX_SYSTEM
) &&
2717 !memcmp(last
->e_name
, "data", 4))
2719 total_size
= EXT4_XATTR_LEN(last
->e_name_len
);
2720 if (!last
->e_value_inum
)
2721 total_size
+= EXT4_XATTR_SIZE(
2722 le32_to_cpu(last
->e_value_size
));
2723 if (total_size
<= bfree
&&
2724 total_size
< min_total_size
) {
2725 if (total_size
+ ifree
< isize_diff
) {
2729 min_total_size
= total_size
;
2734 if (entry
== NULL
) {
2735 if (small_entry
== NULL
)
2737 entry
= small_entry
;
2740 entry_size
= EXT4_XATTR_LEN(entry
->e_name_len
);
2741 total_size
= entry_size
;
2742 if (!entry
->e_value_inum
)
2743 total_size
+= EXT4_XATTR_SIZE(
2744 le32_to_cpu(entry
->e_value_size
));
2745 error
= ext4_xattr_move_to_block(handle
, inode
, raw_inode
,
2750 *total_ino
-= entry_size
;
2751 ifree
+= total_size
;
2752 bfree
-= total_size
;
2759 * Expand an inode by new_extra_isize bytes when EAs are present.
2760 * Returns 0 on success or negative error number on failure.
2762 int ext4_expand_extra_isize_ea(struct inode
*inode
, int new_extra_isize
,
2763 struct ext4_inode
*raw_inode
, handle_t
*handle
)
2765 struct ext4_xattr_ibody_header
*header
;
2766 struct ext4_sb_info
*sbi
= EXT4_SB(inode
->i_sb
);
2767 static unsigned int mnt_count
;
2769 size_t ifree
, bfree
;
2772 int error
= 0, tried_min_extra_isize
= 0;
2773 int s_min_extra_isize
= le16_to_cpu(sbi
->s_es
->s_min_extra_isize
);
2774 int isize_diff
; /* How much do we need to grow i_extra_isize */
2777 isize_diff
= new_extra_isize
- EXT4_I(inode
)->i_extra_isize
;
2778 if (EXT4_I(inode
)->i_extra_isize
>= new_extra_isize
)
2781 header
= IHDR(inode
, raw_inode
);
2784 * Check if enough free space is available in the inode to shift the
2785 * entries ahead by new_extra_isize.
2788 base
= IFIRST(header
);
2789 end
= (void *)raw_inode
+ EXT4_SB(inode
->i_sb
)->s_inode_size
;
2790 min_offs
= end
- base
;
2791 total_ino
= sizeof(struct ext4_xattr_ibody_header
) + sizeof(u32
);
2793 error
= xattr_check_inode(inode
, header
, end
);
2797 ifree
= ext4_xattr_free_space(base
, &min_offs
, base
, &total_ino
);
2798 if (ifree
>= isize_diff
)
2802 * Enough free space isn't available in the inode, check if
2803 * EA block can hold new_extra_isize bytes.
2805 if (EXT4_I(inode
)->i_file_acl
) {
2806 struct buffer_head
*bh
;
2808 bh
= ext4_sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
2810 error
= PTR_ERR(bh
);
2813 error
= ext4_xattr_check_block(inode
, bh
);
2819 end
= bh
->b_data
+ bh
->b_size
;
2820 min_offs
= end
- base
;
2821 bfree
= ext4_xattr_free_space(BFIRST(bh
), &min_offs
, base
,
2824 if (bfree
+ ifree
< isize_diff
) {
2825 if (!tried_min_extra_isize
&& s_min_extra_isize
) {
2826 tried_min_extra_isize
++;
2827 new_extra_isize
= s_min_extra_isize
;
2834 bfree
= inode
->i_sb
->s_blocksize
;
2837 error
= ext4_xattr_make_inode_space(handle
, inode
, raw_inode
,
2838 isize_diff
, ifree
, bfree
,
2841 if (error
== -ENOSPC
&& !tried_min_extra_isize
&&
2842 s_min_extra_isize
) {
2843 tried_min_extra_isize
++;
2844 new_extra_isize
= s_min_extra_isize
;
2850 /* Adjust the offsets and shift the remaining entries ahead */
2851 ext4_xattr_shift_entries(IFIRST(header
), EXT4_I(inode
)->i_extra_isize
2852 - new_extra_isize
, (void *)raw_inode
+
2853 EXT4_GOOD_OLD_INODE_SIZE
+ new_extra_isize
,
2854 (void *)header
, total_ino
);
2855 EXT4_I(inode
)->i_extra_isize
= new_extra_isize
;
2857 if (ext4_has_inline_data(inode
))
2858 error
= ext4_find_inline_data_nolock(inode
);
2861 if (error
&& (mnt_count
!= le16_to_cpu(sbi
->s_es
->s_mnt_count
))) {
2862 ext4_warning(inode
->i_sb
, "Unable to expand inode %lu. Delete some EAs or run e2fsck.",
2864 mnt_count
= le16_to_cpu(sbi
->s_es
->s_mnt_count
);
2869 #define EIA_INCR 16 /* must be 2^n */
2870 #define EIA_MASK (EIA_INCR - 1)
2872 /* Add the large xattr @inode into @ea_inode_array for deferred iput().
2873 * If @ea_inode_array is new or full it will be grown and the old
2874 * contents copied over.
2877 ext4_expand_inode_array(struct ext4_xattr_inode_array
**ea_inode_array
,
2878 struct inode
*inode
)
2880 if (*ea_inode_array
== NULL
) {
2882 * Start with 15 inodes, so it fits into a power-of-two size.
2884 (*ea_inode_array
) = kmalloc(
2885 struct_size(*ea_inode_array
, inodes
, EIA_MASK
),
2887 if (*ea_inode_array
== NULL
)
2889 (*ea_inode_array
)->count
= 0;
2890 } else if (((*ea_inode_array
)->count
& EIA_MASK
) == EIA_MASK
) {
2891 /* expand the array once all 15 + n * 16 slots are full */
2892 struct ext4_xattr_inode_array
*new_array
= NULL
;
2894 new_array
= kmalloc(
2895 struct_size(*ea_inode_array
, inodes
,
2896 (*ea_inode_array
)->count
+ EIA_INCR
),
2898 if (new_array
== NULL
)
2900 memcpy(new_array
, *ea_inode_array
,
2901 struct_size(*ea_inode_array
, inodes
,
2902 (*ea_inode_array
)->count
));
2903 kfree(*ea_inode_array
);
2904 *ea_inode_array
= new_array
;
2906 (*ea_inode_array
)->count
++;
2907 (*ea_inode_array
)->inodes
[(*ea_inode_array
)->count
- 1] = inode
;
2912 * ext4_xattr_delete_inode()
2914 * Free extended attribute resources associated with this inode. Traverse
2915 * all entries and decrement reference on any xattr inodes associated with this
2916 * inode. This is called immediately before an inode is freed. We have exclusive
2917 * access to the inode. If an orphan inode is deleted it will also release its
2918 * references on xattr block and xattr inodes.
2920 int ext4_xattr_delete_inode(handle_t
*handle
, struct inode
*inode
,
2921 struct ext4_xattr_inode_array
**ea_inode_array
,
2924 struct buffer_head
*bh
= NULL
;
2925 struct ext4_xattr_ibody_header
*header
;
2926 struct ext4_iloc iloc
= { .bh
= NULL
};
2927 struct ext4_xattr_entry
*entry
;
2928 struct inode
*ea_inode
;
2931 error
= ext4_journal_ensure_credits(handle
, extra_credits
,
2932 ext4_free_metadata_revoke_credits(inode
->i_sb
, 1));
2934 EXT4_ERROR_INODE(inode
, "ensure credits (error %d)", error
);
2938 if (ext4_has_feature_ea_inode(inode
->i_sb
) &&
2939 ext4_test_inode_state(inode
, EXT4_STATE_XATTR
)) {
2941 error
= ext4_get_inode_loc(inode
, &iloc
);
2943 EXT4_ERROR_INODE(inode
, "inode loc (error %d)", error
);
2947 error
= ext4_journal_get_write_access(handle
, inode
->i_sb
,
2948 iloc
.bh
, EXT4_JTR_NONE
);
2950 EXT4_ERROR_INODE(inode
, "write access (error %d)",
2955 header
= IHDR(inode
, ext4_raw_inode(&iloc
));
2956 if (header
->h_magic
== cpu_to_le32(EXT4_XATTR_MAGIC
))
2957 ext4_xattr_inode_dec_ref_all(handle
, inode
, iloc
.bh
,
2959 false /* block_csum */,
2962 false /* skip_quota */);
2965 if (EXT4_I(inode
)->i_file_acl
) {
2966 bh
= ext4_sb_bread(inode
->i_sb
, EXT4_I(inode
)->i_file_acl
, REQ_PRIO
);
2968 error
= PTR_ERR(bh
);
2969 if (error
== -EIO
) {
2970 EXT4_ERROR_INODE_ERR(inode
, EIO
,
2971 "block %llu read error",
2972 EXT4_I(inode
)->i_file_acl
);
2977 error
= ext4_xattr_check_block(inode
, bh
);
2981 if (ext4_has_feature_ea_inode(inode
->i_sb
)) {
2982 for (entry
= BFIRST(bh
); !IS_LAST_ENTRY(entry
);
2983 entry
= EXT4_XATTR_NEXT(entry
)) {
2984 if (!entry
->e_value_inum
)
2986 error
= ext4_xattr_inode_iget(inode
,
2987 le32_to_cpu(entry
->e_value_inum
),
2988 le32_to_cpu(entry
->e_hash
),
2992 ext4_xattr_inode_free_quota(inode
, ea_inode
,
2993 le32_to_cpu(entry
->e_value_size
));
2999 ext4_xattr_release_block(handle
, inode
, bh
, ea_inode_array
,
3002 * Update i_file_acl value in the same transaction that releases
3005 EXT4_I(inode
)->i_file_acl
= 0;
3006 error
= ext4_mark_inode_dirty(handle
, inode
);
3008 EXT4_ERROR_INODE(inode
, "mark inode dirty (error %d)",
3012 ext4_fc_mark_ineligible(inode
->i_sb
, EXT4_FC_REASON_XATTR
, handle
);
3021 void ext4_xattr_inode_array_free(struct ext4_xattr_inode_array
*ea_inode_array
)
3025 if (ea_inode_array
== NULL
)
3028 for (idx
= 0; idx
< ea_inode_array
->count
; ++idx
)
3029 iput(ea_inode_array
->inodes
[idx
]);
3030 kfree(ea_inode_array
);
3034 * ext4_xattr_block_cache_insert()
3036 * Create a new entry in the extended attribute block cache, and insert
3037 * it unless such an entry is already in the cache.
3040 ext4_xattr_block_cache_insert(struct mb_cache
*ea_block_cache
,
3041 struct buffer_head
*bh
)
3043 struct ext4_xattr_header
*header
= BHDR(bh
);
3044 __u32 hash
= le32_to_cpu(header
->h_hash
);
3045 int reusable
= le32_to_cpu(header
->h_refcount
) <
3046 EXT4_XATTR_REFCOUNT_MAX
;
3049 if (!ea_block_cache
)
3051 error
= mb_cache_entry_create(ea_block_cache
, GFP_NOFS
, hash
,
3052 bh
->b_blocknr
, reusable
);
3054 if (error
== -EBUSY
)
3055 ea_bdebug(bh
, "already in cache");
3057 ea_bdebug(bh
, "inserting [%x]", (int)hash
);
3063 * Compare two extended attribute blocks for equality.
3065 * Returns 0 if the blocks are equal, 1 if they differ.
3068 ext4_xattr_cmp(struct ext4_xattr_header
*header1
,
3069 struct ext4_xattr_header
*header2
)
3071 struct ext4_xattr_entry
*entry1
, *entry2
;
3073 entry1
= ENTRY(header1
+1);
3074 entry2
= ENTRY(header2
+1);
3075 while (!IS_LAST_ENTRY(entry1
)) {
3076 if (IS_LAST_ENTRY(entry2
))
3078 if (entry1
->e_hash
!= entry2
->e_hash
||
3079 entry1
->e_name_index
!= entry2
->e_name_index
||
3080 entry1
->e_name_len
!= entry2
->e_name_len
||
3081 entry1
->e_value_size
!= entry2
->e_value_size
||
3082 entry1
->e_value_inum
!= entry2
->e_value_inum
||
3083 memcmp(entry1
->e_name
, entry2
->e_name
, entry1
->e_name_len
))
3085 if (!entry1
->e_value_inum
&&
3086 memcmp((char *)header1
+ le16_to_cpu(entry1
->e_value_offs
),
3087 (char *)header2
+ le16_to_cpu(entry2
->e_value_offs
),
3088 le32_to_cpu(entry1
->e_value_size
)))
3091 entry1
= EXT4_XATTR_NEXT(entry1
);
3092 entry2
= EXT4_XATTR_NEXT(entry2
);
3094 if (!IS_LAST_ENTRY(entry2
))
3100 * ext4_xattr_block_cache_find()
3102 * Find an identical extended attribute block.
3104 * Returns a pointer to the block found, or NULL if such a block was not
3105 * found, or an error pointer if an error occurred while reading ea block.
3107 static struct buffer_head
*
3108 ext4_xattr_block_cache_find(struct inode
*inode
,
3109 struct ext4_xattr_header
*header
,
3110 struct mb_cache_entry
**pce
)
3112 __u32 hash
= le32_to_cpu(header
->h_hash
);
3113 struct mb_cache_entry
*ce
;
3114 struct mb_cache
*ea_block_cache
= EA_BLOCK_CACHE(inode
);
3116 if (!ea_block_cache
)
3118 if (!header
->h_hash
)
3119 return NULL
; /* never share */
3120 ea_idebug(inode
, "looking for cached blocks [%x]", (int)hash
);
3121 ce
= mb_cache_entry_find_first(ea_block_cache
, hash
);
3123 struct buffer_head
*bh
;
3125 bh
= ext4_sb_bread(inode
->i_sb
, ce
->e_value
, REQ_PRIO
);
3127 if (PTR_ERR(bh
) != -ENOMEM
)
3128 EXT4_ERROR_INODE(inode
, "block %lu read error",
3129 (unsigned long)ce
->e_value
);
3130 mb_cache_entry_put(ea_block_cache
, ce
);
3132 } else if (ext4_xattr_cmp(header
, BHDR(bh
)) == 0) {
3137 ce
= mb_cache_entry_find_next(ea_block_cache
, ce
);
3142 #define NAME_HASH_SHIFT 5
3143 #define VALUE_HASH_SHIFT 16
3146 * ext4_xattr_hash_entry()
3148 * Compute the hash of an extended attribute.
3150 static __le32
ext4_xattr_hash_entry(char *name
, size_t name_len
, __le32
*value
,
3155 while (name_len
--) {
3156 hash
= (hash
<< NAME_HASH_SHIFT
) ^
3157 (hash
>> (8*sizeof(hash
) - NAME_HASH_SHIFT
)) ^
3158 (unsigned char)*name
++;
3160 while (value_count
--) {
3161 hash
= (hash
<< VALUE_HASH_SHIFT
) ^
3162 (hash
>> (8*sizeof(hash
) - VALUE_HASH_SHIFT
)) ^
3163 le32_to_cpu(*value
++);
3165 return cpu_to_le32(hash
);
3169 * ext4_xattr_hash_entry_signed()
3171 * Compute the hash of an extended attribute incorrectly.
3173 static __le32
ext4_xattr_hash_entry_signed(char *name
, size_t name_len
, __le32
*value
, size_t value_count
)
3177 while (name_len
--) {
3178 hash
= (hash
<< NAME_HASH_SHIFT
) ^
3179 (hash
>> (8*sizeof(hash
) - NAME_HASH_SHIFT
)) ^
3180 (signed char)*name
++;
3182 while (value_count
--) {
3183 hash
= (hash
<< VALUE_HASH_SHIFT
) ^
3184 (hash
>> (8*sizeof(hash
) - VALUE_HASH_SHIFT
)) ^
3185 le32_to_cpu(*value
++);
3187 return cpu_to_le32(hash
);
3190 #undef NAME_HASH_SHIFT
3191 #undef VALUE_HASH_SHIFT
3193 #define BLOCK_HASH_SHIFT 16
3196 * ext4_xattr_rehash()
3198 * Re-compute the extended attribute hash value after an entry has changed.
3200 static void ext4_xattr_rehash(struct ext4_xattr_header
*header
)
3202 struct ext4_xattr_entry
*here
;
3205 here
= ENTRY(header
+1);
3206 while (!IS_LAST_ENTRY(here
)) {
3207 if (!here
->e_hash
) {
3208 /* Block is not shared if an entry's hash value == 0 */
3212 hash
= (hash
<< BLOCK_HASH_SHIFT
) ^
3213 (hash
>> (8*sizeof(hash
) - BLOCK_HASH_SHIFT
)) ^
3214 le32_to_cpu(here
->e_hash
);
3215 here
= EXT4_XATTR_NEXT(here
);
3217 header
->h_hash
= cpu_to_le32(hash
);
3220 #undef BLOCK_HASH_SHIFT
3222 #define HASH_BUCKET_BITS 10
3225 ext4_xattr_create_cache(void)
3227 return mb_cache_create(HASH_BUCKET_BITS
);
3230 void ext4_xattr_destroy_cache(struct mb_cache
*cache
)
3233 mb_cache_destroy(cache
);