// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2011 Novell Inc.
 */

#include <linux/fs.h>
#include <linux/slab.h>
#include <linux/namei.h>
#include <linux/file.h>
#include <linux/xattr.h>
#include <linux/rbtree.h>
#include <linux/security.h>
#include <linux/cred.h>
#include <linux/ratelimit.h>
#include "overlayfs.h"
struct ovl_cache_entry {
	unsigned int len;
	unsigned int type;
	u64 real_ino;
	u64 ino;
	struct list_head l_node;
	struct rb_node node;
	struct ovl_cache_entry *next_maybe_whiteout;
	bool is_upper;
	bool is_whiteout;
	char name[];
};
struct ovl_dir_cache {
	long refcount;
	u64 version;
	struct list_head entries;
	struct rb_root root;
};
struct ovl_readdir_data {
	struct dir_context ctx;
	struct dentry *dentry;
	bool is_lowest;
	struct rb_root *root;
	struct list_head *list;
	struct list_head middle;
	struct ovl_cache_entry *first_maybe_whiteout;
	int count;
	int err;
	bool is_upper;
	bool d_type_supported;
};
struct ovl_dir_file {
	bool is_real;
	bool is_upper;
	struct ovl_dir_cache *cache;
	struct list_head *cursor;
	struct file *realfile;
	struct file *upperfile;
};
static struct ovl_cache_entry *ovl_cache_entry_from_node(struct rb_node *n)
{
	return rb_entry(n, struct ovl_cache_entry, node);
}
static bool ovl_cache_entry_find_link(const char *name, int len,
				      struct rb_node ***link,
				      struct rb_node **parent)
{
	bool found = false;
	struct rb_node **newp = *link;

	while (!found && *newp) {
		int cmp;
		struct ovl_cache_entry *tmp;

		*parent = *newp;
		tmp = ovl_cache_entry_from_node(*newp);
		cmp = strncmp(name, tmp->name, len);
		if (cmp > 0)
			newp = &tmp->node.rb_right;
		else if (cmp < 0 || len < tmp->len)
			newp = &tmp->node.rb_left;
		else
			found = true;
	}
	*link = newp;

	return found;
}
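
/*
 * Illustration (not from the original source): entries are ordered by
 * strncmp() over the new name's length, with length as tie-break.
 * Looking up "foo" (len 3) against an existing "foobar" (len 6) gives
 * cmp == 0 and 3 < 6, so the search goes left; looking up "foobar"
 * against "foo" compares 'b' against the stored NUL and goes right.
 * Only cmp == 0 with equal lengths reports an existing entry.
 */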
static struct ovl_cache_entry *ovl_cache_entry_find(struct rb_root *root,
						    const char *name, int len)
{
	struct rb_node *node = root->rb_node;
	int cmp;

	while (node) {
		struct ovl_cache_entry *p = ovl_cache_entry_from_node(node);

		cmp = strncmp(name, p->name, len);
		if (cmp > 0)
			node = p->node.rb_right;
		else if (cmp < 0 || len < p->len)
			node = p->node.rb_left;
		else
			return p;
	}

	return NULL;
}
static bool ovl_calc_d_ino(struct ovl_readdir_data *rdd,
			   struct ovl_cache_entry *p)
{
	/* Don't care if not doing ovl_iter() */
	if (!rdd->dentry)
		return false;

	/* Always recalc d_ino when remapping lower inode numbers */
	if (ovl_xino_bits(rdd->dentry->d_sb))
		return true;

	/* Always recalc d_ino for parent */
	if (strcmp(p->name, "..") == 0)
		return true;

	/* If this is lower, then native d_ino will do */
	if (!rdd->is_upper)
		return false;

	/*
	 * Recalc d_ino for '.' and for all entries if dir is impure (contains
	 * copied up entries)
	 */
	if ((p->name[0] == '.' && p->len == 1) ||
	    ovl_test_flag(OVL_IMPURE, d_inode(rdd->dentry)))
		return true;

	return false;
}
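
/*
 * Example (not from the original source): a pure lower entry with xino
 * disabled returns false here, so the lower fs d_ino is used as-is;
 * with xino enabled every entry is marked for recalculation and is
 * resolved lazily in ovl_iterate() via ovl_cache_update_ino().
 */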
static struct ovl_cache_entry *ovl_cache_entry_new(struct ovl_readdir_data *rdd,
						   const char *name, int len,
						   u64 ino, unsigned int d_type)
{
	struct ovl_cache_entry *p;
	size_t size = offsetof(struct ovl_cache_entry, name[len + 1]);

	p = kmalloc(size, GFP_KERNEL);
	if (!p)
		return NULL;

	memcpy(p->name, name, len);
	p->name[len] = '\0';
	p->len = len;
	p->type = d_type;
	p->real_ino = ino;
	p->ino = ino;
	/* Defer setting d_ino for upper entry to ovl_iterate() */
	if (ovl_calc_d_ino(rdd, p))
		p->ino = 0;
	p->is_upper = rdd->is_upper;
	p->is_whiteout = false;

	if (d_type == DT_CHR) {
		p->next_maybe_whiteout = rdd->first_maybe_whiteout;
		rdd->first_maybe_whiteout = p;
	}
	return p;
}
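
/*
 * Note: overlayfs represents a whiteout as a 0/0 character device, so
 * only DT_CHR entries can possibly be whiteouts.  They are chained on
 * first_maybe_whiteout and resolved later by ovl_check_whiteouts(),
 * deferring the per-entry lookups to a single locked pass.
 */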
static int ovl_cache_entry_add_rb(struct ovl_readdir_data *rdd,
				  const char *name, int len, u64 ino,
				  unsigned int d_type)
{
	struct rb_node **newp = &rdd->root->rb_node;
	struct rb_node *parent = NULL;
	struct ovl_cache_entry *p;

	if (ovl_cache_entry_find_link(name, len, &newp, &parent))
		return 0;

	p = ovl_cache_entry_new(rdd, name, len, ino, d_type);
	if (p == NULL) {
		rdd->err = -ENOMEM;
		return -ENOMEM;
	}

	list_add_tail(&p->l_node, rdd->list);
	rb_link_node(&p->node, parent, newp);
	rb_insert_color(&p->node, rdd->root);

	return 0;
}
static int ovl_fill_lowest(struct ovl_readdir_data *rdd,
			   const char *name, int namelen,
			   loff_t offset, u64 ino, unsigned int d_type)
{
	struct ovl_cache_entry *p;

	p = ovl_cache_entry_find(rdd->root, name, namelen);
	if (p) {
		list_move_tail(&p->l_node, &rdd->middle);
	} else {
		p = ovl_cache_entry_new(rdd, name, namelen, ino, d_type);
		if (p == NULL)
			rdd->err = -ENOMEM;
		else
			list_add_tail(&p->l_node, &rdd->middle);
	}

	return rdd->err;
}
void ovl_cache_free(struct list_head *list)
{
	struct ovl_cache_entry *p;
	struct ovl_cache_entry *n;

	list_for_each_entry_safe(p, n, list, l_node)
		kfree(p);

	INIT_LIST_HEAD(list);
}
void ovl_dir_cache_free(struct inode *inode)
{
	struct ovl_dir_cache *cache = ovl_dir_cache(inode);

	if (cache) {
		ovl_cache_free(&cache->entries);
		kfree(cache);
	}
}
static void ovl_cache_put(struct ovl_dir_file *od, struct dentry *dentry)
{
	struct ovl_dir_cache *cache = od->cache;

	WARN_ON(cache->refcount <= 0);
	cache->refcount--;
	if (!cache->refcount) {
		if (ovl_dir_cache(d_inode(dentry)) == cache)
			ovl_set_dir_cache(d_inode(dentry), NULL);

		ovl_cache_free(&cache->entries);
		kfree(cache);
	}
}
static int ovl_fill_merge(struct dir_context *ctx, const char *name,
			  int namelen, loff_t offset, u64 ino,
			  unsigned int d_type)
{
	struct ovl_readdir_data *rdd =
		container_of(ctx, struct ovl_readdir_data, ctx);

	rdd->count++;
	if (!rdd->is_lowest)
		return ovl_cache_entry_add_rb(rdd, name, namelen, ino, d_type);
	else
		return ovl_fill_lowest(rdd, name, namelen, offset, ino, d_type);
}
static int ovl_check_whiteouts(struct dentry *dir, struct ovl_readdir_data *rdd)
{
	int err;
	struct ovl_cache_entry *p;
	struct dentry *dentry;
	const struct cred *old_cred;

	old_cred = ovl_override_creds(rdd->dentry->d_sb);

	err = down_write_killable(&dir->d_inode->i_rwsem);
	if (!err) {
		while (rdd->first_maybe_whiteout) {
			p = rdd->first_maybe_whiteout;
			rdd->first_maybe_whiteout = p->next_maybe_whiteout;
			dentry = lookup_one_len(p->name, dir, p->len);
			if (!IS_ERR(dentry)) {
				p->is_whiteout = ovl_is_whiteout(dentry);
				dput(dentry);
			}
		}
		inode_unlock(dir->d_inode);
	}
	revert_creds(old_cred);

	return err;
}
static inline int ovl_dir_read(struct path *realpath,
			       struct ovl_readdir_data *rdd)
{
	struct file *realfile;
	int err;

	realfile = ovl_path_open(realpath, O_RDONLY | O_LARGEFILE);
	if (IS_ERR(realfile))
		return PTR_ERR(realfile);

	rdd->first_maybe_whiteout = NULL;
	rdd->ctx.pos = 0;
	do {
		rdd->count = 0;
		rdd->err = 0;
		err = iterate_dir(realfile, &rdd->ctx);
		if (err >= 0)
			err = rdd->err;
	} while (!err && rdd->count);

	if (!err && rdd->first_maybe_whiteout && rdd->dentry)
		err = ovl_check_whiteouts(realpath->dentry, rdd);

	fput(realfile);

	return err;
}
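
/*
 * Note (sketch of intent, not from the original source): iterate_dir()
 * may return before EOF, so the loop above repeats while a pass still
 * produced entries (rdd->count) and stops on the first pass that
 * produces none, or on the first error.
 */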
/*
 * Can we iterate real dir directly?
 *
 * Non-merge dir may contain whiteouts from a time it was a merge upper, before
 * lower dir was removed under it and possibly before it was rotated from upper
 * to lower layer.
 */
static bool ovl_dir_is_real(struct dentry *dir)
{
	return !ovl_test_flag(OVL_WHITEOUTS, d_inode(dir));
}
static void ovl_dir_reset(struct file *file)
{
	struct ovl_dir_file *od = file->private_data;
	struct ovl_dir_cache *cache = od->cache;
	struct dentry *dentry = file->f_path.dentry;
	bool is_real;

	if (cache && ovl_dentry_version_get(dentry) != cache->version) {
		ovl_cache_put(od, dentry);
		od->cache = NULL;
		od->cursor = NULL;
	}
	is_real = ovl_dir_is_real(dentry);
	if (od->is_real != is_real) {
		/* is_real can only become false when dir is copied up */
		if (WARN_ON(is_real))
			return;
		od->is_real = false;
	}
}
static int ovl_dir_read_merged(struct dentry *dentry, struct list_head *list,
			       struct rb_root *root)
{
	int err;
	struct path realpath;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_merge,
		.dentry = dentry,
		.list = list,
		.root = root,
		.is_lowest = false,
	};
	int idx, next;

	for (idx = 0; idx != -1; idx = next) {
		next = ovl_path_next(idx, dentry, &realpath);
		rdd.is_upper = ovl_dentry_upper(dentry) == realpath.dentry;

		if (next != -1) {
			err = ovl_dir_read(&realpath, &rdd);
			if (err)
				break;
		} else {
			/*
			 * Insert lowest layer entries before upper ones, this
			 * allows offsets to be reasonably constant
			 */
			list_add(&rdd.middle, rdd.list);
			rdd.is_lowest = true;
			err = ovl_dir_read(&realpath, &rdd);
			list_del(&rdd.middle);
		}
	}
	return err;
}
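
/*
 * Worked example (illustrative, not from the original source): with
 * upper entries {a, c} and lowest entries read in the order (b, a),
 * the upper pass builds [a, c]; the "middle" marker M is then linked
 * at the head and lowest entries accumulate in front of it, moving
 * duplicates as they are met: [b, M, a, c], then [b, a, M, c].
 * Deleting the marker leaves [b, a, c]: lowest-layer order first,
 * upper-only entries after.
 */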
static void ovl_seek_cursor(struct ovl_dir_file *od, loff_t pos)
{
	struct list_head *p;
	loff_t off = 0;

	list_for_each(p, &od->cache->entries) {
		if (off >= pos)
			break;
		off++;
	}
	/* Cursor is safe since the cache is stable */
	od->cursor = p;
}
static struct ovl_dir_cache *ovl_cache_get(struct dentry *dentry)
{
	int res;
	struct ovl_dir_cache *cache;

	cache = ovl_dir_cache(d_inode(dentry));
	if (cache && ovl_dentry_version_get(dentry) == cache->version) {
		WARN_ON(!cache->refcount);
		cache->refcount++;
		return cache;
	}
	ovl_set_dir_cache(d_inode(dentry), NULL);

	cache = kzalloc(sizeof(struct ovl_dir_cache), GFP_KERNEL);
	if (!cache)
		return ERR_PTR(-ENOMEM);

	cache->refcount = 1;
	INIT_LIST_HEAD(&cache->entries);
	cache->root = RB_ROOT;

	res = ovl_dir_read_merged(dentry, &cache->entries, &cache->root);
	if (res) {
		ovl_cache_free(&cache->entries);
		kfree(cache);
		return ERR_PTR(res);
	}

	cache->version = ovl_dentry_version_get(dentry);
	ovl_set_dir_cache(d_inode(dentry), cache);

	return cache;
}
/* Map inode number to lower fs unique range */
static u64 ovl_remap_lower_ino(u64 ino, int xinobits, int fsid,
			       const char *name, int namelen, bool warn)
{
	unsigned int xinoshift = 64 - xinobits;

	if (unlikely(ino >> xinoshift)) {
		if (warn) {
			pr_warn_ratelimited("d_ino too big (%.*s, ino=%llu, xinobits=%d)\n",
					    namelen, name, ino, xinobits);
		}
		return ino;
	}

	/*
	 * The lowest xinobit is reserved for mapping the non-persistent inode
	 * numbers range, but this range is only exposed via st_ino, not here.
	 */
	return ino | ((u64)fsid) << (xinoshift + 1);
}
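
/*
 * Worked example (illustrative, not from the original source): with
 * xinobits = 8, xinoshift = 56; fsid is shifted into bits 57..63 and
 * bit 56 stays reserved.  A lower inode 42 on fsid 2 maps to
 * 42 | (2ULL << 57) == 0x040000000000002a.  An inode already using
 * bit 56 or above cannot be remapped and is returned unchanged,
 * optionally with a ratelimited warning.
 */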
/*
 * Set d_ino for upper entries. Non-upper entries should always report
 * the uppermost real inode ino and should not call this function.
 *
 * When not all layers are on the same fs, report real ino also for upper.
 *
 * When all layers are on the same fs, and upper has a reference to
 * copy up origin, call vfs_getattr() on the overlay entry to make
 * sure that d_ino will be consistent with st_ino from stat(2).
 */
static int ovl_cache_update_ino(struct path *path, struct ovl_cache_entry *p)
{
	struct dentry *dir = path->dentry;
	struct dentry *this = NULL;
	enum ovl_path_type type;
	u64 ino = p->real_ino;
	int xinobits = ovl_xino_bits(dir->d_sb);
	int err = 0;

	if (!ovl_same_dev(dir->d_sb))
		goto out;

	if (p->name[0] == '.') {
		if (p->len == 1) {
			this = dget(dir);
			goto get;
		}
		if (p->len == 2 && p->name[1] == '.') {
			/* we shall not be moved */
			this = dget(dir->d_parent);
			goto get;
		}
	}
	this = lookup_one_len(p->name, dir, p->len);
	if (IS_ERR_OR_NULL(this) || !this->d_inode) {
		/* Mark a stale entry */
		p->is_whiteout = true;
		if (IS_ERR(this)) {
			err = PTR_ERR(this);
			this = NULL;
			goto fail;
		}
		goto out;
	}

get:
	type = ovl_path_type(this);
	if (OVL_TYPE_ORIGIN(type)) {
		struct kstat stat;
		struct path statpath = *path;

		statpath.dentry = this;
		err = vfs_getattr(&statpath, &stat, STATX_INO, 0);
		if (err)
			goto fail;

		/*
		 * Directory inode is always on overlay st_dev.
		 * Non-dir with ovl_same_dev() could be on pseudo st_dev in case
		 * of xino bits overflow.
		 */
		WARN_ON_ONCE(S_ISDIR(stat.mode) &&
			     dir->d_sb->s_dev != stat.dev);
		ino = stat.ino;
	} else if (xinobits && !OVL_TYPE_UPPER(type)) {
		ino = ovl_remap_lower_ino(ino, xinobits,
					  ovl_layer_lower(this)->fsid,
					  p->name, p->len,
					  ovl_xino_warn(dir->d_sb));
	}

out:
	p->ino = ino;
	dput(this);
	return err;

fail:
	pr_warn_ratelimited("failed to look up (%s) for ino (%i)\n",
			    p->name, err);
	goto out;
}
static int ovl_fill_plain(struct dir_context *ctx, const char *name,
			  int namelen, loff_t offset, u64 ino,
			  unsigned int d_type)
{
	struct ovl_cache_entry *p;
	struct ovl_readdir_data *rdd =
		container_of(ctx, struct ovl_readdir_data, ctx);

	rdd->count++;
	p = ovl_cache_entry_new(rdd, name, namelen, ino, d_type);
	if (p == NULL) {
		rdd->err = -ENOMEM;
		return -ENOMEM;
	}
	list_add_tail(&p->l_node, rdd->list);

	return 0;
}
static int ovl_dir_read_impure(struct path *path, struct list_head *list,
			       struct rb_root *root)
{
	int err;
	struct path realpath;
	struct ovl_cache_entry *p, *n;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_plain,
		.list = list,
		.root = root,
	};

	INIT_LIST_HEAD(list);
	*root = RB_ROOT;
	ovl_path_upper(path->dentry, &realpath);

	err = ovl_dir_read(&realpath, &rdd);
	if (err)
		return err;

	list_for_each_entry_safe(p, n, list, l_node) {
		if (strcmp(p->name, ".") != 0 &&
		    strcmp(p->name, "..") != 0) {
			err = ovl_cache_update_ino(path, p);
			if (err)
				return err;
		}
		if (p->ino == p->real_ino) {
			list_del(&p->l_node);
			kfree(p);
		} else {
			struct rb_node **newp = &root->rb_node;
			struct rb_node *parent = NULL;

			if (WARN_ON(ovl_cache_entry_find_link(p->name, p->len,
							      &newp, &parent)))
				return -EIO;

			rb_link_node(&p->node, parent, newp);
			rb_insert_color(&p->node, root);
		}
	}
	return 0;
}
static struct ovl_dir_cache *ovl_cache_get_impure(struct path *path)
{
	int res;
	struct dentry *dentry = path->dentry;
	struct ovl_dir_cache *cache;

	cache = ovl_dir_cache(d_inode(dentry));
	if (cache && ovl_dentry_version_get(dentry) == cache->version)
		return cache;

	/* Impure cache is not refcounted, free it here */
	ovl_dir_cache_free(d_inode(dentry));
	ovl_set_dir_cache(d_inode(dentry), NULL);

	cache = kzalloc(sizeof(struct ovl_dir_cache), GFP_KERNEL);
	if (!cache)
		return ERR_PTR(-ENOMEM);

	res = ovl_dir_read_impure(path, &cache->entries, &cache->root);
	if (res) {
		ovl_cache_free(&cache->entries);
		kfree(cache);
		return ERR_PTR(res);
	}
	if (list_empty(&cache->entries)) {
		/*
		 * A good opportunity to get rid of an unneeded "impure" flag.
		 * Removing the "impure" xattr is best effort.
		 */
		if (!ovl_want_write(dentry)) {
			ovl_do_removexattr(ovl_dentry_upper(dentry),
					   OVL_XATTR_IMPURE);
			ovl_drop_write(dentry);
		}
		ovl_clear_flag(OVL_IMPURE, d_inode(dentry));
		kfree(cache);
		return NULL;
	}

	cache->version = ovl_dentry_version_get(dentry);
	ovl_set_dir_cache(d_inode(dentry), cache);

	return cache;
}
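
/*
 * Note: unlike the refcounted merge cache from ovl_cache_get(), the
 * impure cache keeps only entries whose d_ino differs from the real
 * ino and lives until the dir version changes or the inode is evicted
 * (ovl_dir_cache_free()).
 */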
struct ovl_readdir_translate {
	struct dir_context *orig_ctx;
	struct ovl_dir_cache *cache;
	struct dir_context ctx;
	u64 parent_ino;
	int fsid;
	int xinobits;
	bool xinowarn;
};
static int ovl_fill_real(struct dir_context *ctx, const char *name,
			 int namelen, loff_t offset, u64 ino,
			 unsigned int d_type)
{
	struct ovl_readdir_translate *rdt =
		container_of(ctx, struct ovl_readdir_translate, ctx);
	struct dir_context *orig_ctx = rdt->orig_ctx;

	if (rdt->parent_ino && strcmp(name, "..") == 0) {
		ino = rdt->parent_ino;
	} else if (rdt->cache) {
		struct ovl_cache_entry *p;

		p = ovl_cache_entry_find(&rdt->cache->root, name, namelen);
		if (p)
			ino = p->ino;
	} else if (rdt->xinobits) {
		ino = ovl_remap_lower_ino(ino, rdt->xinobits, rdt->fsid,
					  name, namelen, rdt->xinowarn);
	}

	return orig_ctx->actor(orig_ctx, name, namelen, offset, ino, d_type);
}
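
/*
 * Translation precedence above: a '..' entry takes the precomputed
 * parent ino; otherwise a hit in the impure cache wins; otherwise a
 * plain xino remap applies.  Entries needing none of these pass
 * through to the caller's actor unchanged.
 */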
static bool ovl_is_impure_dir(struct file *file)
{
	struct ovl_dir_file *od = file->private_data;
	struct inode *dir = d_inode(file->f_path.dentry);

	/*
	 * Only upper dir can be impure, but if we are in the middle of
	 * iterating a lower real dir, dir could be copied up and marked
	 * impure. We only want the impure cache if we started iterating
	 * a real upper dir to begin with.
	 */
	return od->is_upper && ovl_test_flag(OVL_IMPURE, dir);
}
static int ovl_iterate_real(struct file *file, struct dir_context *ctx)
{
	int err;
	struct ovl_dir_file *od = file->private_data;
	struct dentry *dir = file->f_path.dentry;
	const struct ovl_layer *lower_layer = ovl_layer_lower(dir);
	struct ovl_readdir_translate rdt = {
		.ctx.actor = ovl_fill_real,
		.orig_ctx = ctx,
		.xinobits = ovl_xino_bits(dir->d_sb),
		.xinowarn = ovl_xino_warn(dir->d_sb),
	};

	if (rdt.xinobits && lower_layer)
		rdt.fsid = lower_layer->fsid;

	if (OVL_TYPE_MERGE(ovl_path_type(dir->d_parent))) {
		struct kstat stat;
		struct path statpath = file->f_path;

		statpath.dentry = dir->d_parent;
		err = vfs_getattr(&statpath, &stat, STATX_INO, 0);
		if (err)
			return err;

		WARN_ON_ONCE(dir->d_sb->s_dev != stat.dev);
		rdt.parent_ino = stat.ino;
	}

	if (ovl_is_impure_dir(file)) {
		rdt.cache = ovl_cache_get_impure(&file->f_path);
		if (IS_ERR(rdt.cache))
			return PTR_ERR(rdt.cache);
	}

	err = iterate_dir(od->realfile, &rdt.ctx);
	ctx->pos = rdt.ctx.pos;

	return err;
}
static int ovl_iterate(struct file *file, struct dir_context *ctx)
{
	struct ovl_dir_file *od = file->private_data;
	struct dentry *dentry = file->f_path.dentry;
	struct ovl_cache_entry *p;
	const struct cred *old_cred;
	int err;

	old_cred = ovl_override_creds(dentry->d_sb);
	if (!ctx->pos)
		ovl_dir_reset(file);

	if (od->is_real) {
		/*
		 * If parent is merge, then need to adjust d_ino for '..', if
		 * dir is impure then need to adjust d_ino for copied up
		 * entries.
		 */
		if (ovl_xino_bits(dentry->d_sb) ||
		    (ovl_same_fs(dentry->d_sb) &&
		     (ovl_is_impure_dir(file) ||
		      OVL_TYPE_MERGE(ovl_path_type(dentry->d_parent))))) {
			err = ovl_iterate_real(file, ctx);
		} else {
			err = iterate_dir(od->realfile, ctx);
		}
		goto out;
	}

	if (!od->cache) {
		struct ovl_dir_cache *cache;

		cache = ovl_cache_get(dentry);
		err = PTR_ERR(cache);
		if (IS_ERR(cache))
			goto out;

		od->cache = cache;
		ovl_seek_cursor(od, ctx->pos);
	}

	while (od->cursor != &od->cache->entries) {
		p = list_entry(od->cursor, struct ovl_cache_entry, l_node);
		if (!p->is_whiteout) {
			if (!p->ino) {
				err = ovl_cache_update_ino(&file->f_path, p);
				if (err)
					goto out;
			}
			if (!dir_emit(ctx, p->name, p->len, p->ino, p->type))
				break;
		}
		od->cursor = p->l_node.next;
		ctx->pos++;
	}
	err = 0;
out:
	revert_creds(old_cred);
	return err;
}
static loff_t ovl_dir_llseek(struct file *file, loff_t offset, int origin)
{
	loff_t res;
	struct ovl_dir_file *od = file->private_data;

	inode_lock(file_inode(file));
	if (!file->f_pos)
		ovl_dir_reset(file);

	if (od->is_real) {
		res = vfs_llseek(od->realfile, offset, origin);
		file->f_pos = od->realfile->f_pos;
	} else {
		res = -EINVAL;

		switch (origin) {
		case SEEK_CUR:
			offset += file->f_pos;
			break;
		case SEEK_SET:
			break;
		default:
			goto out_unlock;
		}
		if (offset < 0)
			goto out_unlock;

		if (offset != file->f_pos) {
			file->f_pos = offset;
			if (od->cache)
				ovl_seek_cursor(od, offset);
		}
		res = offset;
	}
out_unlock:
	inode_unlock(file_inode(file));

	return res;
}
static struct file *ovl_dir_open_realfile(struct file *file,
					  struct path *realpath)
{
	struct file *res;
	const struct cred *old_cred;

	old_cred = ovl_override_creds(file_inode(file)->i_sb);
	res = ovl_path_open(realpath, O_RDONLY | (file->f_flags & O_LARGEFILE));
	revert_creds(old_cred);

	return res;
}
static int ovl_dir_fsync(struct file *file, loff_t start, loff_t end,
			 int datasync)
{
	struct ovl_dir_file *od = file->private_data;
	struct dentry *dentry = file->f_path.dentry;
	struct file *realfile = od->realfile;

	/* Nothing to sync for lower */
	if (!OVL_TYPE_UPPER(ovl_path_type(dentry)))
		return 0;

	/*
	 * Need to check if we started out being a lower dir, but got copied up
	 */
	if (!od->is_upper) {
		struct inode *inode = file_inode(file);

		realfile = READ_ONCE(od->upperfile);
		if (!realfile) {
			struct path upperpath;

			ovl_path_upper(dentry, &upperpath);
			realfile = ovl_dir_open_realfile(file, &upperpath);

			inode_lock(inode);
			if (!od->upperfile) {
				if (IS_ERR(realfile)) {
					inode_unlock(inode);
					return PTR_ERR(realfile);
				}
				smp_store_release(&od->upperfile, realfile);
			} else {
				/* somebody has beaten us to it */
				if (!IS_ERR(realfile))
					fput(realfile);
				realfile = od->upperfile;
			}
			inode_unlock(inode);
		}
	}

	return vfs_fsync_range(realfile, start, end, datasync);
}
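
/*
 * Note: the lockless READ_ONCE(od->upperfile) fast path pairs with the
 * smp_store_release() done under inode_lock(), so a reader that sees a
 * non-NULL upperfile also sees the fully constructed struct file.
 */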
static int ovl_dir_release(struct inode *inode, struct file *file)
{
	struct ovl_dir_file *od = file->private_data;

	if (od->cache) {
		inode_lock(inode);
		ovl_cache_put(od, file->f_path.dentry);
		inode_unlock(inode);
	}
	fput(od->realfile);
	if (od->upperfile)
		fput(od->upperfile);
	kfree(od);

	return 0;
}
static int ovl_dir_open(struct inode *inode, struct file *file)
{
	struct path realpath;
	struct file *realfile;
	struct ovl_dir_file *od;
	enum ovl_path_type type;

	od = kzalloc(sizeof(struct ovl_dir_file), GFP_KERNEL);
	if (!od)
		return -ENOMEM;

	type = ovl_path_real(file->f_path.dentry, &realpath);
	realfile = ovl_dir_open_realfile(file, &realpath);
	if (IS_ERR(realfile)) {
		kfree(od);
		return PTR_ERR(realfile);
	}
	od->realfile = realfile;
	od->is_real = ovl_dir_is_real(file->f_path.dentry);
	od->is_upper = OVL_TYPE_UPPER(type);
	file->private_data = od;

	return 0;
}
const struct file_operations ovl_dir_operations = {
	.read		= generic_read_dir,
	.open		= ovl_dir_open,
	.iterate	= ovl_iterate,
	.llseek		= ovl_dir_llseek,
	.fsync		= ovl_dir_fsync,
	.release	= ovl_dir_release,
};
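
/*
 * Note: .read is wired to generic_read_dir(), which simply returns
 * -EISDIR, so read(2) on an overlay directory fails the same way as on
 * any other directory.
 */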
int ovl_check_empty_dir(struct dentry *dentry, struct list_head *list)
{
	int err;
	struct ovl_cache_entry *p, *n;
	struct rb_root root = RB_ROOT;
	const struct cred *old_cred;

	old_cred = ovl_override_creds(dentry->d_sb);
	err = ovl_dir_read_merged(dentry, list, &root);
	revert_creds(old_cred);
	if (err)
		return err;

	err = 0;

	list_for_each_entry_safe(p, n, list, l_node) {
		/*
		 * Select whiteouts in upperdir, they should
		 * be cleared when deleting this directory.
		 */
		if (p->is_whiteout) {
			if (p->is_upper)
				continue;
			goto del_entry;
		}

		if (p->name[0] == '.') {
			if (p->len == 1)
				goto del_entry;
			if (p->len == 2 && p->name[1] == '.')
				goto del_entry;
		}
		err = -ENOTEMPTY;
		break;

del_entry:
		list_del(&p->l_node);
		kfree(p);
	}

	return err;
}
void ovl_cleanup_whiteouts(struct dentry *upper, struct list_head *list)
{
	struct ovl_cache_entry *p;

	inode_lock_nested(upper->d_inode, I_MUTEX_CHILD);
	list_for_each_entry(p, list, l_node) {
		struct dentry *dentry;

		if (WARN_ON(!p->is_whiteout || !p->is_upper))
			continue;

		dentry = lookup_one_len(p->name, upper, p->len);
		if (IS_ERR(dentry)) {
			pr_err("lookup '%s/%.*s' failed (%i)\n",
			       upper->d_name.name, p->len, p->name,
			       (int) PTR_ERR(dentry));
			continue;
		}
		if (dentry->d_inode)
			ovl_cleanup(upper->d_inode, dentry);
		dput(dentry);
	}
	inode_unlock(upper->d_inode);
}
static int ovl_check_d_type(struct dir_context *ctx, const char *name,
			    int namelen, loff_t offset, u64 ino,
			    unsigned int d_type)
{
	struct ovl_readdir_data *rdd =
		container_of(ctx, struct ovl_readdir_data, ctx);

	/* Even if d_type is not supported, DT_DIR is returned for . and .. */
	if (!strncmp(name, ".", namelen) || !strncmp(name, "..", namelen))
		return 0;

	if (d_type != DT_UNKNOWN)
		rdd->d_type_supported = true;

	return 0;
}
/*
 * Returns 1 if d_type is supported, 0 if not supported/unknown, and a
 * negative value if an error is encountered.
 */
int ovl_check_d_type_supported(struct path *realpath)
{
	int err;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_check_d_type,
		.d_type_supported = false,
	};

	err = ovl_dir_read(realpath, &rdd);
	if (err)
		return err;

	return rdd.d_type_supported;
}
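
/*
 * Usage sketch (illustrative, not from this file): mount-time code
 * probes the work dir with this helper, since without d_type overlayfs
 * cannot reliably tell whiteouts apart:
 *
 *	err = ovl_check_d_type_supported(&workpath);
 *	if (err <= 0)
 *		pr_warn("upper fs needs to support d_type.\n");
 */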
static void ovl_workdir_cleanup_recurse(struct path *path, int level)
{
	int err;
	struct inode *dir = path->dentry->d_inode;
	LIST_HEAD(list);
	struct rb_root root = RB_ROOT;
	struct ovl_cache_entry *p;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_merge,
		.dentry = NULL,
		.list = &list,
		.root = &root,
		.is_lowest = false,
	};

	err = ovl_dir_read(path, &rdd);
	if (err)
		goto out;

	inode_lock_nested(dir, I_MUTEX_PARENT);
	list_for_each_entry(p, &list, l_node) {
		struct dentry *dentry;

		if (p->name[0] == '.') {
			if (p->len == 1)
				continue;
			if (p->len == 2 && p->name[1] == '.')
				continue;
		}
		dentry = lookup_one_len(p->name, path->dentry, p->len);
		if (IS_ERR(dentry))
			continue;
		if (dentry->d_inode)
			ovl_workdir_cleanup(dir, path->mnt, dentry, level);
		dput(dentry);
	}
	inode_unlock(dir);
out:
	ovl_cache_free(&list);
}
int ovl_workdir_cleanup(struct inode *dir, struct vfsmount *mnt,
			struct dentry *dentry, int level)
{
	int err;

	if (!d_is_dir(dentry) || level > 1) {
		return ovl_cleanup(dir, dentry);
	}

	err = ovl_do_rmdir(dir, dentry);
	if (err) {
		struct path path = { .mnt = mnt, .dentry = dentry };

		inode_unlock(dir);
		ovl_workdir_cleanup_recurse(&path, level + 1);
		inode_lock_nested(dir, I_MUTEX_PARENT);
		err = ovl_cleanup(dir, dentry);
	}

	return err;
}
int ovl_indexdir_cleanup(struct ovl_fs *ofs)
{
	int err;
	struct dentry *indexdir = ofs->indexdir;
	struct dentry *index = NULL;
	struct inode *dir = indexdir->d_inode;
	struct path path = { .mnt = ovl_upper_mnt(ofs), .dentry = indexdir };
	LIST_HEAD(list);
	struct rb_root root = RB_ROOT;
	struct ovl_cache_entry *p;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_merge,
		.dentry = NULL,
		.list = &list,
		.root = &root,
		.is_lowest = false,
	};

	err = ovl_dir_read(&path, &rdd);
	if (err)
		goto out;

	inode_lock_nested(dir, I_MUTEX_PARENT);
	list_for_each_entry(p, &list, l_node) {
		if (p->name[0] == '.') {
			if (p->len == 1)
				continue;
			if (p->len == 2 && p->name[1] == '.')
				continue;
		}
		index = lookup_one_len(p->name, indexdir, p->len);
		if (IS_ERR(index)) {
			err = PTR_ERR(index);
			index = NULL;
			break;
		}
		/* Cleanup leftover from index create/cleanup attempt */
		if (index->d_name.name[0] == '#') {
			err = ovl_workdir_cleanup(dir, path.mnt, index, 1);
			if (err)
				break;
			goto next;
		}
		err = ovl_verify_index(ofs, index);
		if (!err) {
			goto next;
		} else if (err == -ESTALE) {
			/* Cleanup stale index entries */
			err = ovl_cleanup(dir, index);
		} else if (err != -ENOENT) {
			/*
			 * Abort mount to avoid corrupting the index if
			 * an incompatible index entry was found or on out
			 * of memory.
			 */
			break;
		} else if (ofs->config.nfs_export) {
			/*
			 * Whiteout orphan index to block future open by
			 * handle after overlay nlink dropped to zero.
			 */
			err = ovl_cleanup_and_whiteout(ofs, dir, index);
		} else {
			/* Cleanup orphan index entries */
			err = ovl_cleanup(dir, index);
		}

		if (err)
			break;

next:
		dput(index);
		index = NULL;
	}
	dput(index);
	inode_unlock(dir);
out:
	ovl_cache_free(&list);
	if (err)
		pr_err("failed index dir cleanup (%i)\n", err);
	return err;
}