// SPDX-License-Identifier: GPL-2.0-only
/*
 * Copyright (C) 2011 Novell Inc.
 */

#include <linux/fs.h>
#include <linux/slab.h>
#include <linux/namei.h>
#include <linux/file.h>
#include <linux/xattr.h>
#include <linux/rbtree.h>
#include <linux/security.h>
#include <linux/cred.h>
#include <linux/ratelimit.h>
#include "overlayfs.h"

struct ovl_cache_entry {
	unsigned int len;
	unsigned int type;
	u64 real_ino;
	u64 ino;
	struct list_head l_node;
	struct rb_node node;
	struct ovl_cache_entry *next_maybe_whiteout;
	bool is_upper;
	bool is_whiteout;
	bool check_xwhiteout;
	char name[];
};

struct ovl_dir_cache {
	long refcount;
	u64 version;
	struct list_head entries;
	struct rb_root root;
};

struct ovl_readdir_data {
	struct dir_context ctx;
	struct dentry *dentry;
	bool is_lowest;
	struct rb_root *root;
	struct list_head *list;
	struct list_head middle;
	struct ovl_cache_entry *first_maybe_whiteout;
	int count;
	int err;
	bool is_upper;
	bool d_type_supported;
	bool in_xwhiteouts_dir;
};

struct ovl_dir_file {
	bool is_real;
	bool is_upper;
	struct ovl_dir_cache *cache;
	struct list_head *cursor;
	struct file *realfile;
	struct file *upperfile;
};

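/*
 * Note on the data structures above: a merged directory is cached both as
 * an rbtree (cache->root) for fast name lookup while merging layers, and
 * as a linked list (cache->entries) that preserves a stable iteration
 * order, so that f_pos offsets stay meaningful across getdents() calls.
 */
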
static struct ovl_cache_entry *ovl_cache_entry_from_node(struct rb_node *n)
{
	return rb_entry(n, struct ovl_cache_entry, node);
}

static bool ovl_cache_entry_find_link(const char *name, int len,
				      struct rb_node ***link,
				      struct rb_node **parent)
{
	bool found = false;
	struct rb_node **newp = *link;

	while (!found && *newp) {
		int cmp;
		struct ovl_cache_entry *tmp;

		*parent = *newp;
		tmp = ovl_cache_entry_from_node(*newp);
		cmp = strncmp(name, tmp->name, len);
		if (cmp > 0)
			newp = &tmp->node.rb_right;
		else if (cmp < 0 || len < tmp->len)
			newp = &tmp->node.rb_left;
		else
			found = true;
	}
	*link = newp;

	return found;
}

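/*
 * Entries are ordered by strncmp() over the searched name's length, with a
 * shorter name sorting before a longer name that it prefixes. For example,
 * looking up "foo" (len 3) against an entry "foobar" (len 6) gives
 * strncmp("foo", "foobar", 3) == 0 but 3 < 6, so the search descends left.
 */
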
static struct ovl_cache_entry *ovl_cache_entry_find(struct rb_root *root,
						    const char *name, int len)
{
	struct rb_node *node = root->rb_node;
	int cmp;

	while (node) {
		struct ovl_cache_entry *p = ovl_cache_entry_from_node(node);

		cmp = strncmp(name, p->name, len);
		if (cmp > 0)
			node = p->node.rb_right;
		else if (cmp < 0 || len < p->len)
			node = p->node.rb_left;
		else
			return p;
	}

	return NULL;
}

static bool ovl_calc_d_ino(struct ovl_readdir_data *rdd,
			   struct ovl_cache_entry *p)
{
	/* Don't care if not doing ovl_iter() */
	if (!rdd->dentry)
		return false;

	/* Always recalc d_ino when remapping lower inode numbers */
	if (ovl_xino_bits(OVL_FS(rdd->dentry->d_sb)))
		return true;

	/* Always recalc d_ino for parent */
	if (strcmp(p->name, "..") == 0)
		return true;

	/* If this is lower, then native d_ino will do */
	if (!rdd->is_upper)
		return false;

	/*
	 * Recalc d_ino for '.' and for all entries if dir is impure (contains
	 * copied up entries)
	 */
	if ((p->name[0] == '.' && p->len == 1) ||
	    ovl_test_flag(OVL_IMPURE, d_inode(rdd->dentry)))
		return true;

	return false;
}

static struct ovl_cache_entry *ovl_cache_entry_new(struct ovl_readdir_data *rdd,
						   const char *name, int len,
						   u64 ino, unsigned int d_type)
{
	struct ovl_cache_entry *p;
	size_t size = offsetof(struct ovl_cache_entry, name[len + 1]);

	p = kmalloc(size, GFP_KERNEL);
	if (!p)
		return NULL;

	memcpy(p->name, name, len);
	p->name[len] = '\0';
	p->len = len;
	p->type = d_type;
	p->real_ino = ino;
	p->ino = ino;
	/* Defer setting d_ino for upper entry to ovl_iterate() */
	if (ovl_calc_d_ino(rdd, p))
		p->ino = 0;
	p->is_upper = rdd->is_upper;
	p->is_whiteout = false;
	/* Defer check for overlay.whiteout to ovl_iterate() */
	p->check_xwhiteout = rdd->in_xwhiteouts_dir && d_type == DT_REG;

	if (d_type == DT_CHR) {
		p->next_maybe_whiteout = rdd->first_maybe_whiteout;
		rdd->first_maybe_whiteout = p;
	}
	return p;
}

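/*
 * The allocation above uses the flexible array member at the end of
 * struct ovl_cache_entry: offsetof(..., name[len + 1]) sizes the struct
 * and the nul-terminated name copy in a single kmalloc(). DT_CHR entries
 * are chained on first_maybe_whiteout because classic whiteouts are
 * character devices; whether they really are whiteouts is resolved later.
 */
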
static bool ovl_cache_entry_add_rb(struct ovl_readdir_data *rdd,
				   const char *name, int len, u64 ino,
				   unsigned int d_type)
{
	struct rb_node **newp = &rdd->root->rb_node;
	struct rb_node *parent = NULL;
	struct ovl_cache_entry *p;

	if (ovl_cache_entry_find_link(name, len, &newp, &parent))
		return true;

	p = ovl_cache_entry_new(rdd, name, len, ino, d_type);
	if (p == NULL) {
		rdd->err = -ENOMEM;
		return false;
	}

	list_add_tail(&p->l_node, rdd->list);
	rb_link_node(&p->node, parent, newp);
	rb_insert_color(&p->node, rdd->root);

	return true;
}

static bool ovl_fill_lowest(struct ovl_readdir_data *rdd,
			    const char *name, int namelen,
			    loff_t offset, u64 ino, unsigned int d_type)
{
	struct ovl_cache_entry *p;

	p = ovl_cache_entry_find(rdd->root, name, namelen);
	if (p) {
		list_move_tail(&p->l_node, &rdd->middle);
	} else {
		p = ovl_cache_entry_new(rdd, name, namelen, ino, d_type);
		if (p == NULL)
			rdd->err = -ENOMEM;
		else
			list_add_tail(&p->l_node, &rdd->middle);
	}

	return rdd->err == 0;
}

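/*
 * Merge logic in the two helpers above: non-lowest layers insert into the
 * rbtree, where a name already present from a higher layer shadows the new
 * one, while the lowest layer collects its entries on the temporary
 * "middle" list so ovl_dir_read_merged() can splice them in ahead of the
 * upper-only entries.
 */
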
void ovl_cache_free(struct list_head *list)
{
	struct ovl_cache_entry *p;
	struct ovl_cache_entry *n;

	list_for_each_entry_safe(p, n, list, l_node)
		kfree(p);

	INIT_LIST_HEAD(list);
}

void ovl_dir_cache_free(struct inode *inode)
{
	struct ovl_dir_cache *cache = ovl_dir_cache(inode);

	if (cache) {
		ovl_cache_free(&cache->entries);
		kfree(cache);
	}
}

static void ovl_cache_put(struct ovl_dir_file *od, struct inode *inode)
{
	struct ovl_dir_cache *cache = od->cache;

	WARN_ON(cache->refcount <= 0);
	cache->refcount--;
	if (!cache->refcount) {
		if (ovl_dir_cache(inode) == cache)
			ovl_set_dir_cache(inode, NULL);

		ovl_cache_free(&cache->entries);
		kfree(cache);
	}
}

static bool ovl_fill_merge(struct dir_context *ctx, const char *name,
			   int namelen, loff_t offset, u64 ino,
			   unsigned int d_type)
{
	struct ovl_readdir_data *rdd =
		container_of(ctx, struct ovl_readdir_data, ctx);

	rdd->count++;
	if (!rdd->is_lowest)
		return ovl_cache_entry_add_rb(rdd, name, namelen, ino, d_type);
	else
		return ovl_fill_lowest(rdd, name, namelen, offset, ino, d_type);
}

static int ovl_check_whiteouts(const struct path *path, struct ovl_readdir_data *rdd)
{
	int err;
	struct ovl_cache_entry *p;
	struct dentry *dentry, *dir = path->dentry;
	const struct cred *old_cred;

	old_cred = ovl_override_creds(rdd->dentry->d_sb);

	err = down_write_killable(&dir->d_inode->i_rwsem);
	if (!err) {
		while (rdd->first_maybe_whiteout) {
			p = rdd->first_maybe_whiteout;
			rdd->first_maybe_whiteout = p->next_maybe_whiteout;
			dentry = lookup_one(mnt_idmap(path->mnt), p->name, dir, p->len);
			if (!IS_ERR(dentry)) {
				p->is_whiteout = ovl_is_whiteout(dentry);
				dput(dentry);
			}
		}
		inode_unlock(dir->d_inode);
	}
	ovl_revert_creds(old_cred);

	return err;
}

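/*
 * Whiteout detection is batched: readdir only reports d_type, so every
 * DT_CHR entry is a whiteout candidate. The loop above looks each
 * candidate up under dir->i_rwsem and lets ovl_is_whiteout() check for
 * the character device that marks a whiteout.
 */
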
static inline int ovl_dir_read(const struct path *realpath,
			       struct ovl_readdir_data *rdd)
{
	struct file *realfile;
	int err;

	realfile = ovl_path_open(realpath, O_RDONLY | O_LARGEFILE);
	if (IS_ERR(realfile))
		return PTR_ERR(realfile);

	rdd->first_maybe_whiteout = NULL;
	rdd->ctx.pos = 0;
	do {
		rdd->count = 0;
		rdd->err = 0;
		err = iterate_dir(realfile, &rdd->ctx);
		if (err >= 0)
			err = rdd->err;
	} while (!err && rdd->count);

	if (!err && rdd->first_maybe_whiteout && rdd->dentry)
		err = ovl_check_whiteouts(realpath, rdd);

	fput(realfile);

	return err;
}

static void ovl_dir_reset(struct file *file)
{
	struct ovl_dir_file *od = file->private_data;
	struct ovl_dir_cache *cache = od->cache;
	struct inode *inode = file_inode(file);
	bool is_real;

	if (cache && ovl_inode_version_get(inode) != cache->version) {
		ovl_cache_put(od, inode);
		od->cache = NULL;
		od->cursor = NULL;
	}
	is_real = ovl_dir_is_real(inode);
	if (od->is_real != is_real) {
		/* is_real can only become false when dir is copied up */
		if (WARN_ON(is_real))
			return;
		od->is_real = false;
	}
}

static int ovl_dir_read_merged(struct dentry *dentry, struct list_head *list,
			       struct rb_root *root)
{
	int err;
	struct path realpath;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_merge,
		.dentry = dentry,
		.list = list,
		.root = root,
		.is_lowest = false,
	};
	int idx, next;
	const struct ovl_layer *layer;

	for (idx = 0; idx != -1; idx = next) {
		next = ovl_path_next(idx, dentry, &realpath, &layer);
		rdd.is_upper = ovl_dentry_upper(dentry) == realpath.dentry;
		rdd.in_xwhiteouts_dir = layer->has_xwhiteouts &&
					ovl_dentry_has_xwhiteouts(dentry);

		if (next != -1) {
			err = ovl_dir_read(&realpath, &rdd);
			if (err)
				break;
		} else {
			/*
			 * Insert lowest layer entries before upper ones, this
			 * allows offsets to be reasonably constant
			 */
			list_add(&rdd.middle, rdd.list);
			rdd.is_lowest = true;
			err = ovl_dir_read(&realpath, &rdd);
			list_del(&rdd.middle);
		}
	}
	return err;
}

static void ovl_seek_cursor(struct ovl_dir_file *od, loff_t pos)
{
	struct list_head *p;
	loff_t off = 0;

	list_for_each(p, &od->cache->entries) {
		if (off >= pos)
			break;
		off++;
	}
	/* Cursor is safe since the cache is stable */
	od->cursor = p;
}

static struct ovl_dir_cache *ovl_cache_get(struct dentry *dentry)
{
	int res;
	struct ovl_dir_cache *cache;
	struct inode *inode = d_inode(dentry);

	cache = ovl_dir_cache(inode);
	if (cache && ovl_inode_version_get(inode) == cache->version) {
		WARN_ON(!cache->refcount);
		cache->refcount++;
		return cache;
	}
	ovl_set_dir_cache(d_inode(dentry), NULL);

	cache = kzalloc(sizeof(struct ovl_dir_cache), GFP_KERNEL);
	if (!cache)
		return ERR_PTR(-ENOMEM);

	cache->refcount = 1;
	INIT_LIST_HEAD(&cache->entries);
	cache->root = RB_ROOT;

	res = ovl_dir_read_merged(dentry, &cache->entries, &cache->root);
	if (res) {
		ovl_cache_free(&cache->entries);
		kfree(cache);
		return ERR_PTR(res);
	}

	cache->version = ovl_inode_version_get(inode);
	ovl_set_dir_cache(inode, cache);

	return cache;
}

/* Map inode number to lower fs unique range */
static u64 ovl_remap_lower_ino(u64 ino, int xinobits, int fsid,
			       const char *name, int namelen, bool warn)
{
	unsigned int xinoshift = 64 - xinobits;

	if (unlikely(ino >> xinoshift)) {
		if (warn) {
			pr_warn_ratelimited("d_ino too big (%.*s, ino=%llu, xinobits=%d)\n",
					    namelen, name, ino, xinobits);
		}
		return ino;
	}

	/*
	 * The lowest xinobit is reserved for mapping the non-persistent inode
	 * numbers range, but this range is only exposed via st_ino, not here.
	 */
	return ino | ((u64)fsid) << (xinoshift + 1);
}

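/*
 * Layout example with xinobits = 8 (so xinoshift = 56): a lower inode
 * number must fit in bits 0..55, bit 56 stays reserved for the
 * non-persistent inode range, and fsid lands in bits 57..63. E.g. fsid 2,
 * ino 100 maps to 100 | (2ULL << 57).
 */
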
/*
 * Set d_ino for upper entries if needed. Non-upper entries should always
 * report the uppermost real inode ino and should not call this function.
 *
 * When not all layers are on the same fs, report the real ino also for upper.
 *
 * When all layers are on the same fs, and upper has a reference to
 * copy up origin, call vfs_getattr() on the overlay entry to make
 * sure that d_ino will be consistent with st_ino from stat(2).
 *
 * Also checks for the overlay.whiteout xattr by doing a full lookup,
 * which returns a negative dentry in that case.
 */
static int ovl_cache_update(const struct path *path, struct ovl_cache_entry *p,
			    bool update_ino)
{
	struct dentry *dir = path->dentry;
	struct ovl_fs *ofs = OVL_FS(dir->d_sb);
	struct dentry *this = NULL;
	enum ovl_path_type type;
	u64 ino = p->real_ino;
	int xinobits = ovl_xino_bits(ofs);
	int err = 0;

	if (!ovl_same_dev(ofs) && !p->check_xwhiteout)
		goto out;

	if (p->name[0] == '.') {
		if (p->len == 1) {
			this = dget(dir);
			goto get;
		}
		if (p->len == 2 && p->name[1] == '.') {
			/* we shall not be moved */
			this = dget(dir->d_parent);
			goto get;
		}
	}
	/* This checks also for xwhiteouts */
	this = lookup_one(mnt_idmap(path->mnt), p->name, dir, p->len);
	if (IS_ERR_OR_NULL(this) || !this->d_inode) {
		/* Mark a stale entry */
		p->is_whiteout = true;
		if (IS_ERR(this)) {
			err = PTR_ERR(this);
			this = NULL;
			goto fail;
		}
		goto out;
	}

get:
	if (!ovl_same_dev(ofs) || !update_ino)
		goto out;

	type = ovl_path_type(this);
	if (OVL_TYPE_ORIGIN(type)) {
		struct kstat stat;
		struct path statpath = *path;

		statpath.dentry = this;
		err = vfs_getattr(&statpath, &stat, STATX_INO, 0);
		if (err)
			goto fail;

		/*
		 * Directory inode is always on overlay st_dev.
		 * Non-dir with ovl_same_dev() could be on pseudo st_dev in case
		 * of xino bits overflow.
		 */
		WARN_ON_ONCE(S_ISDIR(stat.mode) &&
			     dir->d_sb->s_dev != stat.dev);
		ino = stat.ino;
	} else if (xinobits && !OVL_TYPE_UPPER(type)) {
		ino = ovl_remap_lower_ino(ino, xinobits,
					  ovl_layer_lower(this)->fsid,
					  p->name, p->len,
					  ovl_xino_warn(ofs));
	}

out:
	p->ino = ino;
	dput(this);
	return err;

fail:
	pr_warn_ratelimited("failed to look up (%s) for ino (%i)\n",
			    p->name, err);
	goto out;
}

static bool ovl_fill_plain(struct dir_context *ctx, const char *name,
			   int namelen, loff_t offset, u64 ino,
			   unsigned int d_type)
{
	struct ovl_cache_entry *p;
	struct ovl_readdir_data *rdd =
		container_of(ctx, struct ovl_readdir_data, ctx);

	rdd->count++;
	p = ovl_cache_entry_new(rdd, name, namelen, ino, d_type);
	if (p == NULL) {
		rdd->err = -ENOMEM;
		return false;
	}
	list_add_tail(&p->l_node, rdd->list);

	return true;
}

static int ovl_dir_read_impure(const struct path *path, struct list_head *list,
			       struct rb_root *root)
{
	int err;
	struct path realpath;
	struct ovl_cache_entry *p, *n;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_plain,
		.list = list,
	};

	INIT_LIST_HEAD(list);
	*root = RB_ROOT;
	ovl_path_upper(path->dentry, &realpath);

	err = ovl_dir_read(&realpath, &rdd);
	if (err)
		return err;

	list_for_each_entry_safe(p, n, list, l_node) {
		if (strcmp(p->name, ".") != 0 &&
		    strcmp(p->name, "..") != 0) {
			err = ovl_cache_update(path, p, true);
			if (err)
				return err;
		}
		if (p->ino == p->real_ino) {
			list_del(&p->l_node);
			kfree(p);
		} else {
			struct rb_node **newp = &root->rb_node;
			struct rb_node *parent = NULL;

			if (WARN_ON(ovl_cache_entry_find_link(p->name, p->len,
							      &newp, &parent)))
				return -EIO;

			rb_link_node(&p->node, parent, newp);
			rb_insert_color(&p->node, root);
		}
	}
	return 0;
}

static struct ovl_dir_cache *ovl_cache_get_impure(const struct path *path)
{
	int res;
	struct dentry *dentry = path->dentry;
	struct inode *inode = d_inode(dentry);
	struct ovl_fs *ofs = OVL_FS(dentry->d_sb);
	struct ovl_dir_cache *cache;

	cache = ovl_dir_cache(inode);
	if (cache && ovl_inode_version_get(inode) == cache->version)
		return cache;

	/* Impure cache is not refcounted, free it here */
	ovl_dir_cache_free(inode);
	ovl_set_dir_cache(inode, NULL);

	cache = kzalloc(sizeof(struct ovl_dir_cache), GFP_KERNEL);
	if (!cache)
		return ERR_PTR(-ENOMEM);

	res = ovl_dir_read_impure(path, &cache->entries, &cache->root);
	if (res) {
		ovl_cache_free(&cache->entries);
		kfree(cache);
		return ERR_PTR(res);
	}
	if (list_empty(&cache->entries)) {
		/*
		 * A good opportunity to get rid of an unneeded "impure" flag.
		 * Removing the "impure" xattr is best effort.
		 */
		if (!ovl_want_write(dentry)) {
			ovl_removexattr(ofs, ovl_dentry_upper(dentry),
					OVL_XATTR_IMPURE);
			ovl_drop_write(dentry);
		}
		ovl_clear_flag(OVL_IMPURE, inode);
		kfree(cache);
		return NULL;
	}

	cache->version = ovl_inode_version_get(inode);
	ovl_set_dir_cache(inode, cache);

	return cache;
}

struct ovl_readdir_translate {
	struct dir_context *orig_ctx;
	struct ovl_dir_cache *cache;
	struct dir_context ctx;
	u64 parent_ino;
	int fsid;
	int xinobits;
	bool xinowarn;
};

static bool ovl_fill_real(struct dir_context *ctx, const char *name,
			  int namelen, loff_t offset, u64 ino,
			  unsigned int d_type)
{
	struct ovl_readdir_translate *rdt =
		container_of(ctx, struct ovl_readdir_translate, ctx);
	struct dir_context *orig_ctx = rdt->orig_ctx;

	if (rdt->parent_ino && strcmp(name, "..") == 0) {
		ino = rdt->parent_ino;
	} else if (rdt->cache) {
		struct ovl_cache_entry *p;

		p = ovl_cache_entry_find(&rdt->cache->root, name, namelen);
		if (p)
			ino = p->ino;
	} else if (rdt->xinobits) {
		ino = ovl_remap_lower_ino(ino, rdt->xinobits, rdt->fsid,
					  name, namelen, rdt->xinowarn);
	}

	return orig_ctx->actor(orig_ctx, name, namelen, offset, ino, d_type);
}

static bool ovl_is_impure_dir(struct file *file)
{
	struct ovl_dir_file *od = file->private_data;
	struct inode *dir = file_inode(file);

	/*
	 * Only upper dir can be impure, but if we are in the middle of
	 * iterating a lower real dir, dir could be copied up and marked
	 * impure. We only want the impure cache if we started iterating
	 * a real upper dir to begin with.
	 */
	return od->is_upper && ovl_test_flag(OVL_IMPURE, dir);
}

static int ovl_iterate_real(struct file *file, struct dir_context *ctx)
{
	int err;
	struct ovl_dir_file *od = file->private_data;
	struct dentry *dir = file->f_path.dentry;
	struct ovl_fs *ofs = OVL_FS(dir->d_sb);
	const struct ovl_layer *lower_layer = ovl_layer_lower(dir);
	struct ovl_readdir_translate rdt = {
		.ctx.actor = ovl_fill_real,
		.orig_ctx = ctx,
		.xinobits = ovl_xino_bits(ofs),
		.xinowarn = ovl_xino_warn(ofs),
	};

	if (rdt.xinobits && lower_layer)
		rdt.fsid = lower_layer->fsid;

	if (OVL_TYPE_MERGE(ovl_path_type(dir->d_parent))) {
		struct kstat stat;
		struct path statpath = file->f_path;

		statpath.dentry = dir->d_parent;
		err = vfs_getattr(&statpath, &stat, STATX_INO, 0);
		if (err)
			return err;

		WARN_ON_ONCE(dir->d_sb->s_dev != stat.dev);
		rdt.parent_ino = stat.ino;
	}

	if (ovl_is_impure_dir(file)) {
		rdt.cache = ovl_cache_get_impure(&file->f_path);
		if (IS_ERR(rdt.cache))
			return PTR_ERR(rdt.cache);
	}

	err = iterate_dir(od->realfile, &rdt.ctx);
	ctx->pos = rdt.ctx.pos;

	return err;
}

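/*
 * ovl_iterate_real() feeds the real directory's entries through
 * ovl_fill_real(), which only rewrites d_ino: ".." takes the parent merge
 * dir's ino, impure-dir entries take the ino cached by
 * ovl_cache_get_impure(), and plain lower entries get xino-remapped.
 * Names and offsets pass through to the caller's dir_context untouched.
 */
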
static int ovl_iterate(struct file *file, struct dir_context *ctx)
{
	struct ovl_dir_file *od = file->private_data;
	struct dentry *dentry = file->f_path.dentry;
	struct ovl_fs *ofs = OVL_FS(dentry->d_sb);
	struct ovl_cache_entry *p;
	const struct cred *old_cred;
	int err;

	old_cred = ovl_override_creds(dentry->d_sb);
	if (!ctx->pos)
		ovl_dir_reset(file);

	if (od->is_real) {
		/*
		 * If parent is merge, then need to adjust d_ino for '..', if
		 * dir is impure then need to adjust d_ino for copied up
		 * entries.
		 */
		if (ovl_xino_bits(ofs) ||
		    (ovl_same_fs(ofs) &&
		     (ovl_is_impure_dir(file) ||
		      OVL_TYPE_MERGE(ovl_path_type(dentry->d_parent))))) {
			err = ovl_iterate_real(file, ctx);
		} else {
			err = iterate_dir(od->realfile, ctx);
		}
		goto out;
	}

	if (!od->cache) {
		struct ovl_dir_cache *cache;

		cache = ovl_cache_get(dentry);
		err = PTR_ERR(cache);
		if (IS_ERR(cache))
			goto out;

		od->cache = cache;
		ovl_seek_cursor(od, ctx->pos);
	}

	while (od->cursor != &od->cache->entries) {
		p = list_entry(od->cursor, struct ovl_cache_entry, l_node);
		if (!p->is_whiteout) {
			if (!p->ino || p->check_xwhiteout) {
				err = ovl_cache_update(&file->f_path, p, !p->ino);
				if (err)
					goto out;
			}
		}
		/* ovl_cache_update() sets is_whiteout on stale entry */
		if (!p->is_whiteout) {
			if (!dir_emit(ctx, p->name, p->len, p->ino, p->type))
				break;
		}
		od->cursor = p->l_node.next;
		ctx->pos++;
	}
	err = 0;
out:
	ovl_revert_creds(old_cred);
	return err;
}

static loff_t ovl_dir_llseek(struct file *file, loff_t offset, int origin)
{
	loff_t res;
	struct ovl_dir_file *od = file->private_data;

	inode_lock(file_inode(file));
	if (!file->f_pos)
		ovl_dir_reset(file);

	if (od->is_real) {
		res = vfs_llseek(od->realfile, offset, origin);
		file->f_pos = od->realfile->f_pos;
	} else {
		res = -EINVAL;

		switch (origin) {
		case SEEK_CUR:
			offset += file->f_pos;
			break;
		case SEEK_SET:
			break;
		default:
			goto out_unlock;
		}
		if (offset < 0)
			goto out_unlock;

		if (offset != file->f_pos) {
			file->f_pos = offset;
			if (od->cache)
				ovl_seek_cursor(od, offset);
		}
		res = offset;
	}
out_unlock:
	inode_unlock(file_inode(file));

	return res;
}

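/*
 * For a merged directory, f_pos is simply an index into the cached entry
 * list (ovl_iterate() advances it by one per emitted entry), so seeking
 * just repositions the cursor with ovl_seek_cursor(). For a real
 * directory the seek is delegated to the underlying filesystem via
 * vfs_llseek().
 */
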
static struct file *ovl_dir_open_realfile(const struct file *file,
					  const struct path *realpath)
{
	struct file *res;
	const struct cred *old_cred;

	old_cred = ovl_override_creds(file_inode(file)->i_sb);
	res = ovl_path_open(realpath, O_RDONLY | (file->f_flags & O_LARGEFILE));
	ovl_revert_creds(old_cred);

	return res;
}

/*
 * Like ovl_real_fdget(), returns upperfile if dir was copied up since open.
 * Unlike ovl_real_fdget(), this caches upperfile in file->private_data.
 *
 * TODO: use same abstract type for file->private_data of dir and file so
 * upperfile could also be cached for files as well.
 */
struct file *ovl_dir_real_file(const struct file *file, bool want_upper)
{
	struct ovl_dir_file *od = file->private_data;
	struct dentry *dentry = file->f_path.dentry;
	struct file *old, *realfile = od->realfile;

	if (!OVL_TYPE_UPPER(ovl_path_type(dentry)))
		return want_upper ? NULL : realfile;

	/*
	 * Need to check if we started out being a lower dir, but got copied up
	 */
	if (!od->is_upper) {
		realfile = READ_ONCE(od->upperfile);
		if (!realfile) {
			struct path upperpath;

			ovl_path_upper(dentry, &upperpath);
			realfile = ovl_dir_open_realfile(file, &upperpath);
			if (IS_ERR(realfile))
				return realfile;

			old = cmpxchg_release(&od->upperfile, NULL, realfile);
			if (old) {
				fput(realfile);
				realfile = old;
			}
		}
	}

	return realfile;
}

static int ovl_dir_fsync(struct file *file, loff_t start, loff_t end,
			 int datasync)
{
	struct file *realfile;
	int err;

	err = ovl_sync_status(OVL_FS(file_inode(file)->i_sb));
	if (err <= 0)
		return err;

	realfile = ovl_dir_real_file(file, true);
	err = PTR_ERR_OR_ZERO(realfile);

	/* Nothing to sync for lower */
	if (!realfile || err)
		return err;

	return vfs_fsync_range(realfile, start, end, datasync);
}

static int ovl_dir_release(struct inode *inode, struct file *file)
{
	struct ovl_dir_file *od = file->private_data;

	if (od->cache) {
		inode_lock(inode);
		ovl_cache_put(od, inode);
		inode_unlock(inode);
	}
	fput(od->realfile);
	if (od->upperfile)
		fput(od->upperfile);
	kfree(od);

	return 0;
}

static int ovl_dir_open(struct inode *inode, struct file *file)
{
	struct path realpath;
	struct file *realfile;
	struct ovl_dir_file *od;
	enum ovl_path_type type;

	od = kzalloc(sizeof(struct ovl_dir_file), GFP_KERNEL);
	if (!od)
		return -ENOMEM;

	type = ovl_path_real(file->f_path.dentry, &realpath);
	realfile = ovl_dir_open_realfile(file, &realpath);
	if (IS_ERR(realfile)) {
		kfree(od);
		return PTR_ERR(realfile);
	}
	od->realfile = realfile;
	od->is_real = ovl_dir_is_real(inode);
	od->is_upper = OVL_TYPE_UPPER(type);
	file->private_data = od;

	return 0;
}

WRAP_DIR_ITER(ovl_iterate) // FIXME!
const struct file_operations ovl_dir_operations = {
	.read		= generic_read_dir,
	.open		= ovl_dir_open,
	.iterate_shared	= shared_ovl_iterate,
	.llseek		= ovl_dir_llseek,
	.fsync		= ovl_dir_fsync,
	.release	= ovl_dir_release,
};

int ovl_check_empty_dir(struct dentry *dentry, struct list_head *list)
{
	int err;
	struct ovl_cache_entry *p, *n;
	struct rb_root root = RB_ROOT;
	const struct cred *old_cred;

	old_cred = ovl_override_creds(dentry->d_sb);
	err = ovl_dir_read_merged(dentry, list, &root);
	ovl_revert_creds(old_cred);
	if (err)
		return err;

	err = 0;

	list_for_each_entry_safe(p, n, list, l_node) {
		/*
		 * Select whiteouts in upperdir, they should
		 * be cleared when deleting this directory.
		 */
		if (p->is_whiteout) {
			if (p->is_upper)
				continue;
			goto del_entry;
		}

		if (p->name[0] == '.') {
			if (p->len == 1)
				goto del_entry;
			if (p->len == 2 && p->name[1] == '.')
				goto del_entry;
		}
		err = -ENOTEMPTY;
		break;

del_entry:
		list_del(&p->l_node);
		kfree(p);
	}

	return err;
}

void ovl_cleanup_whiteouts(struct ovl_fs *ofs, struct dentry *upper,
			   struct list_head *list)
{
	struct ovl_cache_entry *p;

	inode_lock_nested(upper->d_inode, I_MUTEX_CHILD);
	list_for_each_entry(p, list, l_node) {
		struct dentry *dentry;

		if (WARN_ON(!p->is_whiteout || !p->is_upper))
			continue;

		dentry = ovl_lookup_upper(ofs, p->name, upper, p->len);
		if (IS_ERR(dentry)) {
			pr_err("lookup '%s/%.*s' failed (%i)\n",
			       upper->d_name.name, p->len, p->name,
			       (int) PTR_ERR(dentry));
			continue;
		}
		if (dentry->d_inode)
			ovl_cleanup(ofs, upper->d_inode, dentry);
		dput(dentry);
	}
	inode_unlock(upper->d_inode);
}

static bool ovl_check_d_type(struct dir_context *ctx, const char *name,
			     int namelen, loff_t offset, u64 ino,
			     unsigned int d_type)
{
	struct ovl_readdir_data *rdd =
		container_of(ctx, struct ovl_readdir_data, ctx);

	/* Even if d_type is not supported, DT_DIR is returned for . and .. */
	if (!strncmp(name, ".", namelen) || !strncmp(name, "..", namelen))
		return true;

	if (d_type != DT_UNKNOWN)
		rdd->d_type_supported = true;

	return true;
}

/*
 * Returns 1 if d_type is supported, 0 if not supported/unknown, or a
 * negative value if an error is encountered.
 */
int ovl_check_d_type_supported(const struct path *realpath)
{
	int err;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_check_d_type,
		.d_type_supported = false,
	};

	err = ovl_dir_read(realpath, &rdd);
	if (err)
		return err;

	return rdd.d_type_supported;
}

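/*
 * Typical use at mount time (illustrative sketch; the real caller lives
 * in the overlayfs mount code):
 *
 *	err = ovl_check_d_type_supported(&workpath);
 *	if (err < 0)
 *		return err;
 *	if (!err)
 *		pr_warn("upper fs needs to support d_type.\n");
 */
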
#define OVL_INCOMPATDIR_NAME "incompat"

static int ovl_workdir_cleanup_recurse(struct ovl_fs *ofs, const struct path *path,
				       int level)
{
	int err;
	struct inode *dir = path->dentry->d_inode;
	LIST_HEAD(list);
	struct ovl_cache_entry *p;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_plain,
		.list = &list,
	};
	bool incompat = false;

	/*
	 * The "work/incompat" directory is treated specially - if it is not
	 * empty, instead of printing a generic error and mounting read-only,
	 * we will error about incompat features and fail the mount.
	 *
	 * When called from ovl_indexdir_cleanup(), path->dentry->d_name.name
	 * starts with '#'.
	 */
	if (level == 2 &&
	    !strcmp(path->dentry->d_name.name, OVL_INCOMPATDIR_NAME))
		incompat = true;

	err = ovl_dir_read(path, &rdd);
	if (err)
		goto out;

	inode_lock_nested(dir, I_MUTEX_PARENT);
	list_for_each_entry(p, &list, l_node) {
		struct dentry *dentry;

		if (p->name[0] == '.') {
			if (p->len == 1)
				continue;
			if (p->len == 2 && p->name[1] == '.')
				continue;
		} else if (incompat) {
			pr_err("overlay with incompat feature '%s' cannot be mounted\n",
			       p->name);
			err = -EINVAL;
			break;
		}
		dentry = ovl_lookup_upper(ofs, p->name, path->dentry, p->len);
		if (IS_ERR(dentry))
			continue;
		if (dentry->d_inode)
			err = ovl_workdir_cleanup(ofs, dir, path->mnt, dentry, level);
		dput(dentry);
		if (err)
			break;
	}
	inode_unlock(dir);
out:
	ovl_cache_free(&list);
	return err;
}

int ovl_workdir_cleanup(struct ovl_fs *ofs, struct inode *dir,
			struct vfsmount *mnt, struct dentry *dentry, int level)
{
	int err;

	if (!d_is_dir(dentry) || level > 1) {
		return ovl_cleanup(ofs, dir, dentry);
	}

	err = ovl_do_rmdir(ofs, dir, dentry);
	if (err) {
		struct path path = { .mnt = mnt, .dentry = dentry };

		inode_unlock(dir);
		err = ovl_workdir_cleanup_recurse(ofs, &path, level + 1);
		inode_lock_nested(dir, I_MUTEX_PARENT);
		if (!err)
			err = ovl_cleanup(ofs, dir, dentry);
	}

	return err;
}

int ovl_indexdir_cleanup(struct ovl_fs *ofs)
{
	int err;
	struct dentry *indexdir = ofs->workdir;
	struct dentry *index = NULL;
	struct inode *dir = indexdir->d_inode;
	struct path path = { .mnt = ovl_upper_mnt(ofs), .dentry = indexdir };
	LIST_HEAD(list);
	struct ovl_cache_entry *p;
	struct ovl_readdir_data rdd = {
		.ctx.actor = ovl_fill_plain,
		.list = &list,
	};

	err = ovl_dir_read(&path, &rdd);
	if (err)
		goto out;

	inode_lock_nested(dir, I_MUTEX_PARENT);
	list_for_each_entry(p, &list, l_node) {
		if (p->name[0] == '.') {
			if (p->len == 1)
				continue;
			if (p->len == 2 && p->name[1] == '.')
				continue;
		}
		index = ovl_lookup_upper(ofs, p->name, indexdir, p->len);
		if (IS_ERR(index)) {
			err = PTR_ERR(index);
			index = NULL;
			break;
		}
		/* Cleanup leftover from index create/cleanup attempt */
		if (index->d_name.name[0] == '#') {
			err = ovl_workdir_cleanup(ofs, dir, path.mnt, index, 1);
			if (err)
				break;
			goto next;
		}
		err = ovl_verify_index(ofs, index);
		if (!err) {
			goto next;
		} else if (err == -ESTALE) {
			/* Cleanup stale index entries */
			err = ovl_cleanup(ofs, dir, index);
		} else if (err != -ENOENT) {
			/*
			 * Abort mount to avoid corrupting the index if
			 * an incompatible index entry was found or on out
			 * of memory.
			 */
			break;
		} else if (ofs->config.nfs_export) {
			/*
			 * Whiteout orphan index to block future open by
			 * handle after overlay nlink dropped to zero.
			 */
			err = ovl_cleanup_and_whiteout(ofs, dir, index);
		} else {
			/* Cleanup orphan index entries */
			err = ovl_cleanup(ofs, dir, index);
		}

		if (err)
			break;

next:
		dput(index);
		index = NULL;
	}
	dput(index);
	inode_unlock(dir);
out:
	ovl_cache_free(&list);
	if (err)
		pr_err("failed index dir cleanup (%i)\n", err);
	return err;
}