1 // SPDX-License-Identifier: GPL-2.0
/*
 * devtmpfs - kernel-maintained tmpfs-based /dev
 *
 * Copyright (C) 2009, Kay Sievers <kay.sievers@vrfy.org>
 *
 * During bootup, before any driver-core device is registered,
 * devtmpfs, a tmpfs-based filesystem, is created. Every driver-core
 * device which requests a device node will add a node in this
 * filesystem.
 *
 * By default, all devices are named after the name of the device,
 * owned by root and have a default mode of 0600. Subsystems can
 * override the default setting if needed.
 */
16 #include <linux/kernel.h>
17 #include <linux/syscalls.h>
18 #include <linux/mount.h>
19 #include <linux/device.h>
20 #include <linux/genhd.h>
21 #include <linux/namei.h>
23 #include <linux/shmem_fs.h>
24 #include <linux/ramfs.h>
25 #include <linux/sched.h>
26 #include <linux/slab.h>
27 #include <linux/kthread.h>
28 #include <linux/init_syscalls.h>
29 #include <uapi/linux/mount.h>
32 static struct task_struct
*thread
;
34 static int __initdata mount_dev
= IS_ENABLED(CONFIG_DEVTMPFS_MOUNT
);
36 static DEFINE_SPINLOCK(req_lock
);
40 struct completion done
;
43 umode_t mode
; /* 0 => delete */
49 static int __init
mount_param(char *str
)
51 mount_dev
= simple_strtoul(str
, NULL
, 0);
54 __setup("devtmpfs.mount=", mount_param
);
56 static struct vfsmount
*mnt
;
58 static struct dentry
*public_dev_mount(struct file_system_type
*fs_type
, int flags
,
59 const char *dev_name
, void *data
)
61 struct super_block
*s
= mnt
->mnt_sb
;
62 atomic_inc(&s
->s_active
);
63 down_write(&s
->s_umount
);
64 return dget(s
->s_root
);
67 static struct file_system_type internal_fs_type
= {
70 .init_fs_context
= shmem_init_fs_context
,
71 .parameters
= shmem_fs_parameters
,
73 .init_fs_context
= ramfs_init_fs_context
,
74 .parameters
= ramfs_fs_parameters
,
76 .kill_sb
= kill_litter_super
,
79 static struct file_system_type dev_fs_type
= {
81 .mount
= public_dev_mount
,
85 static inline int is_blockdev(struct device
*dev
)
87 return dev
->class == &block_class
;
90 static inline int is_blockdev(struct device
*dev
) { return 0; }
93 static int devtmpfs_submit_req(struct req
*req
, const char *tmp
)
95 init_completion(&req
->done
);
100 spin_unlock(&req_lock
);
102 wake_up_process(thread
);
103 wait_for_completion(&req
->done
);
110 int devtmpfs_create_node(struct device
*dev
)
112 const char *tmp
= NULL
;
119 req
.uid
= GLOBAL_ROOT_UID
;
120 req
.gid
= GLOBAL_ROOT_GID
;
121 req
.name
= device_get_devnode(dev
, &req
.mode
, &req
.uid
, &req
.gid
, &tmp
);
127 if (is_blockdev(dev
))
134 return devtmpfs_submit_req(&req
, tmp
);
137 int devtmpfs_delete_node(struct device
*dev
)
139 const char *tmp
= NULL
;
145 req
.name
= device_get_devnode(dev
, NULL
, NULL
, NULL
, &tmp
);
152 return devtmpfs_submit_req(&req
, tmp
);
155 static int dev_mkdir(const char *name
, umode_t mode
)
157 struct dentry
*dentry
;
161 dentry
= kern_path_create(AT_FDCWD
, name
, &path
, LOOKUP_DIRECTORY
);
163 return PTR_ERR(dentry
);
165 err
= vfs_mkdir(d_inode(path
.dentry
), dentry
, mode
);
167 /* mark as kernel-created inode */
168 d_inode(dentry
)->i_private
= &thread
;
169 done_path_create(&path
, dentry
);
173 static int create_path(const char *nodepath
)
179 /* parent directories do not exist, create them */
180 path
= kstrdup(nodepath
, GFP_KERNEL
);
190 err
= dev_mkdir(path
, 0755);
191 if (err
&& err
!= -EEXIST
)
200 static int handle_create(const char *nodename
, umode_t mode
, kuid_t uid
,
201 kgid_t gid
, struct device
*dev
)
203 struct dentry
*dentry
;
207 dentry
= kern_path_create(AT_FDCWD
, nodename
, &path
, 0);
208 if (dentry
== ERR_PTR(-ENOENT
)) {
209 create_path(nodename
);
210 dentry
= kern_path_create(AT_FDCWD
, nodename
, &path
, 0);
213 return PTR_ERR(dentry
);
215 err
= vfs_mknod(d_inode(path
.dentry
), dentry
, mode
, dev
->devt
);
217 struct iattr newattrs
;
219 newattrs
.ia_mode
= mode
;
220 newattrs
.ia_uid
= uid
;
221 newattrs
.ia_gid
= gid
;
222 newattrs
.ia_valid
= ATTR_MODE
|ATTR_UID
|ATTR_GID
;
223 inode_lock(d_inode(dentry
));
224 notify_change(dentry
, &newattrs
, NULL
);
225 inode_unlock(d_inode(dentry
));
227 /* mark as kernel-created inode */
228 d_inode(dentry
)->i_private
= &thread
;
230 done_path_create(&path
, dentry
);
234 static int dev_rmdir(const char *name
)
237 struct dentry
*dentry
;
240 dentry
= kern_path_locked(name
, &parent
);
242 return PTR_ERR(dentry
);
243 if (d_really_is_positive(dentry
)) {
244 if (d_inode(dentry
)->i_private
== &thread
)
245 err
= vfs_rmdir(d_inode(parent
.dentry
), dentry
);
252 inode_unlock(d_inode(parent
.dentry
));
257 static int delete_path(const char *nodepath
)
262 path
= kstrdup(nodepath
, GFP_KERNEL
);
269 base
= strrchr(path
, '/');
273 err
= dev_rmdir(path
);
282 static int dev_mynode(struct device
*dev
, struct inode
*inode
, struct kstat
*stat
)
284 /* did we create it */
285 if (inode
->i_private
!= &thread
)
288 /* does the dev_t match */
289 if (is_blockdev(dev
)) {
290 if (!S_ISBLK(stat
->mode
))
293 if (!S_ISCHR(stat
->mode
))
296 if (stat
->rdev
!= dev
->devt
)
303 static int handle_remove(const char *nodename
, struct device
*dev
)
306 struct dentry
*dentry
;
310 dentry
= kern_path_locked(nodename
, &parent
);
312 return PTR_ERR(dentry
);
314 if (d_really_is_positive(dentry
)) {
316 struct path p
= {.mnt
= parent
.mnt
, .dentry
= dentry
};
317 err
= vfs_getattr(&p
, &stat
, STATX_TYPE
| STATX_MODE
,
318 AT_STATX_SYNC_AS_STAT
);
319 if (!err
&& dev_mynode(dev
, d_inode(dentry
), &stat
)) {
320 struct iattr newattrs
;
322 * before unlinking this node, reset permissions
323 * of possible references like hardlinks
325 newattrs
.ia_uid
= GLOBAL_ROOT_UID
;
326 newattrs
.ia_gid
= GLOBAL_ROOT_GID
;
327 newattrs
.ia_mode
= stat
.mode
& ~0777;
329 ATTR_UID
|ATTR_GID
|ATTR_MODE
;
330 inode_lock(d_inode(dentry
));
331 notify_change(dentry
, &newattrs
, NULL
);
332 inode_unlock(d_inode(dentry
));
333 err
= vfs_unlink(d_inode(parent
.dentry
), dentry
, NULL
);
334 if (!err
|| err
== -ENOENT
)
341 inode_unlock(d_inode(parent
.dentry
));
344 if (deleted
&& strchr(nodename
, '/'))
345 delete_path(nodename
);
/*
 * If configured, or requested on the kernel command line, devtmpfs will be
 * auto-mounted after the kernel has mounted the root filesystem.
 */
353 int __init
devtmpfs_mount(void)
363 err
= init_mount("devtmpfs", "dev", "devtmpfs", MS_SILENT
, NULL
);
365 printk(KERN_INFO
"devtmpfs: error mounting %i\n", err
);
367 printk(KERN_INFO
"devtmpfs: mounted\n");
/*
 * Signalled by devtmpfs_setup() via complete(); devtmpfs_init() blocks on
 * it after starting the "kdevtmpfs" thread.
 */
static DECLARE_COMPLETION(setup_done);
373 static int handle(const char *name
, umode_t mode
, kuid_t uid
, kgid_t gid
,
377 return handle_create(name
, mode
, uid
, gid
, dev
);
379 return handle_remove(name
, dev
);
382 static void __noreturn
devtmpfs_work_loop(void)
385 spin_lock(&req_lock
);
387 struct req
*req
= requests
;
389 spin_unlock(&req_lock
);
391 struct req
*next
= req
->next
;
392 req
->err
= handle(req
->name
, req
->mode
,
393 req
->uid
, req
->gid
, req
->dev
);
394 complete(&req
->done
);
397 spin_lock(&req_lock
);
399 __set_current_state(TASK_INTERRUPTIBLE
);
400 spin_unlock(&req_lock
);
405 static int __init
devtmpfs_setup(void *p
)
409 err
= ksys_unshare(CLONE_NEWNS
);
412 err
= init_mount("devtmpfs", "/", "devtmpfs", MS_SILENT
, NULL
);
415 init_chdir("/.."); /* will traverse into overmounted root */
419 complete(&setup_done
);
/*
 * devtmpfsd() is marked __ref because devtmpfs_setup() has to be __init for
 * the sake of the routines it calls. The call is safe: it happens while
 * devtmpfs_init(), itself marked __init, synchronously waits for the setup
 * to complete.
 */
428 static int __ref
devtmpfsd(void *p
)
430 int err
= devtmpfs_setup(p
);
434 devtmpfs_work_loop();
/*
 * Create the devtmpfs instance; driver-core devices will add their device
 * nodes to it.
 */
442 int __init
devtmpfs_init(void)
444 char opts
[] = "mode=0755";
447 mnt
= vfs_kern_mount(&internal_fs_type
, 0, "devtmpfs", opts
);
449 printk(KERN_ERR
"devtmpfs: unable to create devtmpfs %ld\n",
453 err
= register_filesystem(&dev_fs_type
);
455 printk(KERN_ERR
"devtmpfs: unable to register devtmpfs "
460 thread
= kthread_run(devtmpfsd
, &err
, "kdevtmpfs");
461 if (!IS_ERR(thread
)) {
462 wait_for_completion(&setup_done
);
464 err
= PTR_ERR(thread
);
469 printk(KERN_ERR
"devtmpfs: unable to create devtmpfs %i\n", err
);
470 unregister_filesystem(&dev_fs_type
);
474 printk(KERN_INFO
"devtmpfs: initialized\n");