4 * Copyright (C) 1991, 1992 Linus Torvalds
6 * proc root directory handling functions
9 #include <asm/uaccess.h>
11 #include <linux/errno.h>
12 #include <linux/time.h>
13 #include <linux/proc_fs.h>
14 #include <linux/stat.h>
15 #include <linux/init.h>
16 #include <linux/sched.h>
17 #include <linux/module.h>
18 #include <linux/bitops.h>
19 #include <linux/user_namespace.h>
20 #include <linux/mount.h>
21 #include <linux/pid_namespace.h>
22 #include <linux/parser.h>
/*
 * sget() test callback (see proc_mount): reports whether this superblock
 * is the one whose s_fs_info equals the pointer passed as data.
 * proc_mount passes the pid namespace as that pointer.
 * Returns nonzero on a match, zero otherwise.
 */
26 static int proc_test_super(struct super_block
*sb
, void *data
)
28 return sb
->s_fs_info
== data
;
/*
 * sget() set callback (see proc_mount): prepares a superblock for the
 * pid namespace passed as data.
 * Calls set_anon_super(sb, NULL) and keeps its result in err, then stores
 * the value returned by get_pid_ns(ns) in sb->s_fs_info.
 * NOTE(review): the check on err and the return statement are not visible
 * in this listing - confirm that the namespace reference is only taken
 * when set_anon_super() succeeded and that err is what gets returned.
 */
31 static int proc_set_super(struct super_block
*sb
, void *data
)
33 int err
= set_anon_super(sb
, NULL
);
/* data is the pid namespace pointer that proc_mount hands to sget() */
35 struct pid_namespace
*ns
= (struct pid_namespace
*)data
;
36 sb
->s_fs_info
= get_pid_ns(ns
);
/*
 * Identifiers for the mount options understood by proc_parse_options.
 * Opt_hidepid is paired with the hidepid=%u pattern in the tokens table.
 * NOTE(review): the table entries for Opt_gid and Opt_err are not visible
 * in this listing - presumably a gid pattern and a terminating entry.
 */
42 Opt_gid
, Opt_hidepid
, Opt_err
,
/*
 * Pattern table handed to match_token() in proc_parse_options.
 * Each entry pairs an option identifier with the pattern it matches;
 * the visible entry maps Opt_hidepid to hidepid=<unsigned integer>.
 */
45 static const match_table_t tokens
= {
46 {Opt_hidepid
, "hidepid=%u"},
/*
 * Parse a comma separated procfs mount option string and apply the
 * recognised settings to the pid namespace.
 *
 * options: option string; it is split with strsep(), so it is modified
 *          in place.
 * pid:     pid namespace whose pid_gid and hide_pid fields are updated.
 *
 * Callers treat the result as a boolean: proc_mount fails with -EINVAL
 * when this returns zero, and proc_remount returns the logical negation.
 * NOTE(review): the case labels and the return statements are not visible
 * in this listing; the branch descriptions below are inferred from the
 * fields written and the messages logged - confirm against the full file.
 * NOTE(review): fields are written as each option is parsed, so an error
 * in a later option presumably leaves earlier ones applied - confirm.
 */
51 static int proc_parse_options(char *options
, struct pid_namespace
*pid
)
/* receives the substrings captured by match_token() */
54 substring_t args
[MAX_OPT_ARGS
];
/* walk the string one comma separated item at a time */
60 while ((p
= strsep(&options
, ",")) != NULL
) {
/* clear the first capture slot before matching this item */
65 args
[0].to
= args
[0].from
= NULL
;
66 token
= match_token(p
, tokens
, args
);
/* presumably the gid option: numeric value becomes pid->pid_gid */
69 if (match_int(&args
[0], &option
))
/* the number is mapped to a kgid in the user namespace of the caller */
71 pid
->pid_gid
= make_kgid(current_user_ns(), option
);
/* hidepid option: numeric value, accepted only in the range 0..2 */
74 if (match_int(&args
[0], &option
))
76 if (option
< 0 || option
> 2) {
77 pr_err("proc: hidepid value must be between 0 and 2.\n");
80 pid
->hide_pid
= option
;
83 pr_err("proc: unrecognized mount option \"%s\" "
84 "or missing value\n", p
);
/*
 * Re-apply mount options to an already mounted procfs instance.
 *
 * sb:    superblock being remounted; its s_fs_info is used as the pid
 *        namespace to update.
 * flags: not referenced in the lines visible here.
 * data:  option string passed on to proc_parse_options.
 *
 * Returns the logical negation of proc_parse_options(), i.e. 0 when the
 * parser reports success (nonzero) and 1 when it reports failure (zero).
 * NOTE(review): the failure value is 1 rather than a negative errno -
 * confirm that callers only test for nonzero.
 */
92 int proc_remount(struct super_block
*sb
, int *flags
, char *data
)
94 struct pid_namespace
*pid
= sb
->s_fs_info
;
97 return !proc_parse_options(data
, pid
);
/*
 * Mount procfs for a pid namespace and return a reference to its root
 * dentry, or an ERR_PTR() value on failure.
 *
 * fs_type:  filesystem type, forwarded to sget().
 * flags:    mount flags; MS_KERNMOUNT selects where the namespace
 *           comes from (see below).
 * dev_name: not referenced in the lines visible here.
 * data:     with MS_KERNMOUNT, the pid namespace itself.
 *
 * Visible steps:
 *  - pick the pid namespace: data when MS_KERNMOUNT is set, and
 *    task_active_pid_ns(current) in the other visible assignment;
 *  - refuse with -EPERM when the mounter lacks CAP_SYS_ADMIN in the user
 *    namespace of that pid namespace;
 *  - look up or create the superblock through sget(), using
 *    proc_test_super and proc_set_super with the namespace as key;
 *  - set s_stack_depth to FILESYSTEM_MAX_STACK_DEPTH;
 *  - parse the mount options; on failure drop the superblock with
 *    deactivate_locked_super() and return -EINVAL;
 *  - call proc_fill_super(), then set MS_ACTIVE and SB_I_NOEXEC;
 *  - return dget(sb->s_root).
 * NOTE(review): the declarations and assignments of options and err, the
 * else branch, the error check on the sget() result and the condition
 * guarding proc_fill_super() are not visible in this listing - confirm
 * them against the full file before relying on this summary.
 */
100 static struct dentry
*proc_mount(struct file_system_type
*fs_type
,
101 int flags
, const char *dev_name
, void *data
)
104 struct super_block
*sb
;
105 struct pid_namespace
*ns
;
/* in-kernel mounts pass the namespace directly through data */
108 if (flags
& MS_KERNMOUNT
) {
109 ns
= (struct pid_namespace
*)data
;
/* otherwise use the active pid namespace of the mounting task */
112 ns
= task_active_pid_ns(current
);
115 /* Does the mounter have privilege over the pid namespace? */
116 if (!ns_capable(ns
->user_ns
, CAP_SYS_ADMIN
))
117 return ERR_PTR(-EPERM
);
/* ns is the data argument seen by proc_test_super and proc_set_super */
120 sb
= sget(fs_type
, proc_test_super
, proc_set_super
, flags
, ns
);
125 * procfs isn't actually a stacking filesystem; however, there is
126 * too much magic going on inside it to permit stacking things on
129 sb
->s_stack_depth
= FILESYSTEM_MAX_STACK_DEPTH
;
131 if (!proc_parse_options(options
, ns
)) {
132 deactivate_locked_super(sb
);
133 return ERR_PTR(-EINVAL
);
137 err
= proc_fill_super(sb
);
139 deactivate_locked_super(sb
);
143 sb
->s_flags
|= MS_ACTIVE
;
144 /* User space would break if executables appear on proc */
145 sb
->s_iflags
|= SB_I_NOEXEC
;
148 return dget(sb
->s_root
);
/*
 * kill_sb callback of proc_fs_type: tears down a procfs superblock.
 * Reads the pid namespace from sb->s_fs_info and, when the namespace
 * holds a proc_thread_self dentry, releases it with dput().
 * NOTE(review): the remaining teardown steps are not visible in this
 * listing - presumably other cached dentries and the namespace reference
 * taken in proc_set_super are released here as well; confirm.
 */
151 static void proc_kill_sb(struct super_block
*sb
)
153 struct pid_namespace
*ns
;
/* s_fs_info was set to the pid namespace in proc_set_super */
155 ns
= (struct pid_namespace
*)sb
->s_fs_info
;
158 if (ns
->proc_thread_self
)
159 dput(ns
->proc_thread_self
);
/*
 * Filesystem type descriptor for procfs. It is registered by
 * proc_root_init via register_filesystem() and used for the in-kernel
 * mount made by pid_ns_prepare_proc.
 * Visible fields: kill_sb points at proc_kill_sb, and fs_flags carries
 * FS_USERNS_VISIBLE and FS_USERNS_MOUNT.
 * NOTE(review): the name and mount fields are not visible in this
 * listing - presumably mount is proc_mount; confirm.
 */
164 static struct file_system_type proc_fs_type
= {
167 .kill_sb
= proc_kill_sb
,
168 .fs_flags
= FS_USERNS_VISIBLE
| FS_USERNS_MOUNT
,
/*
 * Boot-time setup of procfs (marked __init).
 * Initialises the inode cache, registers proc_fs_type, sets up the
 * thread-self entry and creates the fixed top-level entries:
 * the mounts symlink (target self/mounts), the sysvipc directory when
 * CONFIG_SYSVIPC is set, the fs and driver directories, the fs/nfsd
 * mount point, the openprom mount point when the OPENPROMFS options are
 * set, and the bus directory.
 * NOTE(review): the handling of err after register_filesystem(), the
 * matching #endif lines and any further init calls are not visible in
 * this listing - confirm against the full file.
 */
171 void __init
proc_root_init(void)
175 proc_init_inodecache();
176 err
= register_filesystem(&proc_fs_type
);
181 proc_thread_self_init();
182 proc_symlink("mounts", NULL
, "self/mounts");
186 #ifdef CONFIG_SYSVIPC
187 proc_mkdir("sysvipc", NULL
);
189 proc_mkdir("fs", NULL
);
190 proc_mkdir("driver", NULL
);
191 proc_create_mount_point("fs/nfsd"); /* somewhere for the nfsd filesystem to be mounted */
192 #if defined(CONFIG_SUN_OPENPROMFS) || defined(CONFIG_SUN_OPENPROMFS_MODULE)
193 /* just give it a mountpoint */
194 proc_create_mount_point("openprom");
197 proc_mkdir("bus", NULL
);
/*
 * getattr handler for the procfs root directory (installed in
 * proc_root_inode_operations).
 * Fills stat from the inode of dentry with generic_fillattr(), then
 * overrides the link count with proc_root.nlink plus the value of
 * nr_processes().
 * mnt is not referenced in the lines visible here.
 * NOTE(review): the return statement is not visible in this listing.
 */
201 static int proc_root_getattr(struct vfsmount
*mnt
, struct dentry
*dentry
, struct kstat
*stat
204 generic_fillattr(d_inode(dentry
), stat
);
/* static link count of the root entry plus one per process */
205 stat
->nlink
= proc_root
.nlink
+ nr_processes();
/*
 * lookup handler for the procfs root directory (installed in
 * proc_root_inode_operations).
 * Tries proc_pid_lookup() first; when that returns zero the statement
 * guarded by the if runs, otherwise the result of proc_lookup() for the
 * same arguments is returned.
 * NOTE(review): the statement guarded by the if is not visible in this
 * listing - presumably an early return for names resolved as pid
 * entries; confirm.
 */
209 static struct dentry
*proc_root_lookup(struct inode
* dir
, struct dentry
* dentry
, unsigned int flags
)
211 if (!proc_pid_lookup(dir
, dentry
, flags
))
214 return proc_lookup(dir
, dentry
, flags
);
/*
 * iterate handler for the procfs root directory (installed in
 * proc_root_operations).
 * While ctx->pos is below FIRST_PROCESS_ENTRY the regular entries are
 * emitted through proc_readdir(); afterwards ctx->pos is moved to
 * FIRST_PROCESS_ENTRY and the listing continues with proc_pid_readdir(),
 * whose result is returned.
 * NOTE(review): the statement guarded by the error check is not visible
 * in this listing - presumably it returns error when proc_readdir()
 * yields a value less than or equal to zero; confirm.
 */
217 static int proc_root_readdir(struct file
*file
, struct dir_context
*ctx
)
/* positions below FIRST_PROCESS_ENTRY are handled by proc_readdir */
219 if (ctx
->pos
< FIRST_PROCESS_ENTRY
) {
220 int error
= proc_readdir(file
, ctx
);
221 if (unlikely(error
<= 0))
223 ctx
->pos
= FIRST_PROCESS_ENTRY
;
226 return proc_pid_readdir(file
, ctx
);
230 * The root /proc directory is special, as it has the
231 * <pid> directories. Thus we don't use the generic
232 * directory handling functions for that..
/*
 * File operations of the procfs root directory, referenced from
 * proc_root.proc_fops: read uses generic_read_dir, directory iteration
 * uses proc_root_readdir, and seeking uses default_llseek.
 */
234 static const struct file_operations proc_root_operations
= {
235 .read
= generic_read_dir
,
236 .iterate
= proc_root_readdir
,
237 .llseek
= default_llseek
,
241 * proc root can do almost nothing..
/*
 * Inode operations of the procfs root directory, referenced from
 * proc_root.proc_iops: only lookup (proc_root_lookup) and getattr
 * (proc_root_getattr) are set in the lines visible here.
 */
243 static const struct inode_operations proc_root_inode_operations
= {
244 .lookup
= proc_root_lookup
,
245 .getattr
= proc_root_getattr
,
249 * This is the root "inode" in the /proc tree..
/*
 * Directory entry describing the procfs root.
 * Visible fields: inode number PROC_ROOT_INO, mode of a directory that
 * is readable and searchable by user, group and others, a reference
 * count starting at 1, the root specific inode and file operations, and
 * a parent pointer that refers back to this entry itself.
 * NOTE(review): further fields (for example nlink, which
 * proc_root_getattr reads) are not visible in this listing.
 */
251 struct proc_dir_entry proc_root
= {
252 .low_ino
= PROC_ROOT_INO
,
254 .mode
= S_IFDIR
| S_IRUGO
| S_IXUGO
,
256 .count
= ATOMIC_INIT(1),
257 .proc_iops
= &proc_root_inode_operations
,
258 .proc_fops
= &proc_root_operations
,
/* the root is its own parent */
259 .parent
= &proc_root
,
/*
 * Create the in-kernel procfs mount for a pid namespace by calling
 * kern_mount_data() with proc_fs_type and the namespace as mount data.
 * NOTE(review): the error check on mnt, the place where the mount is
 * stored and the return value are not visible in this listing -
 * presumably the result ends up in ns->proc_mnt, which
 * pid_ns_release_proc later unmounts; confirm.
 */
264 int pid_ns_prepare_proc(struct pid_namespace
*ns
)
266 struct vfsmount
*mnt
;
268 mnt
= kern_mount_data(&proc_fs_type
, ns
);
/*
 * Drop the in-kernel procfs mount of a pid namespace by passing
 * ns->proc_mnt to kern_unmount().
 */
276 void pid_ns_release_proc(struct pid_namespace
*ns
)
278 kern_unmount(ns
->proc_mnt
);