blob: 4aa9ce5df02ffc9b6daf9d1d47157f5aee660799 [file] [log] [blame]
Greg Kroah-Hartmanb2441312017-11-01 15:07:57 +01001// SPDX-License-Identifier: GPL-2.0
Linus Torvalds1da177e2005-04-16 15:20:36 -07002/*
3 * linux/fs/proc/base.c
4 *
5 * Copyright (C) 1991, 1992 Linus Torvalds
6 *
7 * proc base directory handling functions
8 *
9 * 1999, Al Viro. Rewritten. Now it covers the whole per-process part.
10 * Instead of using magical inumbers to determine the kind of object
11 * we allocate and fill in-core inodes upon lookup. They don't even
12 * go into icache. We cache the reference to task_struct upon lookup too.
13 * Eventually it should become a filesystem in its own. We don't use the
14 * rest of procfs anymore.
Mauricio Line070ad42005-09-03 15:55:10 -070015 *
16 *
17 * Changelog:
18 * 17-Jan-2005
19 * Allan Bezerra
20 * Bruna Moreira <bruna.moreira@indt.org.br>
21 * Edjard Mota <edjard.mota@indt.org.br>
22 * Ilias Biris <ilias.biris@indt.org.br>
23 * Mauricio Lin <mauricio.lin@indt.org.br>
24 *
25 * Embedded Linux Lab - 10LE Instituto Nokia de Tecnologia - INdT
26 *
27 * A new process specific entry (smaps) included in /proc. It shows the
28 * size of rss for each memory area. The maps entry lacks information
29 * about physical memory size (rss) for each mapped file, i.e.,
30 * rss information for executables and library files.
31 * This additional information is useful for any tools that need to know
32 * about physical memory consumption for a process specific library.
33 *
34 * Changelog:
35 * 21-Feb-2005
36 * Embedded Linux Lab - 10LE Instituto Nokia de Tecnologia - INdT
37 * Pud inclusion in the page table walking.
38 *
39 * ChangeLog:
40 * 10-Mar-2005
41 * 10LE Instituto Nokia de Tecnologia - INdT:
42 * A better way to walk through the page table as suggested by Hugh Dickins.
43 *
44 * Simo Piiroinen <simo.piiroinen@nokia.com>:
45 * Smaps information related to shared, private, clean and dirty pages.
46 *
47 * Paul Mundt <paul.mundt@nokia.com>:
48 * Overall revision about smaps.
Linus Torvalds1da177e2005-04-16 15:20:36 -070049 */
50
Linus Torvalds7c0f6ba2016-12-24 11:46:01 -080051#include <linux/uaccess.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070052
Linus Torvalds1da177e2005-04-16 15:20:36 -070053#include <linux/errno.h>
54#include <linux/time.h>
55#include <linux/proc_fs.h>
56#include <linux/stat.h>
Andrea Righi59954772008-07-27 17:29:15 +020057#include <linux/task_io_accounting_ops.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070058#include <linux/init.h>
Randy Dunlap16f7e0f2006-01-11 12:17:46 -080059#include <linux/capability.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070060#include <linux/file.h>
Al Viro9f3acc32008-04-24 07:44:08 -040061#include <linux/fdtable.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070062#include <linux/string.h>
63#include <linux/seq_file.h>
64#include <linux/namei.h>
Kirill Korotaev6b3286e2006-12-08 02:37:56 -080065#include <linux/mnt_namespace.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070066#include <linux/mm.h>
David Rientjesa63d83f2010-08-09 17:19:46 -070067#include <linux/swap.h>
Dipankar Sarmab8359962005-09-09 13:04:14 -070068#include <linux/rcupdate.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070069#include <linux/kallsyms.h>
Ken Chen2ec220e2008-11-10 11:26:08 +030070#include <linux/stacktrace.h>
Neil Hormand85f50d2007-10-18 23:40:37 -070071#include <linux/resource.h>
Kees Cook5096add2007-05-08 00:26:04 -070072#include <linux/module.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070073#include <linux/mount.h>
74#include <linux/security.h>
75#include <linux/ptrace.h>
Roland McGrath0d094ef2008-07-25 19:45:49 -070076#include <linux/tracehook.h>
Andrew Morton87ebdc02013-02-27 17:03:16 -080077#include <linux/printk.h>
Alexey Dobriyanefb1a572018-02-06 15:37:24 -080078#include <linux/cache.h>
Paul Menagea4243162007-10-18 23:39:35 -070079#include <linux/cgroup.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070080#include <linux/cpuset.h>
81#include <linux/audit.h>
Al Viro5addc5d2005-11-07 17:15:49 -050082#include <linux/poll.h>
Serge E. Hallyn1651e142006-10-02 02:18:08 -070083#include <linux/nsproxy.h>
Alexey Dobriyan8ac773b2006-10-19 23:28:32 -070084#include <linux/oom.h>
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -070085#include <linux/elf.h>
Pavel Emelyanov60347f62007-10-18 23:40:03 -070086#include <linux/pid_namespace.h>
Eric W. Biederman22d917d2011-11-17 00:11:58 -080087#include <linux/user_namespace.h>
Al Viro5ad4e532009-03-29 19:50:06 -040088#include <linux/fs_struct.h>
Tejun Heo5a0e3ad2010-03-24 17:04:11 +090089#include <linux/slab.h>
Ingo Molnar4eb5aaa2017-02-08 18:51:29 +010090#include <linux/sched/autogroup.h>
Ingo Molnar6e84f312017-02-08 18:51:29 +010091#include <linux/sched/mm.h>
Ingo Molnarf7ccbae2017-02-08 18:51:30 +010092#include <linux/sched/coredump.h>
Ingo Molnarb17b0152017-02-08 18:51:35 +010093#include <linux/sched/debug.h>
Ingo Molnar3905f9a2017-02-05 12:07:04 +010094#include <linux/sched/stat.h>
Pavel Emelyanov640708a2012-01-10 15:11:23 -080095#include <linux/flex_array.h>
Pavel Emelyanov48f6a7a2013-03-11 13:12:45 +040096#include <linux/posix-timers.h>
KAMEZAWA Hiroyuki43d2b112012-01-10 15:08:09 -080097#include <trace/events/oom.h>
Linus Torvalds1da177e2005-04-16 15:20:36 -070098#include "internal.h"
Cyrill Gorcunovfaf60af2012-08-23 14:43:24 +040099#include "fd.h"
Linus Torvalds1da177e2005-04-16 15:20:36 -0700100
Alexey Dobriyanac7f1062018-02-06 15:36:59 -0800101#include "../../lib/kstrtox.h"
102
Eric W. Biederman0f2fe202006-06-26 00:25:46 -0700103/* NOTE:
104 * Implementing inode permission operations in /proc is almost
105 * certainly an error. Permission checks need to happen during
106 * each system call not at open time. The reason is that most of
107 * what we wish to check for permissions in /proc varies at runtime.
108 *
109 * The classic example of a problem is opening file descriptors
110 * in /proc for a task before it execs a suid executable.
111 */
112
Alexey Dobriyanefb1a572018-02-06 15:37:24 -0800113static u8 nlink_tid __ro_after_init;
114static u8 nlink_tgid __ro_after_init;
Alexey Dobriyan1270dd82016-12-12 16:45:32 -0800115
Linus Torvalds1da177e2005-04-16 15:20:36 -0700116struct pid_entry {
Alexey Dobriyancedbcca2014-08-08 14:21:33 -0700117 const char *name;
Alexey Dobriyan623f5942016-12-12 16:45:08 -0800118 unsigned int len;
Al Virod161a132011-07-24 03:36:29 -0400119 umode_t mode;
Arjan van de Venc5ef1c42007-02-12 00:55:40 -0800120 const struct inode_operations *iop;
Arjan van de Ven00977a52007-02-12 00:55:34 -0800121 const struct file_operations *fop;
Eric W. Biederman20cdc892006-10-02 02:17:07 -0700122 union proc_op op;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700123};
124
/*
 * Generic struct pid_entry initializer.  NAME has to be a string literal:
 * its length is computed with sizeof() at compile time.
 */
#define NOD(NAME, MODE, IOP, FOP, OP) {				\
	.name	= (NAME),					\
	.len	= sizeof(NAME) - 1,				\
	.mode	= MODE,						\
	.iop	= IOP,						\
	.fop	= FOP,						\
	.op	= OP,						\
}

/* Directory with its own inode and file operations. */
#define DIR(NAME, MODE, iops, fops)				\
	NOD(NAME, (S_IFDIR|(MODE)), &iops, &fops, {} )

/* Symlink (mode rwx for everybody) resolved through @get_link. */
#define LNK(NAME, get_link)					\
	NOD(NAME, (S_IFLNK|S_IRWXUGO),				\
		&proc_pid_link_inode_operations, NULL,		\
		{ .proc_get_link = get_link } )

/* Regular file served by a dedicated file_operations table. */
#define REG(NAME, MODE, fops)					\
	NOD(NAME, (S_IFREG|(MODE)), NULL, &fops, {})

/* Regular file rendered by a single @show callback through seq_file. */
#define ONE(NAME, MODE, show)					\
	NOD(NAME, (S_IFREG|(MODE)),				\
		NULL, &proc_single_file_operations,		\
		{ .proc_show = show } )
Linus Torvalds1da177e2005-04-16 15:20:36 -0700146
Vegard Nossumaed54172008-06-05 22:46:53 -0700147/*
148 * Count the number of hardlinks for the pid_entry table, excluding the .
149 * and .. links.
150 */
Alexey Dobriyan1270dd82016-12-12 16:45:32 -0800151static unsigned int __init pid_entry_nlink(const struct pid_entry *entries,
Vegard Nossumaed54172008-06-05 22:46:53 -0700152 unsigned int n)
153{
154 unsigned int i;
155 unsigned int count;
156
Alexey Dobriyan1270dd82016-12-12 16:45:32 -0800157 count = 2;
Vegard Nossumaed54172008-06-05 22:46:53 -0700158 for (i = 0; i < n; ++i) {
159 if (S_ISDIR(entries[i].mode))
160 ++count;
161 }
162
163 return count;
164}
165
Miklos Szeredif7ad3c62010-08-10 11:41:36 +0200166static int get_task_root(struct task_struct *task, struct path *root)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700167{
Hugh Dickins7c2c7d92009-03-28 23:21:27 +0000168 int result = -ENOENT;
169
Miklos Szeredi0494f6e2005-09-06 15:18:22 -0700170 task_lock(task);
Miklos Szeredif7ad3c62010-08-10 11:41:36 +0200171 if (task->fs) {
172 get_fs_root(task->fs, root);
Hugh Dickins7c2c7d92009-03-28 23:21:27 +0000173 result = 0;
174 }
Miklos Szeredi0494f6e2005-09-06 15:18:22 -0700175 task_unlock(task);
Hugh Dickins7c2c7d92009-03-28 23:21:27 +0000176 return result;
Miklos Szeredi0494f6e2005-09-06 15:18:22 -0700177}
178
Cyrill Gorcunov7773fbc2012-01-10 15:11:20 -0800179static int proc_cwd_link(struct dentry *dentry, struct path *path)
Miklos Szeredi0494f6e2005-09-06 15:18:22 -0700180{
David Howells2b0143b2015-03-17 22:25:59 +0000181 struct task_struct *task = get_proc_task(d_inode(dentry));
Miklos Szeredi0494f6e2005-09-06 15:18:22 -0700182 int result = -ENOENT;
Eric W. Biederman99f89552006-06-26 00:25:55 -0700183
184 if (task) {
Miklos Szeredif7ad3c62010-08-10 11:41:36 +0200185 task_lock(task);
186 if (task->fs) {
187 get_fs_pwd(task->fs, path);
188 result = 0;
189 }
190 task_unlock(task);
Eric W. Biederman99f89552006-06-26 00:25:55 -0700191 put_task_struct(task);
192 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700193 return result;
194}
195
Cyrill Gorcunov7773fbc2012-01-10 15:11:20 -0800196static int proc_root_link(struct dentry *dentry, struct path *path)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700197{
David Howells2b0143b2015-03-17 22:25:59 +0000198 struct task_struct *task = get_proc_task(d_inode(dentry));
Linus Torvalds1da177e2005-04-16 15:20:36 -0700199 int result = -ENOENT;
Eric W. Biederman99f89552006-06-26 00:25:55 -0700200
201 if (task) {
Miklos Szeredif7ad3c62010-08-10 11:41:36 +0200202 result = get_task_root(task, path);
Eric W. Biederman99f89552006-06-26 00:25:55 -0700203 put_task_struct(task);
204 }
Linus Torvalds1da177e2005-04-16 15:20:36 -0700205 return result;
206}
207
Linus Torvaldse4b4e442018-05-17 13:04:17 -0700208static ssize_t get_mm_cmdline(struct mm_struct *mm, char __user *buf,
Linus Torvalds5ab82712018-05-17 15:17:33 -0700209 size_t count, loff_t *ppos)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700210{
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700211 unsigned long arg_start, arg_end, env_start, env_end;
Linus Torvalds5ab82712018-05-17 15:17:33 -0700212 unsigned long pos, len;
213 char *page;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700214
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700215 /* Check if process spawned far enough to have cmdline. */
Linus Torvaldse4b4e442018-05-17 13:04:17 -0700216 if (!mm->env_end)
217 return 0;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700218
Yang Shi88aa7cc2018-06-07 17:05:28 -0700219 spin_lock(&mm->arg_lock);
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700220 arg_start = mm->arg_start;
221 arg_end = mm->arg_end;
222 env_start = mm->env_start;
223 env_end = mm->env_end;
Yang Shi88aa7cc2018-06-07 17:05:28 -0700224 spin_unlock(&mm->arg_lock);
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700225
Linus Torvalds5ab82712018-05-17 15:17:33 -0700226 if (arg_start >= arg_end)
227 return 0;
Alexey Dobriyan6a6cbe72018-06-07 17:09:59 -0700228
Alexey Dobriyan2ca66ff2014-08-08 14:21:41 -0700229 /*
Linus Torvalds5ab82712018-05-17 15:17:33 -0700230 * We have traditionally allowed the user to re-write
231 * the argument strings and overflow the end result
232 * into the environment section. But only do that if
233 * the environment area is contiguous to the arguments.
Alexey Dobriyan2ca66ff2014-08-08 14:21:41 -0700234 */
Linus Torvalds5ab82712018-05-17 15:17:33 -0700235 if (env_start != arg_end || env_start >= env_end)
236 env_start = env_end = arg_end;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700237
Linus Torvalds5ab82712018-05-17 15:17:33 -0700238 /* We're not going to care if "*ppos" has high bits set */
239 pos = arg_start + *ppos;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700240
Linus Torvalds5ab82712018-05-17 15:17:33 -0700241 /* .. but we do check the result is in the proper range */
242 if (pos < arg_start || pos >= env_end)
243 return 0;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700244
Linus Torvalds5ab82712018-05-17 15:17:33 -0700245 /* .. and we never go past env_end */
246 if (env_end - pos < count)
247 count = env_end - pos;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700248
Linus Torvalds5ab82712018-05-17 15:17:33 -0700249 page = (char *)__get_free_page(GFP_KERNEL);
250 if (!page)
251 return -ENOMEM;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700252
Linus Torvalds5ab82712018-05-17 15:17:33 -0700253 len = 0;
254 while (count) {
255 int got;
256 size_t size = min_t(size_t, PAGE_SIZE, count);
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700257
Linus Torvalds5ab82712018-05-17 15:17:33 -0700258 got = access_remote_vm(mm, pos, page, size, FOLL_ANON);
259 if (got <= 0)
260 break;
261
262 /* Don't walk past a NUL character once you hit arg_end */
263 if (pos + got >= arg_end) {
264 int n = 0;
265
266 /*
267 * If we started before 'arg_end' but ended up
268 * at or after it, we start the NUL character
269 * check at arg_end-1 (where we expect the normal
270 * EOF to be).
271 *
272 * NOTE! This is smaller than 'got', because
273 * pos + got >= arg_end
274 */
275 if (pos < arg_end)
276 n = arg_end - pos - 1;
277
278 /* Cut off at first NUL after 'n' */
279 got = n + strnlen(page+n, got-n);
280 if (!got)
281 break;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700282 }
Alexey Dobriyana0a07b82017-02-24 15:00:20 -0800283
Linus Torvalds5ab82712018-05-17 15:17:33 -0700284 got -= copy_to_user(buf, page, got);
285 if (unlikely(!got)) {
286 if (!len)
287 len = -EFAULT;
288 break;
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700289 }
Linus Torvalds5ab82712018-05-17 15:17:33 -0700290 pos += got;
291 buf += got;
292 len += got;
293 count -= got;
Alexey Dobriyan3cb4e162018-06-07 17:10:02 -0700294 }
295
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700296 free_page((unsigned long)page);
Linus Torvalds5ab82712018-05-17 15:17:33 -0700297 return len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700298}
299
Linus Torvaldse4b4e442018-05-17 13:04:17 -0700300static ssize_t get_task_cmdline(struct task_struct *tsk, char __user *buf,
301 size_t count, loff_t *pos)
302{
303 struct mm_struct *mm;
304 ssize_t ret;
305
306 mm = get_task_mm(tsk);
307 if (!mm)
308 return 0;
309
310 ret = get_mm_cmdline(mm, buf, count, pos);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700311 mmput(mm);
Linus Torvaldse4b4e442018-05-17 13:04:17 -0700312 return ret;
313}
314
315static ssize_t proc_pid_cmdline_read(struct file *file, char __user *buf,
316 size_t count, loff_t *pos)
317{
318 struct task_struct *tsk;
319 ssize_t ret;
320
321 BUG_ON(*pos < 0);
322
323 tsk = get_proc_task(file_inode(file));
324 if (!tsk)
325 return -ESRCH;
326 ret = get_task_cmdline(tsk, buf, count, pos);
327 put_task_struct(tsk);
328 if (ret > 0)
329 *pos += ret;
330 return ret;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700331}
332
Alexey Dobriyanc2c0bb42015-06-25 15:00:54 -0700333static const struct file_operations proc_pid_cmdline_ops = {
334 .read = proc_pid_cmdline_read,
335 .llseek = generic_file_llseek,
336};
337
#ifdef CONFIG_KALLSYMS
/*
 * Provides a wchan file via kallsyms in a proper one-value-per-file format.
 *
 * Prints the symbol name resolved for the task's wait channel.  Prints a
 * single '0' instead when the reader fails the PTRACE_MODE_READ_FSCREDS
 * check, when get_wchan() yields 0, or when the symbol lookup fails.
 * Always returns 0.
 */
static int proc_pid_wchan(struct seq_file *m, struct pid_namespace *ns,
			  struct pid *pid, struct task_struct *task)
{
	char symname[KSYM_NAME_LEN];
	unsigned long wchan;

	if (ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS)) {
		wchan = get_wchan(task);
		if (wchan && !lookup_symbol_name(wchan, symname)) {
			seq_puts(m, symname);
			return 0;
		}
	}

	seq_putc(m, '0');
	return 0;
}
#endif /* CONFIG_KALLSYMS */
363
Al Viroa9712bc2011-03-23 15:52:50 -0400364static int lock_trace(struct task_struct *task)
365{
366 int err = mutex_lock_killable(&task->signal->cred_guard_mutex);
367 if (err)
368 return err;
Jann Horncaaee622016-01-20 15:00:04 -0800369 if (!ptrace_may_access(task, PTRACE_MODE_ATTACH_FSCREDS)) {
Al Viroa9712bc2011-03-23 15:52:50 -0400370 mutex_unlock(&task->signal->cred_guard_mutex);
371 return -EPERM;
372 }
373 return 0;
374}
375
376static void unlock_trace(struct task_struct *task)
377{
378 mutex_unlock(&task->signal->cred_guard_mutex);
379}
380
#ifdef CONFIG_STACKTRACE

#define MAX_STACK_TRACE_DEPTH	64

/*
 * Print the saved stack trace of @task, one "[<0>] symbol" line per entry.
 *
 * The trace is captured while holding the lock taken by lock_trace(), so
 * the caller must pass its ptrace-attach check.
 *
 * Returns 0 on success, -ENOMEM if the entry buffer cannot be allocated,
 * or the error reported by lock_trace().
 */
static int proc_pid_stack(struct seq_file *m, struct pid_namespace *ns,
			  struct pid *pid, struct task_struct *task)
{
	struct stack_trace trace;
	unsigned long *entries;
	int err;

	/* kmalloc_array() checks the count * size multiplication for us */
	entries = kmalloc_array(MAX_STACK_TRACE_DEPTH, sizeof(*entries),
				GFP_KERNEL);
	if (!entries)
		return -ENOMEM;

	trace.nr_entries	= 0;
	trace.max_entries	= MAX_STACK_TRACE_DEPTH;
	trace.entries		= entries;
	trace.skip		= 0;

	err = lock_trace(task);
	if (!err) {
		unsigned int i;

		save_stack_trace_tsk(task, &trace);

		for (i = 0; i < trace.nr_entries; i++)
			seq_printf(m, "[<0>] %pB\n", (void *)entries[i]);

		unlock_trace(task);
	}
	kfree(entries);

	return err;
}
#endif
417
#ifdef CONFIG_SCHED_INFO
/*
 * Provides /proc/PID/schedstat
 *
 * Prints three numbers on one line: se.sum_exec_runtime,
 * sched_info.run_delay and sched_info.pcount of @task, or "0 0 0" when
 * sched_info_on() reports that the statistics are off.  Always returns 0.
 */
static int proc_pid_schedstat(struct seq_file *m, struct pid_namespace *ns,
			      struct pid *pid, struct task_struct *task)
{
	if (unlikely(!sched_info_on())) {
		/* constant string: no format parsing needed */
		seq_puts(m, "0 0 0\n");
	} else {
		seq_printf(m, "%llu %llu %lu\n",
			   (unsigned long long)task->se.sum_exec_runtime,
			   (unsigned long long)task->sched_info.run_delay,
			   task->sched_info.pcount);
	}

	return 0;
}
#endif
436
Arjan van de Ven97455122008-01-25 21:08:34 +0100437#ifdef CONFIG_LATENCYTOP
438static int lstats_show_proc(struct seq_file *m, void *v)
439{
440 int i;
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800441 struct inode *inode = m->private;
442 struct task_struct *task = get_proc_task(inode);
Arjan van de Ven97455122008-01-25 21:08:34 +0100443
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800444 if (!task)
445 return -ESRCH;
446 seq_puts(m, "Latency Top version : v0.1\n");
Arjan van de Ven97455122008-01-25 21:08:34 +0100447 for (i = 0; i < 32; i++) {
Joe Perches34e49d42011-01-12 17:00:30 -0800448 struct latency_record *lr = &task->latency_record[i];
449 if (lr->backtrace[0]) {
Arjan van de Ven97455122008-01-25 21:08:34 +0100450 int q;
Joe Perches34e49d42011-01-12 17:00:30 -0800451 seq_printf(m, "%i %li %li",
452 lr->count, lr->time, lr->max);
Arjan van de Ven97455122008-01-25 21:08:34 +0100453 for (q = 0; q < LT_BACKTRACEDEPTH; q++) {
Joe Perches34e49d42011-01-12 17:00:30 -0800454 unsigned long bt = lr->backtrace[q];
455 if (!bt)
Arjan van de Ven97455122008-01-25 21:08:34 +0100456 break;
Joe Perches34e49d42011-01-12 17:00:30 -0800457 if (bt == ULONG_MAX)
Arjan van de Ven97455122008-01-25 21:08:34 +0100458 break;
Joe Perches34e49d42011-01-12 17:00:30 -0800459 seq_printf(m, " %ps", (void *)bt);
Arjan van de Ven97455122008-01-25 21:08:34 +0100460 }
Alexey Dobriyan9d6de122011-01-12 17:00:32 -0800461 seq_putc(m, '\n');
Arjan van de Ven97455122008-01-25 21:08:34 +0100462 }
463
464 }
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800465 put_task_struct(task);
Arjan van de Ven97455122008-01-25 21:08:34 +0100466 return 0;
467}
468
469static int lstats_open(struct inode *inode, struct file *file)
470{
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800471 return single_open(file, lstats_show_proc, inode);
Hiroshi Shimamotod6643d12008-02-14 10:27:00 -0800472}
473
Arjan van de Ven97455122008-01-25 21:08:34 +0100474static ssize_t lstats_write(struct file *file, const char __user *buf,
475 size_t count, loff_t *offs)
476{
Al Viro496ad9a2013-01-23 17:07:38 -0500477 struct task_struct *task = get_proc_task(file_inode(file));
Arjan van de Ven97455122008-01-25 21:08:34 +0100478
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800479 if (!task)
480 return -ESRCH;
Arjan van de Ven97455122008-01-25 21:08:34 +0100481 clear_all_latency_tracing(task);
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800482 put_task_struct(task);
Arjan van de Ven97455122008-01-25 21:08:34 +0100483
484 return count;
485}
486
487static const struct file_operations proc_lstats_operations = {
488 .open = lstats_open,
489 .read = seq_read,
490 .write = lstats_write,
491 .llseek = seq_lseek,
Hiroshi Shimamoto13d77c32008-02-20 16:53:29 -0800492 .release = single_release,
Arjan van de Ven97455122008-01-25 21:08:34 +0100493};
494
495#endif
496
Alexey Dobriyan6ba51e32014-08-08 14:21:48 -0700497static int proc_oom_score(struct seq_file *m, struct pid_namespace *ns,
498 struct pid *pid, struct task_struct *task)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700499{
David Rientjesa7f638f2012-05-29 15:06:47 -0700500 unsigned long totalpages = totalram_pages + total_swap_pages;
Oleg Nesterovb95c35e2010-04-01 15:13:57 +0200501 unsigned long points = 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700502
Oleg Nesterovef419392016-08-02 14:03:19 -0700503 points = oom_badness(task, NULL, NULL, totalpages) *
504 1000 / totalpages;
Joe Perches25ce3192015-04-15 16:18:17 -0700505 seq_printf(m, "%lu\n", points);
506
507 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700508}
509
/* Display strings of one resource limit, see lnames[]. */
struct limit_names {
	const char *name;	/* text for the "Limit" column */
	const char *unit;	/* text for the "Units" column, or NULL */
};
514
515static const struct limit_names lnames[RLIM_NLIMITS] = {
Kees Cookcff4edb2009-09-22 16:45:32 -0700516 [RLIMIT_CPU] = {"Max cpu time", "seconds"},
Neil Hormand85f50d2007-10-18 23:40:37 -0700517 [RLIMIT_FSIZE] = {"Max file size", "bytes"},
518 [RLIMIT_DATA] = {"Max data size", "bytes"},
519 [RLIMIT_STACK] = {"Max stack size", "bytes"},
520 [RLIMIT_CORE] = {"Max core file size", "bytes"},
521 [RLIMIT_RSS] = {"Max resident set", "bytes"},
522 [RLIMIT_NPROC] = {"Max processes", "processes"},
523 [RLIMIT_NOFILE] = {"Max open files", "files"},
524 [RLIMIT_MEMLOCK] = {"Max locked memory", "bytes"},
525 [RLIMIT_AS] = {"Max address space", "bytes"},
526 [RLIMIT_LOCKS] = {"Max file locks", "locks"},
527 [RLIMIT_SIGPENDING] = {"Max pending signals", "signals"},
528 [RLIMIT_MSGQUEUE] = {"Max msgqueue size", "bytes"},
529 [RLIMIT_NICE] = {"Max nice priority", NULL},
530 [RLIMIT_RTPRIO] = {"Max realtime priority", NULL},
Eugene Teo88081172008-02-23 15:23:52 -0800531 [RLIMIT_RTTIME] = {"Max realtime timeout", "us"},
Neil Hormand85f50d2007-10-18 23:40:37 -0700532};
533
534/* Display limits for a process */
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700535static int proc_pid_limits(struct seq_file *m, struct pid_namespace *ns,
536 struct pid *pid, struct task_struct *task)
Neil Hormand85f50d2007-10-18 23:40:37 -0700537{
538 unsigned int i;
Neil Hormand85f50d2007-10-18 23:40:37 -0700539 unsigned long flags;
Neil Hormand85f50d2007-10-18 23:40:37 -0700540
541 struct rlimit rlim[RLIM_NLIMITS];
542
Lai Jiangshana6bebbc2008-10-05 00:51:15 +0400543 if (!lock_task_sighand(task, &flags))
Neil Hormand85f50d2007-10-18 23:40:37 -0700544 return 0;
Neil Hormand85f50d2007-10-18 23:40:37 -0700545 memcpy(rlim, task->signal->rlim, sizeof(struct rlimit) * RLIM_NLIMITS);
546 unlock_task_sighand(task, &flags);
Neil Hormand85f50d2007-10-18 23:40:37 -0700547
548 /*
549 * print the file header
550 */
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700551 seq_printf(m, "%-25s %-20s %-20s %-10s\n",
Joe Perches25ce3192015-04-15 16:18:17 -0700552 "Limit", "Soft Limit", "Hard Limit", "Units");
Neil Hormand85f50d2007-10-18 23:40:37 -0700553
554 for (i = 0; i < RLIM_NLIMITS; i++) {
555 if (rlim[i].rlim_cur == RLIM_INFINITY)
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700556 seq_printf(m, "%-25s %-20s ",
Joe Perches25ce3192015-04-15 16:18:17 -0700557 lnames[i].name, "unlimited");
Neil Hormand85f50d2007-10-18 23:40:37 -0700558 else
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700559 seq_printf(m, "%-25s %-20lu ",
Joe Perches25ce3192015-04-15 16:18:17 -0700560 lnames[i].name, rlim[i].rlim_cur);
Neil Hormand85f50d2007-10-18 23:40:37 -0700561
562 if (rlim[i].rlim_max == RLIM_INFINITY)
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700563 seq_printf(m, "%-20s ", "unlimited");
Neil Hormand85f50d2007-10-18 23:40:37 -0700564 else
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700565 seq_printf(m, "%-20lu ", rlim[i].rlim_max);
Neil Hormand85f50d2007-10-18 23:40:37 -0700566
567 if (lnames[i].unit)
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700568 seq_printf(m, "%-10s\n", lnames[i].unit);
Neil Hormand85f50d2007-10-18 23:40:37 -0700569 else
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700570 seq_putc(m, '\n');
Neil Hormand85f50d2007-10-18 23:40:37 -0700571 }
572
Alexey Dobriyan1c963eb2014-08-08 14:21:37 -0700573 return 0;
Neil Hormand85f50d2007-10-18 23:40:37 -0700574}
575
#ifdef CONFIG_HAVE_ARCH_TRACEHOOK
/*
 * Print the system call @task is currently in.
 *
 * Output is "running" when task_current_syscall() fails, "nr sp pc" when
 * the reported syscall number is negative, and otherwise
 * "nr arg0..arg5 sp pc".  The query runs under lock_trace(); its error is
 * returned if the lock cannot be taken, 0 otherwise.
 */
static int proc_pid_syscall(struct seq_file *m, struct pid_namespace *ns,
			    struct pid *pid, struct task_struct *task)
{
	unsigned long args[6], sp, pc;
	long nr;
	int res = lock_trace(task);

	if (res)
		return res;

	if (task_current_syscall(task, &nr, args, 6, &sp, &pc)) {
		seq_puts(m, "running\n");
	} else if (nr >= 0) {
		seq_printf(m,
			   "%ld 0x%lx 0x%lx 0x%lx 0x%lx 0x%lx 0x%lx 0x%lx 0x%lx\n",
			   nr,
			   args[0], args[1], args[2], args[3], args[4], args[5],
			   sp, pc);
	} else {
		seq_printf(m, "%ld 0x%lx 0x%lx\n", nr, sp, pc);
	}
	unlock_trace(task);

	return 0;
}
#endif /* CONFIG_HAVE_ARCH_TRACEHOOK */
603
Linus Torvalds1da177e2005-04-16 15:20:36 -0700604/************************************************************************/
605/* Here the fs part begins */
606/************************************************************************/
607
608/* permission checks */
Eric W. Biederman778c1142006-06-26 00:25:58 -0700609static int proc_fd_access_allowed(struct inode *inode)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700610{
Eric W. Biederman778c1142006-06-26 00:25:58 -0700611 struct task_struct *task;
612 int allowed = 0;
Eric W. Biedermandf26c402006-06-26 00:25:59 -0700613 /* Allow access to a task's file descriptors if it is us or we
614 * may use ptrace attach to the process and find out that
615 * information.
Eric W. Biederman778c1142006-06-26 00:25:58 -0700616 */
617 task = get_proc_task(inode);
Eric W. Biedermandf26c402006-06-26 00:25:59 -0700618 if (task) {
Jann Horncaaee622016-01-20 15:00:04 -0800619 allowed = ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS);
Eric W. Biederman778c1142006-06-26 00:25:58 -0700620 put_task_struct(task);
Eric W. Biedermandf26c402006-06-26 00:25:59 -0700621 }
Eric W. Biederman778c1142006-06-26 00:25:58 -0700622 return allowed;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700623}
624
Eric W. Biederman6b4e3062010-03-07 16:41:34 -0800625int proc_setattr(struct dentry *dentry, struct iattr *attr)
Linus Torvalds6d76fa52006-07-15 12:26:45 -0700626{
627 int error;
David Howells2b0143b2015-03-17 22:25:59 +0000628 struct inode *inode = d_inode(dentry);
Linus Torvalds6d76fa52006-07-15 12:26:45 -0700629
630 if (attr->ia_valid & ATTR_MODE)
631 return -EPERM;
632
Jan Kara31051c82016-05-26 16:55:18 +0200633 error = setattr_prepare(dentry, attr);
Christoph Hellwig10257742010-06-04 11:30:02 +0200634 if (error)
635 return error;
636
Christoph Hellwig10257742010-06-04 11:30:02 +0200637 setattr_copy(inode, attr);
638 mark_inode_dirty(inode);
639 return 0;
Linus Torvalds6d76fa52006-07-15 12:26:45 -0700640}
641
Vasiliy Kulikov04996802012-01-10 15:11:31 -0800642/*
643 * May current process learn task's sched/cmdline info (for hide_pid_min=1)
644 * or euid/egid (for hide_pid_min=2)?
645 */
646static bool has_pid_permissions(struct pid_namespace *pid,
647 struct task_struct *task,
648 int hide_pid_min)
649{
650 if (pid->hide_pid < hide_pid_min)
651 return true;
652 if (in_group_p(pid->pid_gid))
653 return true;
Jann Horncaaee622016-01-20 15:00:04 -0800654 return ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS);
Vasiliy Kulikov04996802012-01-10 15:11:31 -0800655}
656
657
658static int proc_pid_permission(struct inode *inode, int mask)
659{
Christoph Hellwig76f668b2018-05-16 07:19:01 +0200660 struct pid_namespace *pid = proc_pid_ns(inode);
Vasiliy Kulikov04996802012-01-10 15:11:31 -0800661 struct task_struct *task;
662 bool has_perms;
663
664 task = get_proc_task(inode);
Xiaotian Fenga2ef9902012-01-12 17:17:08 -0800665 if (!task)
666 return -ESRCH;
Lafcadio Wluiki796f5712017-02-24 15:00:23 -0800667 has_perms = has_pid_permissions(pid, task, HIDEPID_NO_ACCESS);
Vasiliy Kulikov04996802012-01-10 15:11:31 -0800668 put_task_struct(task);
669
670 if (!has_perms) {
Lafcadio Wluiki796f5712017-02-24 15:00:23 -0800671 if (pid->hide_pid == HIDEPID_INVISIBLE) {
Vasiliy Kulikov04996802012-01-10 15:11:31 -0800672 /*
673 * Let's make getdents(), stat(), and open()
674 * consistent with each other. If a process
675 * may not stat() a file, it shouldn't be seen
676 * in procfs at all.
677 */
678 return -ENOENT;
679 }
680
681 return -EPERM;
682 }
683 return generic_permission(inode, mask);
684}
685
686
687
Arjan van de Venc5ef1c42007-02-12 00:55:40 -0800688static const struct inode_operations proc_def_inode_operations = {
Linus Torvalds6d76fa52006-07-15 12:26:45 -0700689 .setattr = proc_setattr,
690};
691
Eric W. Biedermanbe614082008-02-08 04:18:30 -0800692static int proc_single_show(struct seq_file *m, void *v)
693{
694 struct inode *inode = m->private;
Christoph Hellwig76f668b2018-05-16 07:19:01 +0200695 struct pid_namespace *ns = proc_pid_ns(inode);
696 struct pid *pid = proc_pid(inode);
Eric W. Biedermanbe614082008-02-08 04:18:30 -0800697 struct task_struct *task;
698 int ret;
699
Eric W. Biedermanbe614082008-02-08 04:18:30 -0800700 task = get_pid_task(pid, PIDTYPE_PID);
701 if (!task)
702 return -ESRCH;
703
704 ret = PROC_I(inode)->op.proc_show(m, ns, pid, task);
705
706 put_task_struct(task);
707 return ret;
708}
709
710static int proc_single_open(struct inode *inode, struct file *filp)
711{
Jovi Zhangc6a34052011-01-12 17:00:34 -0800712 return single_open(filp, proc_single_show, inode);
Eric W. Biedermanbe614082008-02-08 04:18:30 -0800713}
714
715static const struct file_operations proc_single_file_operations = {
716 .open = proc_single_open,
717 .read = seq_read,
718 .llseek = seq_lseek,
719 .release = single_release,
720};
721
Oleg Nesterov5381e162014-10-09 15:25:24 -0700722
723struct mm_struct *proc_mem_open(struct inode *inode, unsigned int mode)
724{
725 struct task_struct *task = get_proc_task(inode);
726 struct mm_struct *mm = ERR_PTR(-ESRCH);
727
728 if (task) {
Jann Horncaaee622016-01-20 15:00:04 -0800729 mm = mm_access(task, mode | PTRACE_MODE_FSCREDS);
Oleg Nesterov5381e162014-10-09 15:25:24 -0700730 put_task_struct(task);
731
732 if (!IS_ERR_OR_NULL(mm)) {
733 /* ensure this mm_struct can't be freed */
Vegard Nossumf1f10072017-02-27 14:30:07 -0800734 mmgrab(mm);
Oleg Nesterov5381e162014-10-09 15:25:24 -0700735 /* but do not pin its memory */
736 mmput(mm);
737 }
738 }
739
740 return mm;
741}
742
Cong Wangb409e572012-05-31 16:26:17 -0700743static int __mem_open(struct inode *inode, struct file *file, unsigned int mode)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700744{
Oleg Nesterov5381e162014-10-09 15:25:24 -0700745 struct mm_struct *mm = proc_mem_open(inode, mode);
Linus Torvaldse2683372012-01-17 15:21:19 -0800746
747 if (IS_ERR(mm))
748 return PTR_ERR(mm);
749
Linus Torvaldse2683372012-01-17 15:21:19 -0800750 file->private_data = mm;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700751 return 0;
752}
753
Cong Wangb409e572012-05-31 16:26:17 -0700754static int mem_open(struct inode *inode, struct file *file)
755{
Djalal Harounibc452b42012-07-30 14:42:28 -0700756 int ret = __mem_open(inode, file, PTRACE_MODE_ATTACH);
757
758 /* OK to pass negative loff_t, we can catch out-of-range */
759 file->f_mode |= FMODE_UNSIGNED_OFFSET;
760
761 return ret;
Cong Wangb409e572012-05-31 16:26:17 -0700762}
763
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100764static ssize_t mem_rw(struct file *file, char __user *buf,
765 size_t count, loff_t *ppos, int write)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700766{
Linus Torvaldse2683372012-01-17 15:21:19 -0800767 struct mm_struct *mm = file->private_data;
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100768 unsigned long addr = *ppos;
769 ssize_t copied;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700770 char *page;
Linus Torvalds272ddc82016-10-24 19:00:44 -0700771 unsigned int flags;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700772
Linus Torvaldse2683372012-01-17 15:21:19 -0800773 if (!mm)
774 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700775
Michal Hocko0ee931c2017-09-13 16:28:29 -0700776 page = (char *)__get_free_page(GFP_KERNEL);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700777 if (!page)
Linus Torvaldse2683372012-01-17 15:21:19 -0800778 return -ENOMEM;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700779
Frederik Deweerdtf7ca54f2006-09-29 02:01:02 -0700780 copied = 0;
Vegard Nossum388f7932017-02-27 14:30:13 -0800781 if (!mmget_not_zero(mm))
Oleg Nesterov6d08f2c2012-01-31 17:15:11 +0100782 goto free;
783
Linus Torvaldsf511c0b2017-05-30 12:38:59 -0700784 flags = FOLL_FORCE | (write ? FOLL_WRITE : 0);
Lorenzo Stoakes6347e8d2016-10-13 01:20:19 +0100785
Linus Torvalds1da177e2005-04-16 15:20:36 -0700786 while (count > 0) {
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100787 int this_len = min_t(int, count, PAGE_SIZE);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700788
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100789 if (write && copy_from_user(page, buf, this_len)) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700790 copied = -EFAULT;
791 break;
792 }
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100793
Lorenzo Stoakes6347e8d2016-10-13 01:20:19 +0100794 this_len = access_remote_vm(mm, addr, page, this_len, flags);
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100795 if (!this_len) {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700796 if (!copied)
797 copied = -EIO;
798 break;
799 }
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100800
801 if (!write && copy_to_user(buf, page, this_len)) {
802 copied = -EFAULT;
803 break;
804 }
805
806 buf += this_len;
807 addr += this_len;
808 copied += this_len;
809 count -= this_len;
Linus Torvalds1da177e2005-04-16 15:20:36 -0700810 }
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100811 *ppos = addr;
KOSAKI Motohiro30cd8902011-05-26 16:25:52 -0700812
Oleg Nesterov6d08f2c2012-01-31 17:15:11 +0100813 mmput(mm);
814free:
KOSAKI Motohiro30cd8902011-05-26 16:25:52 -0700815 free_page((unsigned long) page);
Linus Torvalds1da177e2005-04-16 15:20:36 -0700816 return copied;
817}
Linus Torvalds1da177e2005-04-16 15:20:36 -0700818
Oleg Nesterov572d34b2012-01-31 17:14:54 +0100819static ssize_t mem_read(struct file *file, char __user *buf,
820 size_t count, loff_t *ppos)
821{
822 return mem_rw(file, buf, count, ppos, 0);
823}
824
825static ssize_t mem_write(struct file *file, const char __user *buf,
826 size_t count, loff_t *ppos)
827{
828 return mem_rw(file, (char __user*)buf, count, ppos, 1);
829}
830
Matt Mackall85863e42008-02-04 22:29:04 -0800831loff_t mem_lseek(struct file *file, loff_t offset, int orig)
Linus Torvalds1da177e2005-04-16 15:20:36 -0700832{
833 switch (orig) {
834 case 0:
835 file->f_pos = offset;
836 break;
837 case 1:
838 file->f_pos += offset;
839 break;
840 default:
841 return -EINVAL;
842 }
843 force_successful_syscall_return();
844 return file->f_pos;
845}
846
Linus Torvaldse2683372012-01-17 15:21:19 -0800847static int mem_release(struct inode *inode, struct file *file)
848{
849 struct mm_struct *mm = file->private_data;
Oleg Nesterov71879d32012-01-31 17:14:38 +0100850 if (mm)
Oleg Nesterov6d08f2c2012-01-31 17:15:11 +0100851 mmdrop(mm);
Linus Torvaldse2683372012-01-17 15:21:19 -0800852 return 0;
853}
854
Arjan van de Ven00977a52007-02-12 00:55:34 -0800855static const struct file_operations proc_mem_operations = {
Linus Torvalds1da177e2005-04-16 15:20:36 -0700856 .llseek = mem_lseek,
857 .read = mem_read,
858 .write = mem_write,
859 .open = mem_open,
Linus Torvaldse2683372012-01-17 15:21:19 -0800860 .release = mem_release,
Linus Torvalds1da177e2005-04-16 15:20:36 -0700861};
862
Cong Wangb409e572012-05-31 16:26:17 -0700863static int environ_open(struct inode *inode, struct file *file)
864{
865 return __mem_open(inode, file, PTRACE_MODE_READ);
866}
867
James Pearson315e28c2007-10-16 23:30:17 -0700868static ssize_t environ_read(struct file *file, char __user *buf,
869 size_t count, loff_t *ppos)
870{
James Pearson315e28c2007-10-16 23:30:17 -0700871 char *page;
872 unsigned long src = *ppos;
Cong Wangb409e572012-05-31 16:26:17 -0700873 int ret = 0;
874 struct mm_struct *mm = file->private_data;
Mateusz Guzika3b609e2016-01-20 15:01:05 -0800875 unsigned long env_start, env_end;
James Pearson315e28c2007-10-16 23:30:17 -0700876
Mathias Krause8148a732016-05-05 16:22:26 -0700877 /* Ensure the process spawned far enough to have an environment. */
878 if (!mm || !mm->env_end)
Cong Wangb409e572012-05-31 16:26:17 -0700879 return 0;
James Pearson315e28c2007-10-16 23:30:17 -0700880
Michal Hocko0ee931c2017-09-13 16:28:29 -0700881 page = (char *)__get_free_page(GFP_KERNEL);
James Pearson315e28c2007-10-16 23:30:17 -0700882 if (!page)
Cong Wangb409e572012-05-31 16:26:17 -0700883 return -ENOMEM;
James Pearson315e28c2007-10-16 23:30:17 -0700884
Al Virod6f64b82011-02-15 22:26:01 -0500885 ret = 0;
Vegard Nossum388f7932017-02-27 14:30:13 -0800886 if (!mmget_not_zero(mm))
Cong Wangb409e572012-05-31 16:26:17 -0700887 goto free;
Mateusz Guzika3b609e2016-01-20 15:01:05 -0800888
Yang Shi88aa7cc2018-06-07 17:05:28 -0700889 spin_lock(&mm->arg_lock);
Mateusz Guzika3b609e2016-01-20 15:01:05 -0800890 env_start = mm->env_start;
891 env_end = mm->env_end;
Yang Shi88aa7cc2018-06-07 17:05:28 -0700892 spin_unlock(&mm->arg_lock);
Mateusz Guzika3b609e2016-01-20 15:01:05 -0800893
James Pearson315e28c2007-10-16 23:30:17 -0700894 while (count > 0) {
Djalal Harounie8905ec2012-07-30 14:42:26 -0700895 size_t this_len, max_len;
896 int retval;
897
Mateusz Guzika3b609e2016-01-20 15:01:05 -0800898 if (src >= (env_end - env_start))
Djalal Harounie8905ec2012-07-30 14:42:26 -0700899 break;
James Pearson315e28c2007-10-16 23:30:17 -0700900
Mateusz Guzika3b609e2016-01-20 15:01:05 -0800901 this_len = env_end - (env_start + src);
James Pearson315e28c2007-10-16 23:30:17 -0700902
Djalal Harounie8905ec2012-07-30 14:42:26 -0700903 max_len = min_t(size_t, PAGE_SIZE, count);
904 this_len = min(max_len, this_len);
James Pearson315e28c2007-10-16 23:30:17 -0700905
Willy Tarreau7f7ccc22018-05-11 08:11:44 +0200906 retval = access_remote_vm(mm, (env_start + src), page, this_len, FOLL_ANON);
James Pearson315e28c2007-10-16 23:30:17 -0700907
908 if (retval <= 0) {
909 ret = retval;
910 break;
911 }
912
913 if (copy_to_user(buf, page, retval)) {
914 ret = -EFAULT;
915 break;
916 }
917
918 ret += retval;
919 src += retval;
920 buf += retval;
921 count -= retval;
922 }
923 *ppos = src;
James Pearson315e28c2007-10-16 23:30:17 -0700924 mmput(mm);
Cong Wangb409e572012-05-31 16:26:17 -0700925
926free:
James Pearson315e28c2007-10-16 23:30:17 -0700927 free_page((unsigned long) page);
James Pearson315e28c2007-10-16 23:30:17 -0700928 return ret;
929}
930
931static const struct file_operations proc_environ_operations = {
Cong Wangb409e572012-05-31 16:26:17 -0700932 .open = environ_open,
James Pearson315e28c2007-10-16 23:30:17 -0700933 .read = environ_read,
Arnd Bergmann87df8422010-03-17 23:06:02 +0100934 .llseek = generic_file_llseek,
Cong Wangb409e572012-05-31 16:26:17 -0700935 .release = mem_release,
James Pearson315e28c2007-10-16 23:30:17 -0700936};
937
Al Viroc5317162016-10-05 18:43:43 -0400938static int auxv_open(struct inode *inode, struct file *file)
939{
940 return __mem_open(inode, file, PTRACE_MODE_READ_FSCREDS);
941}
942
943static ssize_t auxv_read(struct file *file, char __user *buf,
944 size_t count, loff_t *ppos)
945{
946 struct mm_struct *mm = file->private_data;
947 unsigned int nwords = 0;
Leon Yu06b28492016-10-27 17:46:50 -0700948
949 if (!mm)
950 return 0;
Al Viroc5317162016-10-05 18:43:43 -0400951 do {
952 nwords += 2;
953 } while (mm->saved_auxv[nwords - 2] != 0); /* AT_NULL */
954 return simple_read_from_buffer(buf, count, ppos, mm->saved_auxv,
955 nwords * sizeof(mm->saved_auxv[0]));
956}
957
958static const struct file_operations proc_auxv_operations = {
959 .open = auxv_open,
960 .read = auxv_read,
961 .llseek = generic_file_llseek,
962 .release = mem_release,
963};
964
David Rientjesfa0cbbf2012-11-12 17:53:04 -0800965static ssize_t oom_adj_read(struct file *file, char __user *buf, size_t count,
966 loff_t *ppos)
967{
Al Viro496ad9a2013-01-23 17:07:38 -0500968 struct task_struct *task = get_proc_task(file_inode(file));
David Rientjesfa0cbbf2012-11-12 17:53:04 -0800969 char buffer[PROC_NUMBUF];
970 int oom_adj = OOM_ADJUST_MIN;
971 size_t len;
David Rientjesfa0cbbf2012-11-12 17:53:04 -0800972
973 if (!task)
974 return -ESRCH;
Michal Hockof913da52016-07-28 15:44:37 -0700975 if (task->signal->oom_score_adj == OOM_SCORE_ADJ_MAX)
976 oom_adj = OOM_ADJUST_MAX;
977 else
978 oom_adj = (task->signal->oom_score_adj * -OOM_DISABLE) /
979 OOM_SCORE_ADJ_MAX;
David Rientjesfa0cbbf2012-11-12 17:53:04 -0800980 put_task_struct(task);
981 len = snprintf(buffer, sizeof(buffer), "%d\n", oom_adj);
982 return simple_read_from_buffer(buf, count, ppos, buffer, len);
983}
984
Michal Hocko1d5f0ac2016-07-28 15:44:40 -0700985static int __set_oom_adj(struct file *file, int oom_adj, bool legacy)
986{
987 static DEFINE_MUTEX(oom_adj_mutex);
Michal Hocko44a70ade2016-07-28 15:44:43 -0700988 struct mm_struct *mm = NULL;
Michal Hocko1d5f0ac2016-07-28 15:44:40 -0700989 struct task_struct *task;
990 int err = 0;
991
992 task = get_proc_task(file_inode(file));
993 if (!task)
994 return -ESRCH;
995
996 mutex_lock(&oom_adj_mutex);
997 if (legacy) {
998 if (oom_adj < task->signal->oom_score_adj &&
999 !capable(CAP_SYS_RESOURCE)) {
1000 err = -EACCES;
1001 goto err_unlock;
1002 }
1003 /*
1004 * /proc/pid/oom_adj is provided for legacy purposes, ask users to use
1005 * /proc/pid/oom_score_adj instead.
1006 */
1007 pr_warn_once("%s (%d): /proc/%d/oom_adj is deprecated, please use /proc/%d/oom_score_adj instead.\n",
1008 current->comm, task_pid_nr(current), task_pid_nr(task),
1009 task_pid_nr(task));
1010 } else {
1011 if ((short)oom_adj < task->signal->oom_score_adj_min &&
1012 !capable(CAP_SYS_RESOURCE)) {
1013 err = -EACCES;
1014 goto err_unlock;
1015 }
1016 }
1017
Michal Hocko44a70ade2016-07-28 15:44:43 -07001018 /*
1019 * Make sure we will check other processes sharing the mm if this is
1020 * not vfrok which wants its own oom_score_adj.
1021 * pin the mm so it doesn't go away and get reused after task_unlock
1022 */
1023 if (!task->vfork_done) {
1024 struct task_struct *p = find_lock_task_mm(task);
1025
1026 if (p) {
1027 if (atomic_read(&p->mm->mm_users) > 1) {
1028 mm = p->mm;
Vegard Nossumf1f10072017-02-27 14:30:07 -08001029 mmgrab(mm);
Michal Hocko44a70ade2016-07-28 15:44:43 -07001030 }
1031 task_unlock(p);
1032 }
1033 }
1034
Michal Hocko1d5f0ac2016-07-28 15:44:40 -07001035 task->signal->oom_score_adj = oom_adj;
1036 if (!legacy && has_capability_noaudit(current, CAP_SYS_RESOURCE))
1037 task->signal->oom_score_adj_min = (short)oom_adj;
1038 trace_oom_score_adj_update(task);
Michal Hocko44a70ade2016-07-28 15:44:43 -07001039
1040 if (mm) {
1041 struct task_struct *p;
1042
1043 rcu_read_lock();
1044 for_each_process(p) {
1045 if (same_thread_group(task, p))
1046 continue;
1047
1048 /* do not touch kernel threads or the global init */
1049 if (p->flags & PF_KTHREAD || is_global_init(p))
1050 continue;
1051
1052 task_lock(p);
1053 if (!p->vfork_done && process_shares_mm(p, mm)) {
1054 pr_info("updating oom_score_adj for %d (%s) from %d to %d because it shares mm with %d (%s). Report if this is unexpected.\n",
1055 task_pid_nr(p), p->comm,
1056 p->signal->oom_score_adj, oom_adj,
1057 task_pid_nr(task), task->comm);
1058 p->signal->oom_score_adj = oom_adj;
1059 if (!legacy && has_capability_noaudit(current, CAP_SYS_RESOURCE))
1060 p->signal->oom_score_adj_min = (short)oom_adj;
1061 }
1062 task_unlock(p);
1063 }
1064 rcu_read_unlock();
1065 mmdrop(mm);
1066 }
Michal Hocko1d5f0ac2016-07-28 15:44:40 -07001067err_unlock:
1068 mutex_unlock(&oom_adj_mutex);
1069 put_task_struct(task);
1070 return err;
1071}
Michal Hockof913da52016-07-28 15:44:37 -07001072
David Rientjesb72bdfa2015-11-05 18:50:32 -08001073/*
1074 * /proc/pid/oom_adj exists solely for backwards compatibility with previous
1075 * kernels. The effective policy is defined by oom_score_adj, which has a
1076 * different scale: oom_adj grew exponentially and oom_score_adj grows linearly.
1077 * Values written to oom_adj are simply mapped linearly to oom_score_adj.
1078 * Processes that become oom disabled via oom_adj will still be oom disabled
1079 * with this implementation.
1080 *
1081 * oom_adj cannot be removed since existing userspace binaries use it.
1082 */
David Rientjesfa0cbbf2012-11-12 17:53:04 -08001083static ssize_t oom_adj_write(struct file *file, const char __user *buf,
1084 size_t count, loff_t *ppos)
1085{
David Rientjesfa0cbbf2012-11-12 17:53:04 -08001086 char buffer[PROC_NUMBUF];
1087 int oom_adj;
David Rientjesfa0cbbf2012-11-12 17:53:04 -08001088 int err;
1089
1090 memset(buffer, 0, sizeof(buffer));
1091 if (count > sizeof(buffer) - 1)
1092 count = sizeof(buffer) - 1;
1093 if (copy_from_user(buffer, buf, count)) {
1094 err = -EFAULT;
1095 goto out;
1096 }
1097
1098 err = kstrtoint(strstrip(buffer), 0, &oom_adj);
1099 if (err)
1100 goto out;
1101 if ((oom_adj < OOM_ADJUST_MIN || oom_adj > OOM_ADJUST_MAX) &&
1102 oom_adj != OOM_DISABLE) {
1103 err = -EINVAL;
1104 goto out;
1105 }
1106
David Rientjesfa0cbbf2012-11-12 17:53:04 -08001107 /*
1108 * Scale /proc/pid/oom_score_adj appropriately ensuring that a maximum
1109 * value is always attainable.
1110 */
1111 if (oom_adj == OOM_ADJUST_MAX)
1112 oom_adj = OOM_SCORE_ADJ_MAX;
1113 else
1114 oom_adj = (oom_adj * OOM_SCORE_ADJ_MAX) / -OOM_DISABLE;
1115
Michal Hocko1d5f0ac2016-07-28 15:44:40 -07001116 err = __set_oom_adj(file, oom_adj, true);
David Rientjesfa0cbbf2012-11-12 17:53:04 -08001117out:
1118 return err < 0 ? err : count;
1119}
1120
1121static const struct file_operations proc_oom_adj_operations = {
1122 .read = oom_adj_read,
1123 .write = oom_adj_write,
1124 .llseek = generic_file_llseek,
1125};
1126
David Rientjesa63d83f2010-08-09 17:19:46 -07001127static ssize_t oom_score_adj_read(struct file *file, char __user *buf,
1128 size_t count, loff_t *ppos)
1129{
Al Viro496ad9a2013-01-23 17:07:38 -05001130 struct task_struct *task = get_proc_task(file_inode(file));
David Rientjesa63d83f2010-08-09 17:19:46 -07001131 char buffer[PROC_NUMBUF];
David Rientjesa9c58b902012-12-11 16:02:54 -08001132 short oom_score_adj = OOM_SCORE_ADJ_MIN;
David Rientjesa63d83f2010-08-09 17:19:46 -07001133 size_t len;
1134
1135 if (!task)
1136 return -ESRCH;
Michal Hockof913da52016-07-28 15:44:37 -07001137 oom_score_adj = task->signal->oom_score_adj;
David Rientjesa63d83f2010-08-09 17:19:46 -07001138 put_task_struct(task);
David Rientjesa9c58b902012-12-11 16:02:54 -08001139 len = snprintf(buffer, sizeof(buffer), "%hd\n", oom_score_adj);
David Rientjesa63d83f2010-08-09 17:19:46 -07001140 return simple_read_from_buffer(buf, count, ppos, buffer, len);
1141}
1142
1143static ssize_t oom_score_adj_write(struct file *file, const char __user *buf,
1144 size_t count, loff_t *ppos)
1145{
David Rientjesa63d83f2010-08-09 17:19:46 -07001146 char buffer[PROC_NUMBUF];
Alexey Dobriyan0a8cb8e2011-05-26 16:25:50 -07001147 int oom_score_adj;
David Rientjesa63d83f2010-08-09 17:19:46 -07001148 int err;
1149
1150 memset(buffer, 0, sizeof(buffer));
1151 if (count > sizeof(buffer) - 1)
1152 count = sizeof(buffer) - 1;
David Rientjes723548b2010-10-26 14:21:25 -07001153 if (copy_from_user(buffer, buf, count)) {
1154 err = -EFAULT;
1155 goto out;
1156 }
David Rientjesa63d83f2010-08-09 17:19:46 -07001157
Alexey Dobriyan0a8cb8e2011-05-26 16:25:50 -07001158 err = kstrtoint(strstrip(buffer), 0, &oom_score_adj);
David Rientjesa63d83f2010-08-09 17:19:46 -07001159 if (err)
David Rientjes723548b2010-10-26 14:21:25 -07001160 goto out;
David Rientjesa63d83f2010-08-09 17:19:46 -07001161 if (oom_score_adj < OOM_SCORE_ADJ_MIN ||
David Rientjes723548b2010-10-26 14:21:25 -07001162 oom_score_adj > OOM_SCORE_ADJ_MAX) {
1163 err = -EINVAL;
1164 goto out;
1165 }
David Rientjesa63d83f2010-08-09 17:19:46 -07001166
Michal Hocko1d5f0ac2016-07-28 15:44:40 -07001167 err = __set_oom_adj(file, oom_score_adj, false);
David Rientjes723548b2010-10-26 14:21:25 -07001168out:
1169 return err < 0 ? err : count;
David Rientjesa63d83f2010-08-09 17:19:46 -07001170}
1171
1172static const struct file_operations proc_oom_score_adj_operations = {
1173 .read = oom_score_adj_read,
1174 .write = oom_score_adj_write,
Arnd Bergmann6038f372010-08-15 18:52:59 +02001175 .llseek = default_llseek,
David Rientjesa63d83f2010-08-09 17:19:46 -07001176};
1177
Linus Torvalds1da177e2005-04-16 15:20:36 -07001178#ifdef CONFIG_AUDITSYSCALL
Alexey Dobriyanb4eb4f72016-10-29 19:04:39 +03001179#define TMPBUFLEN 11
Linus Torvalds1da177e2005-04-16 15:20:36 -07001180static ssize_t proc_loginuid_read(struct file * file, char __user * buf,
1181 size_t count, loff_t *ppos)
1182{
Al Viro496ad9a2013-01-23 17:07:38 -05001183 struct inode * inode = file_inode(file);
Eric W. Biederman99f89552006-06-26 00:25:55 -07001184 struct task_struct *task = get_proc_task(inode);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001185 ssize_t length;
1186 char tmpbuf[TMPBUFLEN];
1187
Eric W. Biederman99f89552006-06-26 00:25:55 -07001188 if (!task)
1189 return -ESRCH;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001190 length = scnprintf(tmpbuf, TMPBUFLEN, "%u",
Eric W. Biedermane1760bd2012-09-10 22:39:43 -07001191 from_kuid(file->f_cred->user_ns,
1192 audit_get_loginuid(task)));
Eric W. Biederman99f89552006-06-26 00:25:55 -07001193 put_task_struct(task);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001194 return simple_read_from_buffer(buf, count, ppos, tmpbuf, length);
1195}
1196
1197static ssize_t proc_loginuid_write(struct file * file, const char __user * buf,
1198 size_t count, loff_t *ppos)
1199{
Al Viro496ad9a2013-01-23 17:07:38 -05001200 struct inode * inode = file_inode(file);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001201 uid_t loginuid;
Eric W. Biedermane1760bd2012-09-10 22:39:43 -07001202 kuid_t kloginuid;
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001203 int rv;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001204
Paul E. McKenney7dc52152010-02-22 17:04:52 -08001205 rcu_read_lock();
1206 if (current != pid_task(proc_pid(inode), PIDTYPE_PID)) {
1207 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001208 return -EPERM;
Paul E. McKenney7dc52152010-02-22 17:04:52 -08001209 }
1210 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07001211
Linus Torvalds1da177e2005-04-16 15:20:36 -07001212 if (*ppos != 0) {
1213 /* No partial writes. */
1214 return -EINVAL;
1215 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07001216
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001217 rv = kstrtou32_from_user(buf, count, 10, &loginuid);
1218 if (rv < 0)
1219 return rv;
Eric Paris81407c82013-05-24 09:49:14 -04001220
1221 /* is userspace tring to explicitly UNSET the loginuid? */
1222 if (loginuid == AUDIT_UID_UNSET) {
1223 kloginuid = INVALID_UID;
1224 } else {
1225 kloginuid = make_kuid(file->f_cred->user_ns, loginuid);
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001226 if (!uid_valid(kloginuid))
1227 return -EINVAL;
Eric W. Biedermane1760bd2012-09-10 22:39:43 -07001228 }
1229
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001230 rv = audit_set_loginuid(kloginuid);
1231 if (rv < 0)
1232 return rv;
1233 return count;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001234}
1235
Arjan van de Ven00977a52007-02-12 00:55:34 -08001236static const struct file_operations proc_loginuid_operations = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001237 .read = proc_loginuid_read,
1238 .write = proc_loginuid_write,
Arnd Bergmann87df8422010-03-17 23:06:02 +01001239 .llseek = generic_file_llseek,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001240};
Eric Paris1e0bd752008-03-13 08:15:31 -04001241
1242static ssize_t proc_sessionid_read(struct file * file, char __user * buf,
1243 size_t count, loff_t *ppos)
1244{
Al Viro496ad9a2013-01-23 17:07:38 -05001245 struct inode * inode = file_inode(file);
Eric Paris1e0bd752008-03-13 08:15:31 -04001246 struct task_struct *task = get_proc_task(inode);
1247 ssize_t length;
1248 char tmpbuf[TMPBUFLEN];
1249
1250 if (!task)
1251 return -ESRCH;
1252 length = scnprintf(tmpbuf, TMPBUFLEN, "%u",
1253 audit_get_sessionid(task));
1254 put_task_struct(task);
1255 return simple_read_from_buffer(buf, count, ppos, tmpbuf, length);
1256}
1257
1258static const struct file_operations proc_sessionid_operations = {
1259 .read = proc_sessionid_read,
Arnd Bergmann87df8422010-03-17 23:06:02 +01001260 .llseek = generic_file_llseek,
Eric Paris1e0bd752008-03-13 08:15:31 -04001261};
Linus Torvalds1da177e2005-04-16 15:20:36 -07001262#endif
1263
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001264#ifdef CONFIG_FAULT_INJECTION
1265static ssize_t proc_fault_inject_read(struct file * file, char __user * buf,
1266 size_t count, loff_t *ppos)
1267{
Al Viro496ad9a2013-01-23 17:07:38 -05001268 struct task_struct *task = get_proc_task(file_inode(file));
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001269 char buffer[PROC_NUMBUF];
1270 size_t len;
1271 int make_it_fail;
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001272
1273 if (!task)
1274 return -ESRCH;
1275 make_it_fail = task->make_it_fail;
1276 put_task_struct(task);
1277
1278 len = snprintf(buffer, sizeof(buffer), "%i\n", make_it_fail);
Akinobu Mita0c28f282007-05-08 00:31:41 -07001279
1280 return simple_read_from_buffer(buf, count, ppos, buffer, len);
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001281}
1282
1283static ssize_t proc_fault_inject_write(struct file * file,
1284 const char __user * buf, size_t count, loff_t *ppos)
1285{
1286 struct task_struct *task;
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001287 char buffer[PROC_NUMBUF];
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001288 int make_it_fail;
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001289 int rv;
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001290
1291 if (!capable(CAP_SYS_RESOURCE))
1292 return -EPERM;
1293 memset(buffer, 0, sizeof(buffer));
1294 if (count > sizeof(buffer) - 1)
1295 count = sizeof(buffer) - 1;
1296 if (copy_from_user(buffer, buf, count))
1297 return -EFAULT;
Alexey Dobriyan774636e2015-09-09 15:36:59 -07001298 rv = kstrtoint(strstrip(buffer), 0, &make_it_fail);
1299 if (rv < 0)
1300 return rv;
Dave Jones16caed32014-04-07 15:39:15 -07001301 if (make_it_fail < 0 || make_it_fail > 1)
1302 return -EINVAL;
1303
Al Viro496ad9a2013-01-23 17:07:38 -05001304 task = get_proc_task(file_inode(file));
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001305 if (!task)
1306 return -ESRCH;
1307 task->make_it_fail = make_it_fail;
1308 put_task_struct(task);
Vincent Licba8aaf2009-09-22 16:45:38 -07001309
1310 return count;
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001311}
1312
Arjan van de Ven00977a52007-02-12 00:55:34 -08001313static const struct file_operations proc_fault_inject_operations = {
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001314 .read = proc_fault_inject_read,
1315 .write = proc_fault_inject_write,
Arnd Bergmann87df8422010-03-17 23:06:02 +01001316 .llseek = generic_file_llseek,
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001317};
Dmitry Vyukove41d58182017-07-12 14:34:35 -07001318
1319static ssize_t proc_fail_nth_write(struct file *file, const char __user *buf,
1320 size_t count, loff_t *ppos)
1321{
1322 struct task_struct *task;
Akinobu Mita9049f2f2017-07-14 14:49:52 -07001323 int err;
1324 unsigned int n;
Dmitry Vyukove41d58182017-07-12 14:34:35 -07001325
Akinobu Mita9049f2f2017-07-14 14:49:52 -07001326 err = kstrtouint_from_user(buf, count, 0, &n);
Dmitry Vyukove41d58182017-07-12 14:34:35 -07001327 if (err)
1328 return err;
Akinobu Mita1203c8e2017-07-14 14:49:57 -07001329
1330 task = get_proc_task(file_inode(file));
1331 if (!task)
1332 return -ESRCH;
Alexey Dobriyan9f7118b2018-02-06 15:36:55 -08001333 task->fail_nth = n;
Akinobu Mita1203c8e2017-07-14 14:49:57 -07001334 put_task_struct(task);
1335
Dmitry Vyukove41d58182017-07-12 14:34:35 -07001336 return count;
1337}
1338
1339static ssize_t proc_fail_nth_read(struct file *file, char __user *buf,
1340 size_t count, loff_t *ppos)
1341{
1342 struct task_struct *task;
Akinobu Mitabfc74092017-07-14 14:49:54 -07001343 char numbuf[PROC_NUMBUF];
1344 ssize_t len;
Dmitry Vyukove41d58182017-07-12 14:34:35 -07001345
1346 task = get_proc_task(file_inode(file));
1347 if (!task)
1348 return -ESRCH;
Alexey Dobriyan9f7118b2018-02-06 15:36:55 -08001349 len = snprintf(numbuf, sizeof(numbuf), "%u\n", task->fail_nth);
Akinobu Mitabfc74092017-07-14 14:49:54 -07001350 len = simple_read_from_buffer(buf, count, ppos, numbuf, len);
Akinobu Mita1203c8e2017-07-14 14:49:57 -07001351 put_task_struct(task);
Akinobu Mitabfc74092017-07-14 14:49:54 -07001352
1353 return len;
Dmitry Vyukove41d58182017-07-12 14:34:35 -07001354}
1355
1356static const struct file_operations proc_fail_nth_operations = {
1357 .read = proc_fail_nth_read,
1358 .write = proc_fail_nth_write,
1359};
Akinobu Mitaf4f154f2006-12-08 02:39:47 -08001360#endif
1361
Arjan van de Ven97455122008-01-25 21:08:34 +01001362
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001363#ifdef CONFIG_SCHED_DEBUG
1364/*
1365 * Print out various scheduling related per-task fields:
1366 */
1367static int sched_show(struct seq_file *m, void *v)
1368{
1369 struct inode *inode = m->private;
Christoph Hellwig76f668b2018-05-16 07:19:01 +02001370 struct pid_namespace *ns = proc_pid_ns(inode);
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001371 struct task_struct *p;
1372
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001373 p = get_proc_task(inode);
1374 if (!p)
1375 return -ESRCH;
Aleksa Sarai74dc3382017-08-06 14:41:41 +10001376 proc_sched_show_task(p, ns, m);
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001377
1378 put_task_struct(p);
1379
1380 return 0;
1381}
1382
1383static ssize_t
1384sched_write(struct file *file, const char __user *buf,
1385 size_t count, loff_t *offset)
1386{
Al Viro496ad9a2013-01-23 17:07:38 -05001387 struct inode *inode = file_inode(file);
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001388 struct task_struct *p;
1389
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001390 p = get_proc_task(inode);
1391 if (!p)
1392 return -ESRCH;
1393 proc_sched_set_task(p);
1394
1395 put_task_struct(p);
1396
1397 return count;
1398}
1399
1400static int sched_open(struct inode *inode, struct file *filp)
1401{
Jovi Zhangc6a34052011-01-12 17:00:34 -08001402 return single_open(filp, sched_show, inode);
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001403}
1404
1405static const struct file_operations proc_pid_sched_operations = {
1406 .open = sched_open,
1407 .read = seq_read,
1408 .write = sched_write,
1409 .llseek = seq_lseek,
Alexey Dobriyan5ea473a2007-07-31 00:38:50 -07001410 .release = single_release,
Ingo Molnar43ae34c2007-07-09 18:52:00 +02001411};
1412
1413#endif
1414
Mike Galbraith5091faa2010-11-30 14:18:03 +01001415#ifdef CONFIG_SCHED_AUTOGROUP
1416/*
1417 * Print out autogroup related information:
1418 */
1419static int sched_autogroup_show(struct seq_file *m, void *v)
1420{
1421 struct inode *inode = m->private;
1422 struct task_struct *p;
1423
1424 p = get_proc_task(inode);
1425 if (!p)
1426 return -ESRCH;
1427 proc_sched_autogroup_show_task(p, m);
1428
1429 put_task_struct(p);
1430
1431 return 0;
1432}
1433
1434static ssize_t
1435sched_autogroup_write(struct file *file, const char __user *buf,
1436 size_t count, loff_t *offset)
1437{
Al Viro496ad9a2013-01-23 17:07:38 -05001438 struct inode *inode = file_inode(file);
Mike Galbraith5091faa2010-11-30 14:18:03 +01001439 struct task_struct *p;
1440 char buffer[PROC_NUMBUF];
Alexey Dobriyan0a8cb8e2011-05-26 16:25:50 -07001441 int nice;
Mike Galbraith5091faa2010-11-30 14:18:03 +01001442 int err;
1443
1444 memset(buffer, 0, sizeof(buffer));
1445 if (count > sizeof(buffer) - 1)
1446 count = sizeof(buffer) - 1;
1447 if (copy_from_user(buffer, buf, count))
1448 return -EFAULT;
1449
Alexey Dobriyan0a8cb8e2011-05-26 16:25:50 -07001450 err = kstrtoint(strstrip(buffer), 0, &nice);
1451 if (err < 0)
1452 return err;
Mike Galbraith5091faa2010-11-30 14:18:03 +01001453
1454 p = get_proc_task(inode);
1455 if (!p)
1456 return -ESRCH;
1457
Hiroshi Shimamoto2e5b5b32012-02-23 17:41:27 +09001458 err = proc_sched_autogroup_set_nice(p, nice);
Mike Galbraith5091faa2010-11-30 14:18:03 +01001459 if (err)
1460 count = err;
1461
1462 put_task_struct(p);
1463
1464 return count;
1465}
1466
1467static int sched_autogroup_open(struct inode *inode, struct file *filp)
1468{
1469 int ret;
1470
1471 ret = single_open(filp, sched_autogroup_show, NULL);
1472 if (!ret) {
1473 struct seq_file *m = filp->private_data;
1474
1475 m->private = inode;
1476 }
1477 return ret;
1478}
1479
1480static const struct file_operations proc_pid_sched_autogroup_operations = {
1481 .open = sched_autogroup_open,
1482 .read = seq_read,
1483 .write = sched_autogroup_write,
1484 .llseek = seq_lseek,
1485 .release = single_release,
1486};
1487
1488#endif /* CONFIG_SCHED_AUTOGROUP */
1489
john stultz4614a696b2009-12-14 18:00:05 -08001490static ssize_t comm_write(struct file *file, const char __user *buf,
1491 size_t count, loff_t *offset)
1492{
Al Viro496ad9a2013-01-23 17:07:38 -05001493 struct inode *inode = file_inode(file);
john stultz4614a696b2009-12-14 18:00:05 -08001494 struct task_struct *p;
1495 char buffer[TASK_COMM_LEN];
David Rientjes830e0fc2013-04-30 15:28:18 -07001496 const size_t maxlen = sizeof(buffer) - 1;
john stultz4614a696b2009-12-14 18:00:05 -08001497
1498 memset(buffer, 0, sizeof(buffer));
David Rientjes830e0fc2013-04-30 15:28:18 -07001499 if (copy_from_user(buffer, buf, count > maxlen ? maxlen : count))
john stultz4614a696b2009-12-14 18:00:05 -08001500 return -EFAULT;
1501
1502 p = get_proc_task(inode);
1503 if (!p)
1504 return -ESRCH;
1505
1506 if (same_thread_group(current, p))
1507 set_task_comm(p, buffer);
1508 else
1509 count = -EINVAL;
1510
1511 put_task_struct(p);
1512
1513 return count;
1514}
1515
1516static int comm_show(struct seq_file *m, void *v)
1517{
1518 struct inode *inode = m->private;
1519 struct task_struct *p;
1520
1521 p = get_proc_task(inode);
1522 if (!p)
1523 return -ESRCH;
1524
Tejun Heo88b72b32018-05-18 08:47:13 -07001525 proc_task_name(m, p, false);
1526 seq_putc(m, '\n');
john stultz4614a696b2009-12-14 18:00:05 -08001527
1528 put_task_struct(p);
1529
1530 return 0;
1531}
1532
1533static int comm_open(struct inode *inode, struct file *filp)
1534{
Jovi Zhangc6a34052011-01-12 17:00:34 -08001535 return single_open(filp, comm_show, inode);
john stultz4614a696b2009-12-14 18:00:05 -08001536}
1537
1538static const struct file_operations proc_pid_set_comm_operations = {
1539 .open = comm_open,
1540 .read = seq_read,
1541 .write = comm_write,
1542 .llseek = seq_lseek,
1543 .release = single_release,
1544};
1545
Cyrill Gorcunov7773fbc2012-01-10 15:11:20 -08001546static int proc_exe_link(struct dentry *dentry, struct path *exe_path)
Matt Helsley925d1c42008-04-29 01:01:36 -07001547{
1548 struct task_struct *task;
Matt Helsley925d1c42008-04-29 01:01:36 -07001549 struct file *exe_file;
1550
David Howells2b0143b2015-03-17 22:25:59 +00001551 task = get_proc_task(d_inode(dentry));
Matt Helsley925d1c42008-04-29 01:01:36 -07001552 if (!task)
1553 return -ENOENT;
Mateusz Guzikcd81a9172016-08-23 16:20:38 +02001554 exe_file = get_task_exe_file(task);
Matt Helsley925d1c42008-04-29 01:01:36 -07001555 put_task_struct(task);
Matt Helsley925d1c42008-04-29 01:01:36 -07001556 if (exe_file) {
1557 *exe_path = exe_file->f_path;
1558 path_get(&exe_file->f_path);
1559 fput(exe_file);
1560 return 0;
1561 } else
1562 return -ENOENT;
1563}
1564
Al Viro6b255392015-11-17 10:20:54 -05001565static const char *proc_pid_get_link(struct dentry *dentry,
Al Virofceef392015-12-29 15:58:39 -05001566 struct inode *inode,
1567 struct delayed_call *done)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001568{
Christoph Hellwig408ef012012-06-18 10:47:03 -04001569 struct path path;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001570 int error = -EACCES;
1571
Al Viro6b255392015-11-17 10:20:54 -05001572 if (!dentry)
1573 return ERR_PTR(-ECHILD);
1574
Eric W. Biederman778c1142006-06-26 00:25:58 -07001575 /* Are we allowed to snoop on the tasks file descriptors? */
1576 if (!proc_fd_access_allowed(inode))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001577 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001578
Christoph Hellwig408ef012012-06-18 10:47:03 -04001579 error = PROC_I(inode)->op.proc_get_link(dentry, &path);
1580 if (error)
1581 goto out;
1582
Al Viro6e77137b2015-05-02 13:37:52 -04001583 nd_jump_link(&path);
Christoph Hellwig408ef012012-06-18 10:47:03 -04001584 return NULL;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001585out:
Al Viro008b1502005-08-20 00:17:39 +01001586 return ERR_PTR(error);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001587}
1588
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001589static int do_proc_readlink(struct path *path, char __user *buffer, int buflen)
Linus Torvalds1da177e2005-04-16 15:20:36 -07001590{
Michal Hocko0ee931c2017-09-13 16:28:29 -07001591 char *tmp = (char *)__get_free_page(GFP_KERNEL);
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001592 char *pathname;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001593 int len;
1594
1595 if (!tmp)
1596 return -ENOMEM;
Akinobu Mita0c28f282007-05-08 00:31:41 -07001597
Eric W. Biederman7b2a69b2010-12-05 15:51:21 -08001598 pathname = d_path(path, tmp, PAGE_SIZE);
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001599 len = PTR_ERR(pathname);
1600 if (IS_ERR(pathname))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001601 goto out;
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001602 len = tmp + PAGE_SIZE - 1 - pathname;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001603
1604 if (len > buflen)
1605 len = buflen;
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001606 if (copy_to_user(buffer, pathname, len))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001607 len = -EFAULT;
1608 out:
1609 free_page((unsigned long)tmp);
1610 return len;
1611}
1612
1613static int proc_pid_readlink(struct dentry * dentry, char __user * buffer, int buflen)
1614{
1615 int error = -EACCES;
David Howells2b0143b2015-03-17 22:25:59 +00001616 struct inode *inode = d_inode(dentry);
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001617 struct path path;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001618
Eric W. Biederman778c1142006-06-26 00:25:58 -07001619 /* Are we allowed to snoop on the tasks file descriptors? */
1620 if (!proc_fd_access_allowed(inode))
Linus Torvalds1da177e2005-04-16 15:20:36 -07001621 goto out;
Linus Torvalds1da177e2005-04-16 15:20:36 -07001622
Cyrill Gorcunov7773fbc2012-01-10 15:11:20 -08001623 error = PROC_I(inode)->op.proc_get_link(dentry, &path);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001624 if (error)
1625 goto out;
1626
Jan Blunck3dcd25f2008-02-14 19:38:35 -08001627 error = do_proc_readlink(&path, buffer, buflen);
1628 path_put(&path);
Linus Torvalds1da177e2005-04-16 15:20:36 -07001629out:
Linus Torvalds1da177e2005-04-16 15:20:36 -07001630 return error;
1631}
1632
Cyrill Gorcunovfaf60af2012-08-23 14:43:24 +04001633const struct inode_operations proc_pid_link_inode_operations = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07001634 .readlink = proc_pid_readlink,
Al Viro6b255392015-11-17 10:20:54 -05001635 .get_link = proc_pid_get_link,
Linus Torvalds6d76fa52006-07-15 12:26:45 -07001636 .setattr = proc_setattr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07001637};
1638
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001639
1640/* building an inode */
1641
Al Viroc6eb50d2017-09-30 14:45:42 -04001642void task_dump_owner(struct task_struct *task, umode_t mode,
Eric W. Biederman68eb94f2017-01-03 10:23:11 +13001643 kuid_t *ruid, kgid_t *rgid)
1644{
1645 /* Depending on the state of dumpable compute who should own a
1646 * proc file for a task.
1647 */
1648 const struct cred *cred;
1649 kuid_t uid;
1650 kgid_t gid;
1651
Alexey Dobriyan2e0ad552018-04-20 14:56:03 -07001652 if (unlikely(task->flags & PF_KTHREAD)) {
1653 *ruid = GLOBAL_ROOT_UID;
1654 *rgid = GLOBAL_ROOT_GID;
1655 return;
1656 }
1657
Eric W. Biederman68eb94f2017-01-03 10:23:11 +13001658 /* Default to the tasks effective ownership */
1659 rcu_read_lock();
1660 cred = __task_cred(task);
1661 uid = cred->euid;
1662 gid = cred->egid;
1663 rcu_read_unlock();
1664
1665 /*
1666 * Before the /proc/pid/status file was created the only way to read
1667 * the effective uid of a /process was to stat /proc/pid. Reading
1668 * /proc/pid/status is slow enough that procps and other packages
1669 * kept stating /proc/pid. To keep the rules in /proc simple I have
1670 * made this apply to all per process world readable and executable
1671 * directories.
1672 */
1673 if (mode != (S_IFDIR|S_IRUGO|S_IXUGO)) {
1674 struct mm_struct *mm;
1675 task_lock(task);
1676 mm = task->mm;
1677 /* Make non-dumpable tasks owned by some root */
1678 if (mm) {
1679 if (get_dumpable(mm) != SUID_DUMP_USER) {
1680 struct user_namespace *user_ns = mm->user_ns;
1681
1682 uid = make_kuid(user_ns, 0);
1683 if (!uid_valid(uid))
1684 uid = GLOBAL_ROOT_UID;
1685
1686 gid = make_kgid(user_ns, 0);
1687 if (!gid_valid(gid))
1688 gid = GLOBAL_ROOT_GID;
1689 }
1690 } else {
1691 uid = GLOBAL_ROOT_UID;
1692 gid = GLOBAL_ROOT_GID;
1693 }
1694 task_unlock(task);
1695 }
1696 *ruid = uid;
1697 *rgid = gid;
1698}
1699
Andreas Gruenbacherdb978da2016-11-10 22:18:28 +01001700struct inode *proc_pid_make_inode(struct super_block * sb,
1701 struct task_struct *task, umode_t mode)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001702{
1703 struct inode * inode;
1704 struct proc_inode *ei;
1705
1706 /* We need a new inode */
1707
1708 inode = new_inode(sb);
1709 if (!inode)
1710 goto out;
1711
1712 /* Common stuff */
1713 ei = PROC_I(inode);
Andreas Gruenbacherdb978da2016-11-10 22:18:28 +01001714 inode->i_mode = mode;
Christoph Hellwig85fe4022010-10-23 11:19:54 -04001715 inode->i_ino = get_next_ino();
Deepa Dinamani078cd822016-09-14 07:48:04 -07001716 inode->i_mtime = inode->i_atime = inode->i_ctime = current_time(inode);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001717 inode->i_op = &proc_def_inode_operations;
1718
1719 /*
1720 * grab the reference to task.
1721 */
Oleg Nesterov1a657f782006-10-02 02:18:59 -07001722 ei->pid = get_task_pid(task, PIDTYPE_PID);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001723 if (!ei->pid)
1724 goto out_unlock;
1725
Eric W. Biederman68eb94f2017-01-03 10:23:11 +13001726 task_dump_owner(task, 0, &inode->i_uid, &inode->i_gid);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001727 security_task_to_inode(task, inode);
1728
1729out:
1730 return inode;
1731
1732out_unlock:
1733 iput(inode);
1734 return NULL;
1735}
1736
David Howellsa528d352017-01-31 16:46:22 +00001737int pid_getattr(const struct path *path, struct kstat *stat,
1738 u32 request_mask, unsigned int query_flags)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001739{
David Howellsa528d352017-01-31 16:46:22 +00001740 struct inode *inode = d_inode(path->dentry);
Christoph Hellwig76f668b2018-05-16 07:19:01 +02001741 struct pid_namespace *pid = proc_pid_ns(inode);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001742 struct task_struct *task;
David Howellsc69e8d92008-11-14 10:39:19 +11001743
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001744 generic_fillattr(inode, stat);
1745
Eric W. Biedermandcb0f222012-02-09 08:48:21 -08001746 stat->uid = GLOBAL_ROOT_UID;
1747 stat->gid = GLOBAL_ROOT_GID;
Alexey Dobriyan94116922018-06-07 17:10:07 -07001748 rcu_read_lock();
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001749 task = pid_task(proc_pid(inode), PIDTYPE_PID);
1750 if (task) {
Lafcadio Wluiki796f5712017-02-24 15:00:23 -08001751 if (!has_pid_permissions(pid, task, HIDEPID_INVISIBLE)) {
Vasiliy Kulikov04996802012-01-10 15:11:31 -08001752 rcu_read_unlock();
1753 /*
1754 * This doesn't prevent learning whether PID exists,
1755 * it only makes getattr() consistent with readdir().
1756 */
1757 return -ENOENT;
1758 }
Eric W. Biederman68eb94f2017-01-03 10:23:11 +13001759 task_dump_owner(task, inode->i_mode, &stat->uid, &stat->gid);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001760 }
1761 rcu_read_unlock();
1762 return 0;
1763}
1764
1765/* dentry stuff */
1766
1767/*
Al Viro1bbc5512018-05-02 21:26:16 -04001768 * Set <pid>/... inode ownership (can change due to setuid(), etc.)
1769 */
1770void pid_update_inode(struct task_struct *task, struct inode *inode)
1771{
1772 task_dump_owner(task, inode->i_mode, &inode->i_uid, &inode->i_gid);
1773
1774 inode->i_mode &= ~(S_ISUID | S_ISGID);
1775 security_task_to_inode(task, inode);
1776}
1777
1778/*
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001779 * Rewrite the inode's ownerships here because the owning task may have
1780 * performed a setuid(), etc.
1781 *
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001782 */
Al Viro1bbc5512018-05-02 21:26:16 -04001783static int pid_revalidate(struct dentry *dentry, unsigned int flags)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001784{
Nick Piggin34286d62011-01-07 17:49:57 +11001785 struct inode *inode;
1786 struct task_struct *task;
David Howellsc69e8d92008-11-14 10:39:19 +11001787
Al Viro0b728e12012-06-10 16:03:43 -04001788 if (flags & LOOKUP_RCU)
Nick Piggin34286d62011-01-07 17:49:57 +11001789 return -ECHILD;
1790
David Howells2b0143b2015-03-17 22:25:59 +00001791 inode = d_inode(dentry);
Nick Piggin34286d62011-01-07 17:49:57 +11001792 task = get_proc_task(inode);
1793
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001794 if (task) {
Al Viro1bbc5512018-05-02 21:26:16 -04001795 pid_update_inode(task, inode);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001796 put_task_struct(task);
1797 return 1;
1798 }
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001799 return 0;
1800}
1801
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08001802static inline bool proc_inode_is_dead(struct inode *inode)
1803{
1804 return !proc_pid(inode)->tasks[PIDTYPE_PID].first;
1805}
1806
/*
 * ->d_delete() for per-task dentries.
 *
 * Returns non-zero when the task we represent is dead, so that the dentry
 * is killed immediately instead of being put on the lru list.
 */
int pid_delete_dentry(const struct dentry *dentry)
{
	struct inode *inode = d_inode(dentry);

	return proc_inode_is_dead(inode);
}
1815
Eric W. Biederman6b4e3062010-03-07 16:41:34 -08001816const struct dentry_operations pid_dentry_operations =
Eric W. Biederman28a6d672006-10-02 02:17:05 -07001817{
1818 .d_revalidate = pid_revalidate,
1819 .d_delete = pid_delete_dentry,
1820};
1821
1822/* Lookups */
1823
Eric W. Biederman1c0d04c2006-10-02 02:18:57 -07001824/*
1825 * Fill a directory entry.
1826 *
1827 * If possible create the dcache entry and derive our inode number and
1828 * file type from dcache entry.
1829 *
1830 * Since all of the proc inode numbers are dynamically generated, the inode
1831 * numbers do not exist until the inode is cache. This means creating the
1832 * the dcache entry in readdir is necessary to keep the inode numbers
1833 * reported by readdir in sync with the inode numbers reported
1834 * by stat.
1835 */
Al Virof0c3b502013-05-16 12:07:31 -04001836bool proc_fill_cache(struct file *file, struct dir_context *ctx,
Alexey Dobriyana4ef3892018-06-07 17:10:10 -07001837 const char *name, unsigned int len,
Eric Dumazetc5141e62007-05-08 00:26:15 -07001838 instantiate_t instantiate, struct task_struct *task, const void *ptr)
Eric W. Biederman61a28782006-10-02 02:18:49 -07001839{
Al Virof0c3b502013-05-16 12:07:31 -04001840 struct dentry *child, *dir = file->f_path.dentry;
Al Viro1df98b82013-06-15 11:33:10 +04001841 struct qstr qname = QSTR_INIT(name, len);
Eric W. Biederman61a28782006-10-02 02:18:49 -07001842 struct inode *inode;
Al Viro0168b9e2018-05-03 09:21:05 -04001843 unsigned type = DT_UNKNOWN;
1844 ino_t ino = 1;
Eric W. Biederman61a28782006-10-02 02:18:49 -07001845
Al Viro1df98b82013-06-15 11:33:10 +04001846 child = d_hash_and_lookup(dir, &qname);
Eric W. Biederman61a28782006-10-02 02:18:49 -07001847 if (!child) {
Al Viro37817642016-04-20 16:31:31 -04001848 DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wq);
1849 child = d_alloc_parallel(dir, &qname, &wq);
1850 if (IS_ERR(child))
Al Viro1df98b82013-06-15 11:33:10 +04001851 goto end_instantiate;
Al Viro37817642016-04-20 16:31:31 -04001852 if (d_in_lookup(child)) {
Al Viro0168b9e2018-05-03 09:21:05 -04001853 struct dentry *res;
1854 res = instantiate(child, task, ptr);
Al Viro37817642016-04-20 16:31:31 -04001855 d_lookup_done(child);
Al Viro0168b9e2018-05-03 09:21:05 -04001856 if (unlikely(res)) {
1857 dput(child);
1858 child = res;
Al Virod85b3992018-06-08 01:17:11 -04001859 if (IS_ERR(child))
1860 goto end_instantiate;
Al Viro37817642016-04-20 16:31:31 -04001861 }
Eric W. Biederman61a28782006-10-02 02:18:49 -07001862 }
1863 }
David Howells2b0143b2015-03-17 22:25:59 +00001864 inode = d_inode(child);
Al Viro147ce692013-06-15 10:26:35 +04001865 ino = inode->i_ino;
1866 type = inode->i_mode >> 12;
Eric W. Biederman61a28782006-10-02 02:18:49 -07001867 dput(child);
Al Virod85b3992018-06-08 01:17:11 -04001868end_instantiate:
Al Virof0c3b502013-05-16 12:07:31 -04001869 return dir_emit(ctx, name, len, ino, type);
Eric W. Biederman61a28782006-10-02 02:18:49 -07001870}
1871
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001872/*
1873 * dname_to_vma_addr - maps a dentry name into two unsigned longs
1874 * which represent vma start and end addresses.
1875 */
1876static int dname_to_vma_addr(struct dentry *dentry,
1877 unsigned long *start, unsigned long *end)
1878{
Alexey Dobriyanac7f1062018-02-06 15:36:59 -08001879 const char *str = dentry->d_name.name;
1880 unsigned long long sval, eval;
1881 unsigned int len;
1882
Alexey Dobriyan35318db2018-04-10 16:41:14 -07001883 if (str[0] == '0' && str[1] != '-')
1884 return -EINVAL;
Alexey Dobriyanac7f1062018-02-06 15:36:59 -08001885 len = _parse_integer(str, 16, &sval);
1886 if (len & KSTRTOX_OVERFLOW)
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001887 return -EINVAL;
Alexey Dobriyanac7f1062018-02-06 15:36:59 -08001888 if (sval != (unsigned long)sval)
1889 return -EINVAL;
1890 str += len;
1891
1892 if (*str != '-')
1893 return -EINVAL;
1894 str++;
1895
Alexey Dobriyan35318db2018-04-10 16:41:14 -07001896 if (str[0] == '0' && str[1])
1897 return -EINVAL;
Alexey Dobriyanac7f1062018-02-06 15:36:59 -08001898 len = _parse_integer(str, 16, &eval);
1899 if (len & KSTRTOX_OVERFLOW)
1900 return -EINVAL;
1901 if (eval != (unsigned long)eval)
1902 return -EINVAL;
1903 str += len;
1904
1905 if (*str != '\0')
1906 return -EINVAL;
1907
1908 *start = sval;
1909 *end = eval;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001910
1911 return 0;
1912}
1913
Al Viro0b728e12012-06-10 16:03:43 -04001914static int map_files_d_revalidate(struct dentry *dentry, unsigned int flags)
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001915{
1916 unsigned long vm_start, vm_end;
1917 bool exact_vma_exists = false;
1918 struct mm_struct *mm = NULL;
1919 struct task_struct *task;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001920 struct inode *inode;
1921 int status = 0;
1922
Al Viro0b728e12012-06-10 16:03:43 -04001923 if (flags & LOOKUP_RCU)
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001924 return -ECHILD;
1925
David Howells2b0143b2015-03-17 22:25:59 +00001926 inode = d_inode(dentry);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001927 task = get_proc_task(inode);
1928 if (!task)
1929 goto out_notask;
1930
Jann Horncaaee622016-01-20 15:00:04 -08001931 mm = mm_access(task, PTRACE_MODE_READ_FSCREDS);
Cong Wang2344bec2012-05-31 16:26:18 -07001932 if (IS_ERR_OR_NULL(mm))
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001933 goto out;
1934
1935 if (!dname_to_vma_addr(dentry, &vm_start, &vm_end)) {
1936 down_read(&mm->mmap_sem);
1937 exact_vma_exists = !!find_exact_vma(mm, vm_start, vm_end);
1938 up_read(&mm->mmap_sem);
1939 }
1940
1941 mmput(mm);
1942
1943 if (exact_vma_exists) {
Eric W. Biederman68eb94f2017-01-03 10:23:11 +13001944 task_dump_owner(task, 0, &inode->i_uid, &inode->i_gid);
1945
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001946 security_task_to_inode(task, inode);
1947 status = 1;
1948 }
1949
1950out:
1951 put_task_struct(task);
1952
1953out_notask:
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001954 return status;
1955}
1956
1957static const struct dentry_operations tid_map_files_dentry_operations = {
1958 .d_revalidate = map_files_d_revalidate,
1959 .d_delete = pid_delete_dentry,
1960};
1961
Al Viro6b255392015-11-17 10:20:54 -05001962static int map_files_get_link(struct dentry *dentry, struct path *path)
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001963{
1964 unsigned long vm_start, vm_end;
1965 struct vm_area_struct *vma;
1966 struct task_struct *task;
1967 struct mm_struct *mm;
1968 int rc;
1969
1970 rc = -ENOENT;
David Howells2b0143b2015-03-17 22:25:59 +00001971 task = get_proc_task(d_inode(dentry));
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001972 if (!task)
1973 goto out;
1974
1975 mm = get_task_mm(task);
1976 put_task_struct(task);
1977 if (!mm)
1978 goto out;
1979
1980 rc = dname_to_vma_addr(dentry, &vm_start, &vm_end);
1981 if (rc)
1982 goto out_mmput;
1983
Artem Fetishev70335ab2014-03-10 15:49:45 -07001984 rc = -ENOENT;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08001985 down_read(&mm->mmap_sem);
1986 vma = find_exact_vma(mm, vm_start, vm_end);
1987 if (vma && vma->vm_file) {
1988 *path = vma->vm_file->f_path;
1989 path_get(path);
1990 rc = 0;
1991 }
1992 up_read(&mm->mmap_sem);
1993
1994out_mmput:
1995 mmput(mm);
1996out:
1997 return rc;
1998}
1999
2000struct map_files_info {
Alexey Dobriyan20d28cd2018-02-06 15:37:06 -08002001 unsigned long start;
2002 unsigned long end;
Al Viro7b540d02012-08-27 14:55:26 -04002003 fmode_t mode;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002004};
2005
Calvin Owensbdb4d102015-09-09 15:35:54 -07002006/*
2007 * Only allow CAP_SYS_ADMIN to follow the links, due to concerns about how the
2008 * symlinks may be used to bypass permissions on ancestor directories in the
2009 * path to the file in question.
2010 */
2011static const char *
Al Viro6b255392015-11-17 10:20:54 -05002012proc_map_files_get_link(struct dentry *dentry,
Al Virofceef392015-12-29 15:58:39 -05002013 struct inode *inode,
2014 struct delayed_call *done)
Calvin Owensbdb4d102015-09-09 15:35:54 -07002015{
2016 if (!capable(CAP_SYS_ADMIN))
2017 return ERR_PTR(-EPERM);
2018
Al Virofceef392015-12-29 15:58:39 -05002019 return proc_pid_get_link(dentry, inode, done);
Calvin Owensbdb4d102015-09-09 15:35:54 -07002020}
2021
2022/*
Al Viro6b255392015-11-17 10:20:54 -05002023 * Identical to proc_pid_link_inode_operations except for get_link()
Calvin Owensbdb4d102015-09-09 15:35:54 -07002024 */
2025static const struct inode_operations proc_map_files_link_inode_operations = {
2026 .readlink = proc_pid_readlink,
Al Viro6b255392015-11-17 10:20:54 -05002027 .get_link = proc_map_files_get_link,
Calvin Owensbdb4d102015-09-09 15:35:54 -07002028 .setattr = proc_setattr,
2029};
2030
Al Viro0168b9e2018-05-03 09:21:05 -04002031static struct dentry *
2032proc_map_files_instantiate(struct dentry *dentry,
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002033 struct task_struct *task, const void *ptr)
2034{
Al Viro7b540d02012-08-27 14:55:26 -04002035 fmode_t mode = (fmode_t)(unsigned long)ptr;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002036 struct proc_inode *ei;
2037 struct inode *inode;
2038
Al Viro0168b9e2018-05-03 09:21:05 -04002039 inode = proc_pid_make_inode(dentry->d_sb, task, S_IFLNK |
Andreas Gruenbacherdb978da2016-11-10 22:18:28 +01002040 ((mode & FMODE_READ ) ? S_IRUSR : 0) |
2041 ((mode & FMODE_WRITE) ? S_IWUSR : 0));
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002042 if (!inode)
Al Viro0168b9e2018-05-03 09:21:05 -04002043 return ERR_PTR(-ENOENT);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002044
2045 ei = PROC_I(inode);
Al Viro6b255392015-11-17 10:20:54 -05002046 ei->op.proc_get_link = map_files_get_link;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002047
Calvin Owensbdb4d102015-09-09 15:35:54 -07002048 inode->i_op = &proc_map_files_link_inode_operations;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002049 inode->i_size = 64;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002050
2051 d_set_d_op(dentry, &tid_map_files_dentry_operations);
Al Viro0168b9e2018-05-03 09:21:05 -04002052 return d_splice_alias(inode, dentry);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002053}
2054
2055static struct dentry *proc_map_files_lookup(struct inode *dir,
Al Viro00cd8dd2012-06-10 17:13:09 -04002056 struct dentry *dentry, unsigned int flags)
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002057{
2058 unsigned long vm_start, vm_end;
2059 struct vm_area_struct *vma;
2060 struct task_struct *task;
Al Viro0168b9e2018-05-03 09:21:05 -04002061 struct dentry *result;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002062 struct mm_struct *mm;
2063
Al Viro0168b9e2018-05-03 09:21:05 -04002064 result = ERR_PTR(-ENOENT);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002065 task = get_proc_task(dir);
2066 if (!task)
2067 goto out;
2068
Al Viro0168b9e2018-05-03 09:21:05 -04002069 result = ERR_PTR(-EACCES);
Jann Horncaaee622016-01-20 15:00:04 -08002070 if (!ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS))
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002071 goto out_put_task;
2072
Al Viro0168b9e2018-05-03 09:21:05 -04002073 result = ERR_PTR(-ENOENT);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002074 if (dname_to_vma_addr(dentry, &vm_start, &vm_end))
Cyrill Gorcunoveb94cd92012-05-17 17:03:25 -07002075 goto out_put_task;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002076
2077 mm = get_task_mm(task);
2078 if (!mm)
Cyrill Gorcunoveb94cd92012-05-17 17:03:25 -07002079 goto out_put_task;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002080
2081 down_read(&mm->mmap_sem);
2082 vma = find_exact_vma(mm, vm_start, vm_end);
2083 if (!vma)
2084 goto out_no_vma;
2085
Stanislav Kinsbursky05f56482012-11-26 16:29:42 -08002086 if (vma->vm_file)
Al Viro0168b9e2018-05-03 09:21:05 -04002087 result = proc_map_files_instantiate(dentry, task,
Stanislav Kinsbursky05f56482012-11-26 16:29:42 -08002088 (void *)(unsigned long)vma->vm_file->f_mode);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002089
2090out_no_vma:
2091 up_read(&mm->mmap_sem);
2092 mmput(mm);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002093out_put_task:
2094 put_task_struct(task);
2095out:
Al Viro0168b9e2018-05-03 09:21:05 -04002096 return result;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002097}
2098
2099static const struct inode_operations proc_map_files_inode_operations = {
2100 .lookup = proc_map_files_lookup,
2101 .permission = proc_fd_permission,
2102 .setattr = proc_setattr,
2103};
2104
2105static int
Al Virof0c3b502013-05-16 12:07:31 -04002106proc_map_files_readdir(struct file *file, struct dir_context *ctx)
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002107{
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002108 struct vm_area_struct *vma;
2109 struct task_struct *task;
2110 struct mm_struct *mm;
Al Virof0c3b502013-05-16 12:07:31 -04002111 unsigned long nr_files, pos, i;
2112 struct flex_array *fa = NULL;
2113 struct map_files_info info;
2114 struct map_files_info *p;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002115 int ret;
2116
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002117 ret = -ENOENT;
Al Virof0c3b502013-05-16 12:07:31 -04002118 task = get_proc_task(file_inode(file));
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002119 if (!task)
2120 goto out;
2121
2122 ret = -EACCES;
Jann Horncaaee622016-01-20 15:00:04 -08002123 if (!ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS))
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002124 goto out_put_task;
2125
2126 ret = 0;
Al Virof0c3b502013-05-16 12:07:31 -04002127 if (!dir_emit_dots(file, ctx))
2128 goto out_put_task;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002129
Al Virof0c3b502013-05-16 12:07:31 -04002130 mm = get_task_mm(task);
2131 if (!mm)
2132 goto out_put_task;
2133 down_read(&mm->mmap_sem);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002134
Al Virof0c3b502013-05-16 12:07:31 -04002135 nr_files = 0;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002136
Al Virof0c3b502013-05-16 12:07:31 -04002137 /*
2138 * We need two passes here:
2139 *
2140 * 1) Collect vmas of mapped files with mmap_sem taken
2141 * 2) Release mmap_sem and instantiate entries
2142 *
2143 * otherwise we get lockdep complained, since filldir()
2144 * routine might require mmap_sem taken in might_fault().
2145 */
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002146
Al Virof0c3b502013-05-16 12:07:31 -04002147 for (vma = mm->mmap, pos = 2; vma; vma = vma->vm_next) {
2148 if (vma->vm_file && ++pos > ctx->pos)
2149 nr_files++;
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002150 }
Al Virof0c3b502013-05-16 12:07:31 -04002151
2152 if (nr_files) {
2153 fa = flex_array_alloc(sizeof(info), nr_files,
2154 GFP_KERNEL);
2155 if (!fa || flex_array_prealloc(fa, 0, nr_files,
2156 GFP_KERNEL)) {
2157 ret = -ENOMEM;
2158 if (fa)
2159 flex_array_free(fa);
2160 up_read(&mm->mmap_sem);
2161 mmput(mm);
2162 goto out_put_task;
2163 }
2164 for (i = 0, vma = mm->mmap, pos = 2; vma;
2165 vma = vma->vm_next) {
2166 if (!vma->vm_file)
2167 continue;
2168 if (++pos <= ctx->pos)
2169 continue;
2170
Alexey Dobriyan20d28cd2018-02-06 15:37:06 -08002171 info.start = vma->vm_start;
2172 info.end = vma->vm_end;
Al Virof0c3b502013-05-16 12:07:31 -04002173 info.mode = vma->vm_file->f_mode;
Al Virof0c3b502013-05-16 12:07:31 -04002174 if (flex_array_put(fa, i++, &info, GFP_KERNEL))
2175 BUG();
2176 }
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002177 }
Al Virof0c3b502013-05-16 12:07:31 -04002178 up_read(&mm->mmap_sem);
Alexey Dobriyanfe079a52018-04-10 16:32:05 -07002179 mmput(mm);
Al Virof0c3b502013-05-16 12:07:31 -04002180
2181 for (i = 0; i < nr_files; i++) {
Alexey Dobriyan20d28cd2018-02-06 15:37:06 -08002182 char buf[4 * sizeof(long) + 2]; /* max: %lx-%lx\0 */
2183 unsigned int len;
2184
Al Virof0c3b502013-05-16 12:07:31 -04002185 p = flex_array_get(fa, i);
Alexey Dobriyan20d28cd2018-02-06 15:37:06 -08002186 len = snprintf(buf, sizeof(buf), "%lx-%lx", p->start, p->end);
Al Virof0c3b502013-05-16 12:07:31 -04002187 if (!proc_fill_cache(file, ctx,
Alexey Dobriyan20d28cd2018-02-06 15:37:06 -08002188 buf, len,
Al Virof0c3b502013-05-16 12:07:31 -04002189 proc_map_files_instantiate,
2190 task,
2191 (void *)(unsigned long)p->mode))
2192 break;
2193 ctx->pos++;
2194 }
2195 if (fa)
2196 flex_array_free(fa);
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002197
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002198out_put_task:
2199 put_task_struct(task);
2200out:
2201 return ret;
2202}
2203
2204static const struct file_operations proc_map_files_operations = {
2205 .read = generic_read_dir,
Al Virof50752e2016-04-20 17:13:54 -04002206 .iterate_shared = proc_map_files_readdir,
2207 .llseek = generic_file_llseek,
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002208};
2209
Nicolas Pitreb18b6a92017-01-21 00:09:08 -05002210#if defined(CONFIG_CHECKPOINT_RESTORE) && defined(CONFIG_POSIX_TIMERS)
/* Per-open state of the timers seq_file. */
struct timers_private {
	struct pid *pid;		/* set at open time from proc_pid() */
	struct task_struct *task;	/* held between ->start and ->stop */
	struct sighand_struct *sighand;	/* locked between ->start and ->stop */
	struct pid_namespace *ns;	/* set at open time from proc_pid_ns() */
	unsigned long flags;		/* flags word for (un)lock_task_sighand() */
};
2218
2219static void *timers_start(struct seq_file *m, loff_t *pos)
2220{
2221 struct timers_private *tp = m->private;
2222
2223 tp->task = get_pid_task(tp->pid, PIDTYPE_PID);
2224 if (!tp->task)
2225 return ERR_PTR(-ESRCH);
2226
2227 tp->sighand = lock_task_sighand(tp->task, &tp->flags);
2228 if (!tp->sighand)
2229 return ERR_PTR(-ESRCH);
2230
2231 return seq_list_start(&tp->task->signal->posix_timers, *pos);
2232}
2233
2234static void *timers_next(struct seq_file *m, void *v, loff_t *pos)
2235{
2236 struct timers_private *tp = m->private;
2237 return seq_list_next(v, &tp->task->signal->posix_timers, pos);
2238}
2239
2240static void timers_stop(struct seq_file *m, void *v)
2241{
2242 struct timers_private *tp = m->private;
2243
2244 if (tp->sighand) {
2245 unlock_task_sighand(tp->task, &tp->flags);
2246 tp->sighand = NULL;
2247 }
2248
2249 if (tp->task) {
2250 put_task_struct(tp->task);
2251 tp->task = NULL;
2252 }
2253}
2254
2255static int show_timer(struct seq_file *m, void *v)
2256{
2257 struct k_itimer *timer;
Pavel Emelyanov57b80152013-03-11 13:13:08 +04002258 struct timers_private *tp = m->private;
2259 int notify;
Alexey Dobriyancedbcca2014-08-08 14:21:33 -07002260 static const char * const nstr[] = {
Pavel Emelyanov57b80152013-03-11 13:13:08 +04002261 [SIGEV_SIGNAL] = "signal",
2262 [SIGEV_NONE] = "none",
2263 [SIGEV_THREAD] = "thread",
2264 };
Pavel Emelyanov48f6a7a2013-03-11 13:12:45 +04002265
2266 timer = list_entry((struct list_head *)v, struct k_itimer, list);
Pavel Emelyanov57b80152013-03-11 13:13:08 +04002267 notify = timer->it_sigev_notify;
2268
Pavel Emelyanov48f6a7a2013-03-11 13:12:45 +04002269 seq_printf(m, "ID: %d\n", timer->it_id);
Linus Torvaldsba3edf1f2017-12-06 18:23:27 -08002270 seq_printf(m, "signal: %d/%px\n",
Joe Perches25ce3192015-04-15 16:18:17 -07002271 timer->sigq->info.si_signo,
2272 timer->sigq->info.si_value.sival_ptr);
Pavel Emelyanov57b80152013-03-11 13:13:08 +04002273 seq_printf(m, "notify: %s/%s.%d\n",
Joe Perches25ce3192015-04-15 16:18:17 -07002274 nstr[notify & ~SIGEV_THREAD_ID],
2275 (notify & SIGEV_THREAD_ID) ? "tid" : "pid",
2276 pid_nr_ns(timer->it_pid, tp->ns));
Pavel Tikhomirov15ef0292013-05-17 02:12:03 +04002277 seq_printf(m, "ClockID: %d\n", timer->it_clock);
Pavel Emelyanov48f6a7a2013-03-11 13:12:45 +04002278
2279 return 0;
2280}
2281
2282static const struct seq_operations proc_timers_seq_ops = {
2283 .start = timers_start,
2284 .next = timers_next,
2285 .stop = timers_stop,
2286 .show = show_timer,
2287};
2288
2289static int proc_timers_open(struct inode *inode, struct file *file)
2290{
2291 struct timers_private *tp;
2292
2293 tp = __seq_open_private(file, &proc_timers_seq_ops,
2294 sizeof(struct timers_private));
2295 if (!tp)
2296 return -ENOMEM;
2297
2298 tp->pid = proc_pid(inode);
Christoph Hellwig76f668b2018-05-16 07:19:01 +02002299 tp->ns = proc_pid_ns(inode);
Pavel Emelyanov48f6a7a2013-03-11 13:12:45 +04002300 return 0;
2301}
2302
2303static const struct file_operations proc_timers_operations = {
2304 .open = proc_timers_open,
2305 .read = seq_read,
2306 .llseek = seq_lseek,
2307 .release = seq_release_private,
2308};
Eric Engestromb5946be2016-03-17 14:20:57 -07002309#endif
Pavel Emelyanov640708a2012-01-10 15:11:23 -08002310
John Stultz5de23d42016-03-17 14:20:54 -07002311static ssize_t timerslack_ns_write(struct file *file, const char __user *buf,
2312 size_t count, loff_t *offset)
2313{
2314 struct inode *inode = file_inode(file);
2315 struct task_struct *p;
2316 u64 slack_ns;
2317 int err;
2318
2319 err = kstrtoull_from_user(buf, count, 10, &slack_ns);
2320 if (err < 0)
2321 return err;
2322
2323 p = get_proc_task(inode);
2324 if (!p)
2325 return -ESRCH;
2326
John Stultz4b2bd5f2016-10-07 17:02:33 -07002327 if (p != current) {
2328 if (!capable(CAP_SYS_NICE)) {
2329 count = -EPERM;
2330 goto out;
2331 }
John Stultz5de23d42016-03-17 14:20:54 -07002332
John Stultz4b2bd5f2016-10-07 17:02:33 -07002333 err = security_task_setscheduler(p);
2334 if (err) {
2335 count = err;
2336 goto out;
2337 }
John Stultz904763e2016-10-07 17:02:29 -07002338 }
2339
John Stultz7abbaf92016-10-07 17:02:26 -07002340 task_lock(p);
2341 if (slack_ns == 0)
2342 p->timer_slack_ns = p->default_timer_slack_ns;
2343 else
2344 p->timer_slack_ns = slack_ns;
2345 task_unlock(p);
2346
2347out:
John Stultz5de23d42016-03-17 14:20:54 -07002348 put_task_struct(p);
2349
2350 return count;
2351}
2352
2353static int timerslack_ns_show(struct seq_file *m, void *v)
2354{
2355 struct inode *inode = m->private;
2356 struct task_struct *p;
John Stultz7abbaf92016-10-07 17:02:26 -07002357 int err = 0;
John Stultz5de23d42016-03-17 14:20:54 -07002358
2359 p = get_proc_task(inode);
2360 if (!p)
2361 return -ESRCH;
2362
John Stultz4b2bd5f2016-10-07 17:02:33 -07002363 if (p != current) {
John Stultz5de23d42016-03-17 14:20:54 -07002364
John Stultz4b2bd5f2016-10-07 17:02:33 -07002365 if (!capable(CAP_SYS_NICE)) {
2366 err = -EPERM;
2367 goto out;
2368 }
2369 err = security_task_getscheduler(p);
2370 if (err)
2371 goto out;
2372 }
John Stultz904763e2016-10-07 17:02:29 -07002373
John Stultz7abbaf92016-10-07 17:02:26 -07002374 task_lock(p);
2375 seq_printf(m, "%llu\n", p->timer_slack_ns);
2376 task_unlock(p);
2377
2378out:
John Stultz5de23d42016-03-17 14:20:54 -07002379 put_task_struct(p);
2380
2381 return err;
2382}
2383
2384static int timerslack_ns_open(struct inode *inode, struct file *filp)
2385{
2386 return single_open(filp, timerslack_ns_show, inode);
2387}
2388
2389static const struct file_operations proc_pid_set_timerslack_ns_operations = {
2390 .open = timerslack_ns_open,
2391 .read = seq_read,
2392 .write = timerslack_ns_write,
2393 .llseek = seq_lseek,
2394 .release = single_release,
2395};
2396
Al Viro0168b9e2018-05-03 09:21:05 -04002397static struct dentry *proc_pident_instantiate(struct dentry *dentry,
2398 struct task_struct *task, const void *ptr)
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002399{
Eric Dumazetc5141e62007-05-08 00:26:15 -07002400 const struct pid_entry *p = ptr;
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002401 struct inode *inode;
2402 struct proc_inode *ei;
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002403
Al Viro0168b9e2018-05-03 09:21:05 -04002404 inode = proc_pid_make_inode(dentry->d_sb, task, p->mode);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002405 if (!inode)
Al Viro0168b9e2018-05-03 09:21:05 -04002406 return ERR_PTR(-ENOENT);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002407
2408 ei = PROC_I(inode);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002409 if (S_ISDIR(inode->i_mode))
Miklos Szeredibfe86842011-10-28 14:13:29 +02002410 set_nlink(inode, 2); /* Use getattr to fix if necessary */
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002411 if (p->iop)
2412 inode->i_op = p->iop;
2413 if (p->fop)
2414 inode->i_fop = p->fop;
2415 ei->op = p->op;
Al Viro1bbc5512018-05-02 21:26:16 -04002416 pid_update_inode(task, inode);
Nick Pigginfb045ad2011-01-07 17:49:55 +11002417 d_set_d_op(dentry, &pid_dentry_operations);
Al Viro0168b9e2018-05-03 09:21:05 -04002418 return d_splice_alias(inode, dentry);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07002419}
2420
Linus Torvalds1da177e2005-04-16 15:20:36 -07002421static struct dentry *proc_pident_lookup(struct inode *dir,
2422 struct dentry *dentry,
Eric Dumazetc5141e62007-05-08 00:26:15 -07002423 const struct pid_entry *ents,
Eric W. Biederman7bcd6b02006-10-02 02:18:56 -07002424 unsigned int nents)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002425{
Eric W. Biederman99f89552006-06-26 00:25:55 -07002426 struct task_struct *task = get_proc_task(dir);
Eric Dumazetc5141e62007-05-08 00:26:15 -07002427 const struct pid_entry *p, *last;
Al Viro0168b9e2018-05-03 09:21:05 -04002428 struct dentry *res = ERR_PTR(-ENOENT);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002429
Eric W. Biederman99f89552006-06-26 00:25:55 -07002430 if (!task)
2431 goto out_no_task;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002432
Eric W. Biederman20cdc892006-10-02 02:17:07 -07002433 /*
2434 * Yes, it does not scale. And it should not. Don't add
2435 * new entries into /proc/<tgid>/ without very good reasons.
2436 */
Alexey Dobriyanbac5f5d2016-12-12 16:45:28 -08002437 last = &ents[nents];
2438 for (p = ents; p < last; p++) {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002439 if (p->len != dentry->d_name.len)
2440 continue;
2441 if (!memcmp(dentry->d_name.name, p->name, p->len))
2442 break;
2443 }
Alexey Dobriyanbac5f5d2016-12-12 16:45:28 -08002444 if (p >= last)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002445 goto out;
2446
Al Viro0168b9e2018-05-03 09:21:05 -04002447 res = proc_pident_instantiate(dentry, task, p);
Linus Torvalds1da177e2005-04-16 15:20:36 -07002448out:
Eric W. Biederman99f89552006-06-26 00:25:55 -07002449 put_task_struct(task);
2450out_no_task:
Al Viro0168b9e2018-05-03 09:21:05 -04002451 return res;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002452}
2453
Al Virof0c3b502013-05-16 12:07:31 -04002454static int proc_pident_readdir(struct file *file, struct dir_context *ctx,
Eric Dumazetc5141e62007-05-08 00:26:15 -07002455 const struct pid_entry *ents, unsigned int nents)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002456{
Al Virof0c3b502013-05-16 12:07:31 -04002457 struct task_struct *task = get_proc_task(file_inode(file));
2458 const struct pid_entry *p;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002459
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002460 if (!task)
Al Virof0c3b502013-05-16 12:07:31 -04002461 return -ENOENT;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002462
Al Virof0c3b502013-05-16 12:07:31 -04002463 if (!dir_emit_dots(file, ctx))
2464 goto out;
2465
2466 if (ctx->pos >= nents + 2)
2467 goto out;
2468
Alexey Dobriyanbac5f5d2016-12-12 16:45:28 -08002469 for (p = ents + (ctx->pos - 2); p < ents + nents; p++) {
Al Virof0c3b502013-05-16 12:07:31 -04002470 if (!proc_fill_cache(file, ctx, p->name, p->len,
2471 proc_pident_instantiate, task, p))
2472 break;
2473 ctx->pos++;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002474 }
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002475out:
Eric W. Biederman61a28782006-10-02 02:18:49 -07002476 put_task_struct(task);
Al Virof0c3b502013-05-16 12:07:31 -04002477 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07002478}
2479
Linus Torvalds1da177e2005-04-16 15:20:36 -07002480#ifdef CONFIG_SECURITY
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002481static ssize_t proc_pid_attr_read(struct file * file, char __user * buf,
2482 size_t count, loff_t *ppos)
2483{
Al Viro496ad9a2013-01-23 17:07:38 -05002484 struct inode * inode = file_inode(file);
Al Viro04ff9702007-03-12 16:17:58 +00002485 char *p = NULL;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002486 ssize_t length;
2487 struct task_struct *task = get_proc_task(inode);
2488
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002489 if (!task)
Al Viro04ff9702007-03-12 16:17:58 +00002490 return -ESRCH;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002491
2492 length = security_getprocattr(task,
Josef "Jeff" Sipek2fddfee2006-12-08 02:36:36 -08002493 (char*)file->f_path.dentry->d_name.name,
Al Viro04ff9702007-03-12 16:17:58 +00002494 &p);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002495 put_task_struct(task);
Al Viro04ff9702007-03-12 16:17:58 +00002496 if (length > 0)
2497 length = simple_read_from_buffer(buf, count, ppos, p, length);
2498 kfree(p);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002499 return length;
2500}
2501
2502static ssize_t proc_pid_attr_write(struct file * file, const char __user * buf,
2503 size_t count, loff_t *ppos)
2504{
Al Viro496ad9a2013-01-23 17:07:38 -05002505 struct inode * inode = file_inode(file);
Al Virobb646cd2015-12-24 00:16:30 -05002506 void *page;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002507 ssize_t length;
2508 struct task_struct *task = get_proc_task(inode);
2509
2510 length = -ESRCH;
2511 if (!task)
2512 goto out_no_task;
Stephen Smalleyb21507e2017-01-09 10:07:31 -05002513
2514 /* A task may only write its own attributes. */
2515 length = -EACCES;
2516 if (current != task)
2517 goto out;
2518
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002519 if (count > PAGE_SIZE)
2520 count = PAGE_SIZE;
2521
2522 /* No partial writes. */
2523 length = -EINVAL;
2524 if (*ppos != 0)
2525 goto out;
2526
Al Virobb646cd2015-12-24 00:16:30 -05002527 page = memdup_user(buf, count);
2528 if (IS_ERR(page)) {
2529 length = PTR_ERR(page);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002530 goto out;
Al Virobb646cd2015-12-24 00:16:30 -05002531 }
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002532
David Howells107db7c2009-05-08 13:55:27 +01002533 /* Guard against adverse ptrace interaction */
Stephen Smalleyb21507e2017-01-09 10:07:31 -05002534 length = mutex_lock_interruptible(&current->signal->cred_guard_mutex);
David Howells107db7c2009-05-08 13:55:27 +01002535 if (length < 0)
2536 goto out_free;
2537
Stephen Smalleyb21507e2017-01-09 10:07:31 -05002538 length = security_setprocattr(file->f_path.dentry->d_name.name,
Al Virobb646cd2015-12-24 00:16:30 -05002539 page, count);
Stephen Smalleyb21507e2017-01-09 10:07:31 -05002540 mutex_unlock(&current->signal->cred_guard_mutex);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002541out_free:
Al Virobb646cd2015-12-24 00:16:30 -05002542 kfree(page);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002543out:
2544 put_task_struct(task);
2545out_no_task:
2546 return length;
2547}
2548
Arjan van de Ven00977a52007-02-12 00:55:34 -08002549static const struct file_operations proc_pid_attr_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002550 .read = proc_pid_attr_read,
2551 .write = proc_pid_attr_write,
Arnd Bergmann87df8422010-03-17 23:06:02 +01002552 .llseek = generic_file_llseek,
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002553};
2554
/*
 * Entries of the "attr" directory. All of them are served by
 * proc_pid_attr_operations, which uses the entry name as the attribute
 * name. "prev" is the only read-only entry. proc_pident_readdir() walks
 * this table by index, so the order here is the order entries are listed.
 */
static const struct pid_entry attr_dir_stuff[] = {
	REG("current",    S_IRUGO|S_IWUGO, proc_pid_attr_operations),
	REG("prev",       S_IRUGO,	   proc_pid_attr_operations),
	REG("exec",       S_IRUGO|S_IWUGO, proc_pid_attr_operations),
	REG("fscreate",   S_IRUGO|S_IWUGO, proc_pid_attr_operations),
	REG("keycreate",  S_IRUGO|S_IWUGO, proc_pid_attr_operations),
	REG("sockcreate", S_IRUGO|S_IWUGO, proc_pid_attr_operations),
};
2563
Al Virof0c3b502013-05-16 12:07:31 -04002564static int proc_attr_dir_readdir(struct file *file, struct dir_context *ctx)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002565{
Al Virof0c3b502013-05-16 12:07:31 -04002566 return proc_pident_readdir(file, ctx,
2567 attr_dir_stuff, ARRAY_SIZE(attr_dir_stuff));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002568}
2569
Arjan van de Ven00977a52007-02-12 00:55:34 -08002570static const struct file_operations proc_attr_dir_operations = {
Linus Torvalds1da177e2005-04-16 15:20:36 -07002571 .read = generic_read_dir,
Al Virof50752e2016-04-20 17:13:54 -04002572 .iterate_shared = proc_attr_dir_readdir,
2573 .llseek = generic_file_llseek,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002574};
2575
Eric W. Biederman72d9dcf2006-10-02 02:18:50 -07002576static struct dentry *proc_attr_dir_lookup(struct inode *dir,
Al Viro00cd8dd2012-06-10 17:13:09 -04002577 struct dentry *dentry, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07002578{
Eric W. Biederman7bcd6b02006-10-02 02:18:56 -07002579 return proc_pident_lookup(dir, dentry,
2580 attr_dir_stuff, ARRAY_SIZE(attr_dir_stuff));
Linus Torvalds1da177e2005-04-16 15:20:36 -07002581}
2582
Arjan van de Venc5ef1c42007-02-12 00:55:40 -08002583static const struct inode_operations proc_attr_dir_inode_operations = {
Eric W. Biederman72d9dcf2006-10-02 02:18:50 -07002584 .lookup = proc_attr_dir_lookup,
Eric W. Biederman99f89552006-06-26 00:25:55 -07002585 .getattr = pid_getattr,
Linus Torvalds6d76fa52006-07-15 12:26:45 -07002586 .setattr = proc_setattr,
Linus Torvalds1da177e2005-04-16 15:20:36 -07002587};
2588
Linus Torvalds1da177e2005-04-16 15:20:36 -07002589#endif
2590
Christoph Hellwig698ba7b2009-12-15 16:47:37 -08002591#ifdef CONFIG_ELF_CORE
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002592static ssize_t proc_coredump_filter_read(struct file *file, char __user *buf,
2593 size_t count, loff_t *ppos)
2594{
Al Viro496ad9a2013-01-23 17:07:38 -05002595 struct task_struct *task = get_proc_task(file_inode(file));
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002596 struct mm_struct *mm;
2597 char buffer[PROC_NUMBUF];
2598 size_t len;
2599 int ret;
2600
2601 if (!task)
2602 return -ESRCH;
2603
2604 ret = 0;
2605 mm = get_task_mm(task);
2606 if (mm) {
2607 len = snprintf(buffer, sizeof(buffer), "%08lx\n",
2608 ((mm->flags & MMF_DUMP_FILTER_MASK) >>
2609 MMF_DUMP_FILTER_SHIFT));
2610 mmput(mm);
2611 ret = simple_read_from_buffer(buf, count, ppos, buffer, len);
2612 }
2613
2614 put_task_struct(task);
2615
2616 return ret;
2617}
2618
2619static ssize_t proc_coredump_filter_write(struct file *file,
2620 const char __user *buf,
2621 size_t count,
2622 loff_t *ppos)
2623{
2624 struct task_struct *task;
2625 struct mm_struct *mm;
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002626 unsigned int val;
2627 int ret;
2628 int i;
2629 unsigned long mask;
2630
Alexey Dobriyan774636e2015-09-09 15:36:59 -07002631 ret = kstrtouint_from_user(buf, count, 0, &val);
2632 if (ret < 0)
2633 return ret;
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002634
2635 ret = -ESRCH;
Al Viro496ad9a2013-01-23 17:07:38 -05002636 task = get_proc_task(file_inode(file));
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002637 if (!task)
2638 goto out_no_task;
2639
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002640 mm = get_task_mm(task);
2641 if (!mm)
2642 goto out_no_mm;
Colin Ian King41a0c2492015-12-18 14:22:01 -08002643 ret = 0;
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002644
2645 for (i = 0, mask = 1; i < MMF_DUMP_FILTER_BITS; i++, mask <<= 1) {
2646 if (val & mask)
2647 set_bit(i + MMF_DUMP_FILTER_SHIFT, &mm->flags);
2648 else
2649 clear_bit(i + MMF_DUMP_FILTER_SHIFT, &mm->flags);
2650 }
2651
2652 mmput(mm);
2653 out_no_mm:
2654 put_task_struct(task);
2655 out_no_task:
Alexey Dobriyan774636e2015-09-09 15:36:59 -07002656 if (ret < 0)
2657 return ret;
2658 return count;
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002659}
2660
2661static const struct file_operations proc_coredump_filter_operations = {
2662 .read = proc_coredump_filter_read,
2663 .write = proc_coredump_filter_write,
Arnd Bergmann87df8422010-03-17 23:06:02 +01002664 .llseek = generic_file_llseek,
Kawai, Hidehiro3cb4a0b2007-07-19 01:48:28 -07002665};
2666#endif
2667
Andrew Mortonaba76fd2006-12-10 02:19:48 -08002668#ifdef CONFIG_TASK_IO_ACCOUNTING
Alexey Dobriyan19aadc92014-08-08 14:21:50 -07002669static int do_io_accounting(struct task_struct *task, struct seq_file *m, int whole)
Andrew Mortonaba76fd2006-12-10 02:19:48 -08002670{
Andrea Righi940389b2008-07-28 00:48:12 +02002671 struct task_io_accounting acct = task->ioac;
Andrea Righi59954772008-07-27 17:29:15 +02002672 unsigned long flags;
Vasiliy Kulikov293eb1e2011-07-26 16:08:38 -07002673 int result;
Andrea Righi297c5d92008-07-25 01:48:49 -07002674
Vasiliy Kulikov293eb1e2011-07-26 16:08:38 -07002675 result = mutex_lock_killable(&task->signal->cred_guard_mutex);
2676 if (result)
2677 return result;
2678
Jann Horncaaee622016-01-20 15:00:04 -08002679 if (!ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS)) {
Vasiliy Kulikov293eb1e2011-07-26 16:08:38 -07002680 result = -EACCES;
2681 goto out_unlock;
2682 }
Vasiliy Kulikov1d1221f2011-06-24 16:08:38 +04002683
Andrea Righi59954772008-07-27 17:29:15 +02002684 if (whole && lock_task_sighand(task, &flags)) {
2685 struct task_struct *t = task;
Andrea Righib2d002d2008-07-26 15:22:27 -07002686
Andrea Righi59954772008-07-27 17:29:15 +02002687 task_io_accounting_add(&acct, &task->signal->ioac);
2688 while_each_thread(task, t)
2689 task_io_accounting_add(&acct, &t->ioac);
Andrea Righi297c5d92008-07-25 01:48:49 -07002690
Andrea Righi59954772008-07-27 17:29:15 +02002691 unlock_task_sighand(task, &flags);
Andrea Righi297c5d92008-07-25 01:48:49 -07002692 }
Joe Perches25ce3192015-04-15 16:18:17 -07002693 seq_printf(m,
2694 "rchar: %llu\n"
2695 "wchar: %llu\n"
2696 "syscr: %llu\n"
2697 "syscw: %llu\n"
2698 "read_bytes: %llu\n"
2699 "write_bytes: %llu\n"
2700 "cancelled_write_bytes: %llu\n",
2701 (unsigned long long)acct.rchar,
2702 (unsigned long long)acct.wchar,
2703 (unsigned long long)acct.syscr,
2704 (unsigned long long)acct.syscw,
2705 (unsigned long long)acct.read_bytes,
2706 (unsigned long long)acct.write_bytes,
2707 (unsigned long long)acct.cancelled_write_bytes);
2708 result = 0;
2709
Vasiliy Kulikov293eb1e2011-07-26 16:08:38 -07002710out_unlock:
2711 mutex_unlock(&task->signal->cred_guard_mutex);
2712 return result;
Andrew Mortonaba76fd2006-12-10 02:19:48 -08002713}
Andrea Righi297c5d92008-07-25 01:48:49 -07002714
/* I/O accounting for @task only (do_io_accounting() with whole == 0). */
static int proc_tid_io_accounting(struct seq_file *m, struct pid_namespace *ns,
				  struct pid *pid, struct task_struct *task)
{
	const int whole = 0;

	return do_io_accounting(task, m, whole);
}
2720
/*
 * I/O accounting with the other threads' counters added in
 * (do_io_accounting() with whole == 1).
 */
static int proc_tgid_io_accounting(struct seq_file *m, struct pid_namespace *ns,
				   struct pid *pid, struct task_struct *task)
{
	const int whole = 1;

	return do_io_accounting(task, m, whole);
}
2726#endif /* CONFIG_TASK_IO_ACCOUNTING */
Andrew Mortonaba76fd2006-12-10 02:19:48 -08002727
Eric W. Biederman22d917d2011-11-17 00:11:58 -08002728#ifdef CONFIG_USER_NS
2729static int proc_id_map_open(struct inode *inode, struct file *file,
Fabian Frederickccf94f12014-08-08 14:21:22 -07002730 const struct seq_operations *seq_ops)
Eric W. Biederman22d917d2011-11-17 00:11:58 -08002731{
2732 struct user_namespace *ns = NULL;
2733 struct task_struct *task;
2734 struct seq_file *seq;
2735 int ret = -EINVAL;
2736
2737 task = get_proc_task(inode);
2738 if (task) {
2739 rcu_read_lock();
2740 ns = get_user_ns(task_cred_xxx(task, user_ns));
2741 rcu_read_unlock();
2742 put_task_struct(task);
2743 }
2744 if (!ns)
2745 goto err;
2746
2747 ret = seq_open(file, seq_ops);
2748 if (ret)
2749 goto err_put_ns;
2750
2751 seq = file->private_data;
2752 seq->private = ns;
2753
2754 return 0;
2755err_put_ns:
2756 put_user_ns(ns);
2757err:
2758 return ret;
2759}
2760
2761static int proc_id_map_release(struct inode *inode, struct file *file)
2762{
2763 struct seq_file *seq = file->private_data;
2764 struct user_namespace *ns = seq->private;
2765 put_user_ns(ns);
2766 return seq_release(inode, file);
2767}
2768
2769static int proc_uid_map_open(struct inode *inode, struct file *file)
2770{
2771 return proc_id_map_open(inode, file, &proc_uid_seq_operations);
2772}
2773
2774static int proc_gid_map_open(struct inode *inode, struct file *file)
2775{
2776 return proc_id_map_open(inode, file, &proc_gid_seq_operations);
2777}
2778
Eric W. Biedermanf76d2072012-08-30 01:24:05 -07002779static int proc_projid_map_open(struct inode *inode, struct file *file)
2780{
2781 return proc_id_map_open(inode, file, &proc_projid_seq_operations);
2782}
2783
Eric W. Biederman22d917d2011-11-17 00:11:58 -08002784static const struct file_operations proc_uid_map_operations = {
2785 .open = proc_uid_map_open,
2786 .write = proc_uid_map_write,
2787 .read = seq_read,
2788 .llseek = seq_lseek,
2789 .release = proc_id_map_release,
2790};
2791
2792static const struct file_operations proc_gid_map_operations = {
2793 .open = proc_gid_map_open,
2794 .write = proc_gid_map_write,
2795 .read = seq_read,
2796 .llseek = seq_lseek,
2797 .release = proc_id_map_release,
2798};
Eric W. Biedermanf76d2072012-08-30 01:24:05 -07002799
2800static const struct file_operations proc_projid_map_operations = {
2801 .open = proc_projid_map_open,
2802 .write = proc_projid_map_write,
2803 .read = seq_read,
2804 .llseek = seq_lseek,
2805 .release = proc_id_map_release,
2806};
Eric W. Biederman9cc46512014-12-02 12:27:26 -06002807
2808static int proc_setgroups_open(struct inode *inode, struct file *file)
2809{
2810 struct user_namespace *ns = NULL;
2811 struct task_struct *task;
2812 int ret;
2813
2814 ret = -ESRCH;
2815 task = get_proc_task(inode);
2816 if (task) {
2817 rcu_read_lock();
2818 ns = get_user_ns(task_cred_xxx(task, user_ns));
2819 rcu_read_unlock();
2820 put_task_struct(task);
2821 }
2822 if (!ns)
2823 goto err;
2824
2825 if (file->f_mode & FMODE_WRITE) {
2826 ret = -EACCES;
2827 if (!ns_capable(ns, CAP_SYS_ADMIN))
2828 goto err_put_ns;
2829 }
2830
2831 ret = single_open(file, &proc_setgroups_show, ns);
2832 if (ret)
2833 goto err_put_ns;
2834
2835 return 0;
2836err_put_ns:
2837 put_user_ns(ns);
2838err:
2839 return ret;
2840}
2841
2842static int proc_setgroups_release(struct inode *inode, struct file *file)
2843{
2844 struct seq_file *seq = file->private_data;
2845 struct user_namespace *ns = seq->private;
2846 int ret = single_release(inode, file);
2847 put_user_ns(ns);
2848 return ret;
2849}
2850
2851static const struct file_operations proc_setgroups_operations = {
2852 .open = proc_setgroups_open,
2853 .write = proc_setgroups_write,
2854 .read = seq_read,
2855 .llseek = seq_lseek,
2856 .release = proc_setgroups_release,
2857};
Eric W. Biederman22d917d2011-11-17 00:11:58 -08002858#endif /* CONFIG_USER_NS */
2859
Kees Cook47830722008-10-06 03:11:58 +04002860static int proc_pid_personality(struct seq_file *m, struct pid_namespace *ns,
2861 struct pid *pid, struct task_struct *task)
2862{
Al Viroa9712bc2011-03-23 15:52:50 -04002863 int err = lock_trace(task);
2864 if (!err) {
2865 seq_printf(m, "%08x\n", task->personality);
2866 unlock_trace(task);
2867 }
2868 return err;
Kees Cook47830722008-10-06 03:11:58 +04002869}
2870
Josh Poimboeuf7c23b332017-02-13 19:42:41 -06002871#ifdef CONFIG_LIVEPATCH
2872static int proc_pid_patch_state(struct seq_file *m, struct pid_namespace *ns,
2873 struct pid *pid, struct task_struct *task)
2874{
2875 seq_printf(m, "%d\n", task->patch_state);
2876 return 0;
2877}
2878#endif /* CONFIG_LIVEPATCH */
2879
/*
 * Thread groups
 */
/*
 * Forward declarations: the "task" entry of tgid_base_stuff below refers
 * to both objects before their definitions appear.
 */
static const struct file_operations proc_task_operations;
static const struct inode_operations proc_task_inode_operations;
Eric W. Biederman20cdc892006-10-02 02:17:07 -07002885
/*
 * Table of entries served by proc_tgid_base_lookup() and
 * proc_tgid_base_readdir().
 *
 * proc_pident_readdir() walks the table by index, so the order here is the
 * order in which entries are listed. Entries inside an #if/#ifdef exist
 * only when the corresponding config option is enabled.
 */
static const struct pid_entry tgid_base_stuff[] = {
	DIR("task",       S_IRUGO|S_IXUGO, proc_task_inode_operations, proc_task_operations),
	DIR("fd",         S_IRUSR|S_IXUSR, proc_fd_inode_operations, proc_fd_operations),
	DIR("map_files",  S_IRUSR|S_IXUSR, proc_map_files_inode_operations, proc_map_files_operations),
	DIR("fdinfo",     S_IRUSR|S_IXUSR, proc_fdinfo_inode_operations, proc_fdinfo_operations),
	DIR("ns",	  S_IRUSR|S_IXUGO, proc_ns_dir_inode_operations, proc_ns_dir_operations),
#ifdef CONFIG_NET
	DIR("net",        S_IRUGO|S_IXUGO, proc_net_inode_operations, proc_net_operations),
#endif
	REG("environ",    S_IRUSR, proc_environ_operations),
	REG("auxv",       S_IRUSR, proc_auxv_operations),
	ONE("status",     S_IRUGO, proc_pid_status),
	ONE("personality", S_IRUSR, proc_pid_personality),
	ONE("limits",	  S_IRUGO, proc_pid_limits),
#ifdef CONFIG_SCHED_DEBUG
	REG("sched",      S_IRUGO|S_IWUSR, proc_pid_sched_operations),
#endif
#ifdef CONFIG_SCHED_AUTOGROUP
	REG("autogroup",  S_IRUGO|S_IWUSR, proc_pid_sched_autogroup_operations),
#endif
	REG("comm",      S_IRUGO|S_IWUSR, proc_pid_set_comm_operations),
#ifdef CONFIG_HAVE_ARCH_TRACEHOOK
	ONE("syscall",    S_IRUSR, proc_pid_syscall),
#endif
	REG("cmdline",    S_IRUGO, proc_pid_cmdline_ops),
	ONE("stat",       S_IRUGO, proc_tgid_stat),
	ONE("statm",      S_IRUGO, proc_pid_statm),
	REG("maps",       S_IRUGO, proc_pid_maps_operations),
#ifdef CONFIG_NUMA
	REG("numa_maps",  S_IRUGO, proc_pid_numa_maps_operations),
#endif
	REG("mem",        S_IRUSR|S_IWUSR, proc_mem_operations),
	LNK("cwd",        proc_cwd_link),
	LNK("root",       proc_root_link),
	LNK("exe",        proc_exe_link),
	REG("mounts",     S_IRUGO, proc_mounts_operations),
	REG("mountinfo",  S_IRUGO, proc_mountinfo_operations),
	REG("mountstats", S_IRUSR, proc_mountstats_operations),
#ifdef CONFIG_PROC_PAGE_MONITOR
	REG("clear_refs", S_IWUSR, proc_clear_refs_operations),
	REG("smaps",      S_IRUGO, proc_pid_smaps_operations),
	REG("smaps_rollup", S_IRUGO, proc_pid_smaps_rollup_operations),
	REG("pagemap",    S_IRUSR, proc_pagemap_operations),
#endif
#ifdef CONFIG_SECURITY
	DIR("attr",       S_IRUGO|S_IXUGO, proc_attr_dir_inode_operations, proc_attr_dir_operations),
#endif
#ifdef CONFIG_KALLSYMS
	ONE("wchan",      S_IRUGO, proc_pid_wchan),
#endif
#ifdef CONFIG_STACKTRACE
	ONE("stack",      S_IRUSR, proc_pid_stack),
#endif
#ifdef CONFIG_SCHED_INFO
	ONE("schedstat",  S_IRUGO, proc_pid_schedstat),
#endif
#ifdef CONFIG_LATENCYTOP
	REG("latency",  S_IRUGO, proc_lstats_operations),
#endif
#ifdef CONFIG_PROC_PID_CPUSET
	ONE("cpuset",     S_IRUGO, proc_cpuset_show),
#endif
#ifdef CONFIG_CGROUPS
	ONE("cgroup",  S_IRUGO, proc_cgroup_show),
#endif
	ONE("oom_score",  S_IRUGO, proc_oom_score),
	REG("oom_adj",    S_IRUGO|S_IWUSR, proc_oom_adj_operations),
	REG("oom_score_adj", S_IRUGO|S_IWUSR, proc_oom_score_adj_operations),
#ifdef CONFIG_AUDITSYSCALL
	REG("loginuid",   S_IWUSR|S_IRUGO, proc_loginuid_operations),
	REG("sessionid",  S_IRUGO, proc_sessionid_operations),
#endif
#ifdef CONFIG_FAULT_INJECTION
	REG("make-it-fail", S_IRUGO|S_IWUSR, proc_fault_inject_operations),
	REG("fail-nth", 0644, proc_fail_nth_operations),
#endif
#ifdef CONFIG_ELF_CORE
	REG("coredump_filter", S_IRUGO|S_IWUSR, proc_coredump_filter_operations),
#endif
#ifdef CONFIG_TASK_IO_ACCOUNTING
	ONE("io",	S_IRUSR, proc_tgid_io_accounting),
#endif
#ifdef CONFIG_USER_NS
	REG("uid_map",    S_IRUGO|S_IWUSR, proc_uid_map_operations),
	REG("gid_map",    S_IRUGO|S_IWUSR, proc_gid_map_operations),
	REG("projid_map", S_IRUGO|S_IWUSR, proc_projid_map_operations),
	REG("setgroups",  S_IRUGO|S_IWUSR, proc_setgroups_operations),
#endif
#if defined(CONFIG_CHECKPOINT_RESTORE) && defined(CONFIG_POSIX_TIMERS)
	REG("timers",	  S_IRUGO, proc_timers_operations),
#endif
	/* World-writable mode; the write handler itself checks permissions. */
	REG("timerslack_ns", S_IRUGO|S_IWUGO, proc_pid_set_timerslack_ns_operations),
#ifdef CONFIG_LIVEPATCH
	ONE("patch_state",  S_IRUSR, proc_pid_patch_state),
#endif
};
2982
Al Virof0c3b502013-05-16 12:07:31 -04002983static int proc_tgid_base_readdir(struct file *file, struct dir_context *ctx)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002984{
Al Virof0c3b502013-05-16 12:07:31 -04002985 return proc_pident_readdir(file, ctx,
2986 tgid_base_stuff, ARRAY_SIZE(tgid_base_stuff));
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002987}
2988
Arjan van de Ven00977a52007-02-12 00:55:34 -08002989static const struct file_operations proc_tgid_base_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002990 .read = generic_read_dir,
Al Virof50752e2016-04-20 17:13:54 -04002991 .iterate_shared = proc_tgid_base_readdir,
2992 .llseek = generic_file_llseek,
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002993};
2994
Al Viro00cd8dd2012-06-10 17:13:09 -04002995static struct dentry *proc_tgid_base_lookup(struct inode *dir, struct dentry *dentry, unsigned int flags)
2996{
Eric W. Biederman7bcd6b02006-10-02 02:18:56 -07002997 return proc_pident_lookup(dir, dentry,
2998 tgid_base_stuff, ARRAY_SIZE(tgid_base_stuff));
Eric W. Biederman28a6d672006-10-02 02:17:05 -07002999}
3000
Arjan van de Venc5ef1c42007-02-12 00:55:40 -08003001static const struct inode_operations proc_tgid_base_inode_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003002 .lookup = proc_tgid_base_lookup,
3003 .getattr = pid_getattr,
3004 .setattr = proc_setattr,
Vasiliy Kulikov04996802012-01-10 15:11:31 -08003005 .permission = proc_pid_permission,
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003006};
3007
Pavel Emelyanov60347f62007-10-18 23:40:03 -07003008static void proc_flush_task_mnt(struct vfsmount *mnt, pid_t pid, pid_t tgid)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003009{
Eric W. Biederman48e64842006-06-26 00:25:48 -07003010 struct dentry *dentry, *leader, *dir;
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003011 char buf[10 + 1];
Eric W. Biederman48e64842006-06-26 00:25:48 -07003012 struct qstr name;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003013
Eric W. Biederman48e64842006-06-26 00:25:48 -07003014 name.name = buf;
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003015 name.len = snprintf(buf, sizeof(buf), "%u", pid);
Al Viro4f522a22013-02-11 23:20:37 -05003016 /* no ->d_hash() rejects on procfs */
Pavel Emelyanov60347f62007-10-18 23:40:03 -07003017 dentry = d_hash_and_lookup(mnt->mnt_root, &name);
Eric W. Biederman48e64842006-06-26 00:25:48 -07003018 if (dentry) {
Eric W. Biedermanbbd51922014-02-13 10:24:23 -08003019 d_invalidate(dentry);
Eric W. Biederman48e64842006-06-26 00:25:48 -07003020 dput(dentry);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003021 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07003022
Oleg Nesterovc35a7f12014-12-10 15:54:56 -08003023 if (pid == tgid)
3024 return;
3025
Eric W. Biederman48e64842006-06-26 00:25:48 -07003026 name.name = buf;
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003027 name.len = snprintf(buf, sizeof(buf), "%u", tgid);
Pavel Emelyanov60347f62007-10-18 23:40:03 -07003028 leader = d_hash_and_lookup(mnt->mnt_root, &name);
Eric W. Biederman48e64842006-06-26 00:25:48 -07003029 if (!leader)
3030 goto out;
3031
3032 name.name = "task";
3033 name.len = strlen(name.name);
3034 dir = d_hash_and_lookup(leader, &name);
3035 if (!dir)
3036 goto out_put_leader;
3037
3038 name.name = buf;
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003039 name.len = snprintf(buf, sizeof(buf), "%u", pid);
Eric W. Biederman48e64842006-06-26 00:25:48 -07003040 dentry = d_hash_and_lookup(dir, &name);
3041 if (dentry) {
Eric W. Biedermanbbd51922014-02-13 10:24:23 -08003042 d_invalidate(dentry);
Eric W. Biederman48e64842006-06-26 00:25:48 -07003043 dput(dentry);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003044 }
Eric W. Biederman48e64842006-06-26 00:25:48 -07003045
3046 dput(dir);
3047out_put_leader:
3048 dput(leader);
3049out:
3050 return;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003051}
3052
Randy Dunlap0895e912007-10-21 21:00:10 -07003053/**
3054 * proc_flush_task - Remove dcache entries for @task from the /proc dcache.
3055 * @task: task that should be flushed.
3056 *
3057 * When flushing dentries from proc, one needs to flush them from global
Pavel Emelyanov60347f62007-10-18 23:40:03 -07003058 * proc (proc_mnt) and from all the namespaces' procs this task was seen
Randy Dunlap0895e912007-10-21 21:00:10 -07003059 * in. This call is supposed to do all of this job.
3060 *
3061 * Looks in the dcache for
3062 * /proc/@pid
3063 * /proc/@tgid/task/@pid
3064 * if either directory is present flushes it and all of it'ts children
3065 * from the dcache.
3066 *
3067 * It is safe and reasonable to cache /proc entries for a task until
3068 * that task exits. After that they just clog up the dcache with
3069 * useless entries, possibly causing useful dcache entries to be
3070 * flushed instead. This routine is proved to flush those useless
3071 * dcache entries at process exit time.
3072 *
3073 * NOTE: This routine is just an optimization so it does not guarantee
3074 * that no dcache entries will exist at process exit time it
3075 * just makes it very unlikely that any will persist.
Pavel Emelyanov60347f62007-10-18 23:40:03 -07003076 */
3077
3078void proc_flush_task(struct task_struct *task)
3079{
Eric W. Biederman9fcc2d12007-11-14 17:00:07 -08003080 int i;
Oleg Nesterov9b4d1cbe2009-09-22 16:45:34 -07003081 struct pid *pid, *tgid;
Pavel Emelyanov130f77e2007-10-18 23:40:11 -07003082 struct upid *upid;
3083
Pavel Emelyanov130f77e2007-10-18 23:40:11 -07003084 pid = task_pid(task);
Oleg Nesterov9b4d1cbe2009-09-22 16:45:34 -07003085 tgid = task_tgid(task);
Pavel Emelyanov130f77e2007-10-18 23:40:11 -07003086
Eric W. Biederman9fcc2d12007-11-14 17:00:07 -08003087 for (i = 0; i <= pid->level; i++) {
Pavel Emelyanov130f77e2007-10-18 23:40:11 -07003088 upid = &pid->numbers[i];
3089 proc_flush_task_mnt(upid->ns->proc_mnt, upid->nr,
Oleg Nesterov9b4d1cbe2009-09-22 16:45:34 -07003090 tgid->numbers[i].nr);
Pavel Emelyanov130f77e2007-10-18 23:40:11 -07003091 }
Pavel Emelyanov60347f62007-10-18 23:40:03 -07003092}
3093
Al Viro0168b9e2018-05-03 09:21:05 -04003094static struct dentry *proc_pid_instantiate(struct dentry * dentry,
Al Viroc52a47a2013-06-15 11:15:20 +04003095 struct task_struct *task, const void *ptr)
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003096{
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003097 struct inode *inode;
3098
Al Viro0168b9e2018-05-03 09:21:05 -04003099 inode = proc_pid_make_inode(dentry->d_sb, task, S_IFDIR | S_IRUGO | S_IXUGO);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003100 if (!inode)
Al Viro0168b9e2018-05-03 09:21:05 -04003101 return ERR_PTR(-ENOENT);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003102
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003103 inode->i_op = &proc_tgid_base_inode_operations;
3104 inode->i_fop = &proc_tgid_base_operations;
3105 inode->i_flags|=S_IMMUTABLE;
Vegard Nossumaed54172008-06-05 22:46:53 -07003106
Alexey Dobriyan1270dd82016-12-12 16:45:32 -08003107 set_nlink(inode, nlink_tgid);
Al Viro1bbc5512018-05-02 21:26:16 -04003108 pid_update_inode(task, inode);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003109
Nick Pigginfb045ad2011-01-07 17:49:55 +11003110 d_set_d_op(dentry, &pid_dentry_operations);
Al Viro0168b9e2018-05-03 09:21:05 -04003111 return d_splice_alias(inode, dentry);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003112}
3113
Al Viro00cd8dd2012-06-10 17:13:09 -04003114struct dentry *proc_pid_lookup(struct inode *dir, struct dentry * dentry, unsigned int flags)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003115{
3116 struct task_struct *task;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003117 unsigned tgid;
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003118 struct pid_namespace *ns;
Al Viro0168b9e2018-05-03 09:21:05 -04003119 struct dentry *result = ERR_PTR(-ENOENT);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003120
Alexey Dobriyandbcdb502014-08-08 14:21:25 -07003121 tgid = name_to_int(&dentry->d_name);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003122 if (tgid == ~0U)
3123 goto out;
3124
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003125 ns = dentry->d_sb->s_fs_info;
Eric W. Biedermande758732006-06-26 00:25:51 -07003126 rcu_read_lock();
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003127 task = find_task_by_pid_ns(tgid, ns);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003128 if (task)
3129 get_task_struct(task);
Eric W. Biedermande758732006-06-26 00:25:51 -07003130 rcu_read_unlock();
Linus Torvalds1da177e2005-04-16 15:20:36 -07003131 if (!task)
3132 goto out;
3133
Al Viro0168b9e2018-05-03 09:21:05 -04003134 result = proc_pid_instantiate(dentry, task, NULL);
Eric W. Biederman48e64842006-06-26 00:25:48 -07003135 put_task_struct(task);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003136out:
Al Viro0168b9e2018-05-03 09:21:05 -04003137 return result;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003138}
3139
Linus Torvalds1da177e2005-04-16 15:20:36 -07003140/*
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003141 * Find the first task with tgid >= tgid
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003142 *
Linus Torvalds1da177e2005-04-16 15:20:36 -07003143 */
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003144struct tgid_iter {
3145 unsigned int tgid;
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003146 struct task_struct *task;
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003147};
3148static struct tgid_iter next_tgid(struct pid_namespace *ns, struct tgid_iter iter)
3149{
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003150 struct pid *pid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003151
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003152 if (iter.task)
3153 put_task_struct(iter.task);
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003154 rcu_read_lock();
3155retry:
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003156 iter.task = NULL;
3157 pid = find_ge_pid(iter.tgid, ns);
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003158 if (pid) {
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003159 iter.tgid = pid_nr_ns(pid, ns);
3160 iter.task = pid_task(pid, PIDTYPE_PID);
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003161 /* What we to know is if the pid we have find is the
3162 * pid of a thread_group_leader. Testing for task
3163 * being a thread_group_leader is the obvious thing
3164 * todo but there is a window when it fails, due to
3165 * the pid transfer logic in de_thread.
3166 *
3167 * So we perform the straight forward test of seeing
3168 * if the pid we have found is the pid of a thread
3169 * group leader, and don't worry if the task we have
3170 * found doesn't happen to be a thread group leader.
3171 * As we don't care in the case of readdir.
3172 */
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003173 if (!iter.task || !has_group_leader_pid(iter.task)) {
3174 iter.tgid += 1;
Eric W. Biederman0804ef42006-10-02 02:17:04 -07003175 goto retry;
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003176 }
3177 get_task_struct(iter.task);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003178 }
Eric W. Biederman454cc102006-06-26 00:25:51 -07003179 rcu_read_unlock();
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003180 return iter;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003181}
3182
Eric W. Biederman00978752014-07-31 03:10:50 -07003183#define TGID_OFFSET (FIRST_PROCESS_ENTRY + 2)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003184
3185/* for the /proc/ directory itself, after non-process stuff has been done */
Al Virof0c3b502013-05-16 12:07:31 -04003186int proc_pid_readdir(struct file *file, struct dir_context *ctx)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003187{
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003188 struct tgid_iter iter;
Christoph Hellwig76f668b2018-05-16 07:19:01 +02003189 struct pid_namespace *ns = proc_pid_ns(file_inode(file));
Al Virof0c3b502013-05-16 12:07:31 -04003190 loff_t pos = ctx->pos;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003191
Al Viro021ada72013-03-29 19:27:05 -04003192 if (pos >= PID_MAX_LIMIT + TGID_OFFSET)
Al Virof0c3b502013-05-16 12:07:31 -04003193 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003194
Eric W. Biederman00978752014-07-31 03:10:50 -07003195 if (pos == TGID_OFFSET - 2) {
David Howells2b0143b2015-03-17 22:25:59 +00003196 struct inode *inode = d_inode(ns->proc_self);
Al Virodb963162013-06-15 10:45:10 +04003197 if (!dir_emit(ctx, "self", 4, inode->i_ino, DT_LNK))
Al Virof0c3b502013-05-16 12:07:31 -04003198 return 0;
Eric W. Biederman00978752014-07-31 03:10:50 -07003199 ctx->pos = pos = pos + 1;
Al Viro021ada72013-03-29 19:27:05 -04003200 }
Eric W. Biederman00978752014-07-31 03:10:50 -07003201 if (pos == TGID_OFFSET - 1) {
David Howells2b0143b2015-03-17 22:25:59 +00003202 struct inode *inode = d_inode(ns->proc_thread_self);
Eric W. Biederman00978752014-07-31 03:10:50 -07003203 if (!dir_emit(ctx, "thread-self", 11, inode->i_ino, DT_LNK))
3204 return 0;
3205 ctx->pos = pos = pos + 1;
3206 }
3207 iter.tgid = pos - TGID_OFFSET;
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003208 iter.task = NULL;
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003209 for (iter = next_tgid(ns, iter);
3210 iter.task;
3211 iter.tgid += 1, iter = next_tgid(ns, iter)) {
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003212 char name[10 + 1];
Alexey Dobriyana4ef3892018-06-07 17:10:10 -07003213 unsigned int len;
Eric Dumazet3ba4bce2017-01-24 15:18:07 -08003214
3215 cond_resched();
Lafcadio Wluiki796f5712017-02-24 15:00:23 -08003216 if (!has_pid_permissions(ns, iter.task, HIDEPID_INVISIBLE))
Al Virof0c3b502013-05-16 12:07:31 -04003217 continue;
Vasiliy Kulikov04996802012-01-10 15:11:31 -08003218
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003219 len = snprintf(name, sizeof(name), "%u", iter.tgid);
Al Virof0c3b502013-05-16 12:07:31 -04003220 ctx->pos = iter.tgid + TGID_OFFSET;
3221 if (!proc_fill_cache(file, ctx, name, len,
3222 proc_pid_instantiate, iter.task, NULL)) {
Eric W. Biederman19fd4bb2007-11-28 16:21:26 -08003223 put_task_struct(iter.task);
Al Virof0c3b502013-05-16 12:07:31 -04003224 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003225 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07003226 }
Al Virof0c3b502013-05-16 12:07:31 -04003227 ctx->pos = PID_MAX_LIMIT + TGID_OFFSET;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003228 return 0;
3229}
3230
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003231/*
Janis Danisevskis1b3044e2016-05-20 17:00:08 -07003232 * proc_tid_comm_permission is a special permission function exclusively
3233 * used for the node /proc/<pid>/task/<tid>/comm.
3234 * It bypasses generic permission checks in the case where a task of the same
3235 * task group attempts to access the node.
3236 * The rationale behind this is that glibc and bionic access this node for
3237 * cross thread naming (pthread_set/getname_np(!self)). However, if
3238 * PR_SET_DUMPABLE gets set to 0 this node among others becomes uid=0 gid=0,
3239 * which locks out the cross thread naming implementation.
3240 * This function makes sure that the node is always accessible for members of
3241 * same thread group.
3242 */
3243static int proc_tid_comm_permission(struct inode *inode, int mask)
3244{
3245 bool is_same_tgroup;
3246 struct task_struct *task;
3247
3248 task = get_proc_task(inode);
3249 if (!task)
3250 return -ESRCH;
3251 is_same_tgroup = same_thread_group(current, task);
3252 put_task_struct(task);
3253
3254 if (likely(is_same_tgroup && !(mask & MAY_EXEC))) {
3255 /* This file (/proc/<pid>/task/<tid>/comm) can always be
3256 * read or written by the members of the corresponding
3257 * thread group.
3258 */
3259 return 0;
3260 }
3261
3262 return generic_permission(inode, mask);
3263}
3264
3265static const struct inode_operations proc_tid_comm_inode_operations = {
3266 .permission = proc_tid_comm_permission,
3267};
3268
/*
 * Tasks
 *
 * Table of the entries found in a per-thread directory
 * (/proc/<pid>/task/<tid>/).  It is consumed by proc_tid_base_readdir()
 * and proc_tid_base_lookup().  Entries guarded by #ifdef exist only when
 * the corresponding kernel option is enabled.
 */
static const struct pid_entry tid_base_stuff[] = {
	DIR("fd", S_IRUSR|S_IXUSR, proc_fd_inode_operations, proc_fd_operations),
	DIR("fdinfo", S_IRUSR|S_IXUSR, proc_fdinfo_inode_operations, proc_fdinfo_operations),
	DIR("ns", S_IRUSR|S_IXUGO, proc_ns_dir_inode_operations, proc_ns_dir_operations),
#ifdef CONFIG_NET
	DIR("net", S_IRUGO|S_IXUGO, proc_net_inode_operations, proc_net_operations),
#endif
	REG("environ", S_IRUSR, proc_environ_operations),
	REG("auxv", S_IRUSR, proc_auxv_operations),
	ONE("status", S_IRUGO, proc_pid_status),
	ONE("personality", S_IRUSR, proc_pid_personality),
	ONE("limits", S_IRUGO, proc_pid_limits),
#ifdef CONFIG_SCHED_DEBUG
	REG("sched", S_IRUGO|S_IWUSR, proc_pid_sched_operations),
#endif
	/* "comm" carries its own inode operations for the permission check. */
	NOD("comm", S_IFREG|S_IRUGO|S_IWUSR,
	    &proc_tid_comm_inode_operations,
	    &proc_pid_set_comm_operations, {}),
#ifdef CONFIG_HAVE_ARCH_TRACEHOOK
	ONE("syscall", S_IRUSR, proc_pid_syscall),
#endif
	REG("cmdline", S_IRUGO, proc_pid_cmdline_ops),
	ONE("stat", S_IRUGO, proc_tid_stat),
	ONE("statm", S_IRUGO, proc_pid_statm),
	REG("maps", S_IRUGO, proc_tid_maps_operations),
#ifdef CONFIG_PROC_CHILDREN
	REG("children", S_IRUGO, proc_tid_children_operations),
#endif
#ifdef CONFIG_NUMA
	REG("numa_maps", S_IRUGO, proc_tid_numa_maps_operations),
#endif
	REG("mem", S_IRUSR|S_IWUSR, proc_mem_operations),
	LNK("cwd", proc_cwd_link),
	LNK("root", proc_root_link),
	LNK("exe", proc_exe_link),
	REG("mounts", S_IRUGO, proc_mounts_operations),
	REG("mountinfo", S_IRUGO, proc_mountinfo_operations),
#ifdef CONFIG_PROC_PAGE_MONITOR
	REG("clear_refs", S_IWUSR, proc_clear_refs_operations),
	REG("smaps", S_IRUGO, proc_tid_smaps_operations),
	REG("smaps_rollup", S_IRUGO, proc_pid_smaps_rollup_operations),
	REG("pagemap", S_IRUSR, proc_pagemap_operations),
#endif
#ifdef CONFIG_SECURITY
	DIR("attr", S_IRUGO|S_IXUGO, proc_attr_dir_inode_operations, proc_attr_dir_operations),
#endif
#ifdef CONFIG_KALLSYMS
	ONE("wchan", S_IRUGO, proc_pid_wchan),
#endif
#ifdef CONFIG_STACKTRACE
	ONE("stack", S_IRUSR, proc_pid_stack),
#endif
#ifdef CONFIG_SCHED_INFO
	ONE("schedstat", S_IRUGO, proc_pid_schedstat),
#endif
#ifdef CONFIG_LATENCYTOP
	REG("latency", S_IRUGO, proc_lstats_operations),
#endif
#ifdef CONFIG_PROC_PID_CPUSET
	ONE("cpuset", S_IRUGO, proc_cpuset_show),
#endif
#ifdef CONFIG_CGROUPS
	ONE("cgroup", S_IRUGO, proc_cgroup_show),
#endif
	ONE("oom_score", S_IRUGO, proc_oom_score),
	REG("oom_adj", S_IRUGO|S_IWUSR, proc_oom_adj_operations),
	REG("oom_score_adj", S_IRUGO|S_IWUSR, proc_oom_score_adj_operations),
#ifdef CONFIG_AUDITSYSCALL
	REG("loginuid", S_IWUSR|S_IRUGO, proc_loginuid_operations),
	REG("sessionid", S_IRUGO, proc_sessionid_operations),
#endif
#ifdef CONFIG_FAULT_INJECTION
	REG("make-it-fail", S_IRUGO|S_IWUSR, proc_fault_inject_operations),
	REG("fail-nth", 0644, proc_fail_nth_operations),
#endif
#ifdef CONFIG_TASK_IO_ACCOUNTING
	ONE("io", S_IRUSR, proc_tid_io_accounting),
#endif
#ifdef CONFIG_USER_NS
	REG("uid_map", S_IRUGO|S_IWUSR, proc_uid_map_operations),
	REG("gid_map", S_IRUGO|S_IWUSR, proc_gid_map_operations),
	REG("projid_map", S_IRUGO|S_IWUSR, proc_projid_map_operations),
	REG("setgroups", S_IRUGO|S_IWUSR, proc_setgroups_operations),
#endif
#ifdef CONFIG_LIVEPATCH
	ONE("patch_state", S_IRUSR, proc_pid_patch_state),
#endif
};
3360
Al Virof0c3b502013-05-16 12:07:31 -04003361static int proc_tid_base_readdir(struct file *file, struct dir_context *ctx)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003362{
Al Virof0c3b502013-05-16 12:07:31 -04003363 return proc_pident_readdir(file, ctx,
3364 tid_base_stuff, ARRAY_SIZE(tid_base_stuff));
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003365}
3366
Al Viro00cd8dd2012-06-10 17:13:09 -04003367static struct dentry *proc_tid_base_lookup(struct inode *dir, struct dentry *dentry, unsigned int flags)
3368{
Eric W. Biederman7bcd6b02006-10-02 02:18:56 -07003369 return proc_pident_lookup(dir, dentry,
3370 tid_base_stuff, ARRAY_SIZE(tid_base_stuff));
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003371}
3372
Arjan van de Ven00977a52007-02-12 00:55:34 -08003373static const struct file_operations proc_tid_base_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003374 .read = generic_read_dir,
Al Virof50752e2016-04-20 17:13:54 -04003375 .iterate_shared = proc_tid_base_readdir,
3376 .llseek = generic_file_llseek,
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003377};
3378
Arjan van de Venc5ef1c42007-02-12 00:55:40 -08003379static const struct inode_operations proc_tid_base_inode_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003380 .lookup = proc_tid_base_lookup,
3381 .getattr = pid_getattr,
3382 .setattr = proc_setattr,
3383};
3384
Al Viro0168b9e2018-05-03 09:21:05 -04003385static struct dentry *proc_task_instantiate(struct dentry *dentry,
3386 struct task_struct *task, const void *ptr)
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003387{
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003388 struct inode *inode;
Al Viro0168b9e2018-05-03 09:21:05 -04003389 inode = proc_pid_make_inode(dentry->d_sb, task, S_IFDIR | S_IRUGO | S_IXUGO);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003390 if (!inode)
Al Viro0168b9e2018-05-03 09:21:05 -04003391 return ERR_PTR(-ENOENT);
Al Viro1bbc5512018-05-02 21:26:16 -04003392
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003393 inode->i_op = &proc_tid_base_inode_operations;
3394 inode->i_fop = &proc_tid_base_operations;
Al Viro1bbc5512018-05-02 21:26:16 -04003395 inode->i_flags |= S_IMMUTABLE;
Vegard Nossumaed54172008-06-05 22:46:53 -07003396
Alexey Dobriyan1270dd82016-12-12 16:45:32 -08003397 set_nlink(inode, nlink_tid);
Al Viro1bbc5512018-05-02 21:26:16 -04003398 pid_update_inode(task, inode);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003399
Nick Pigginfb045ad2011-01-07 17:49:55 +11003400 d_set_d_op(dentry, &pid_dentry_operations);
Al Viro0168b9e2018-05-03 09:21:05 -04003401 return d_splice_alias(inode, dentry);
Eric W. Biederman444ceed2006-10-02 02:18:49 -07003402}
3403
Al Viro00cd8dd2012-06-10 17:13:09 -04003404static struct dentry *proc_task_lookup(struct inode *dir, struct dentry * dentry, unsigned int flags)
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003405{
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003406 struct task_struct *task;
3407 struct task_struct *leader = get_proc_task(dir);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003408 unsigned tid;
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003409 struct pid_namespace *ns;
Al Viro0168b9e2018-05-03 09:21:05 -04003410 struct dentry *result = ERR_PTR(-ENOENT);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003411
3412 if (!leader)
3413 goto out_no_task;
3414
Alexey Dobriyandbcdb502014-08-08 14:21:25 -07003415 tid = name_to_int(&dentry->d_name);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003416 if (tid == ~0U)
3417 goto out;
3418
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003419 ns = dentry->d_sb->s_fs_info;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003420 rcu_read_lock();
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003421 task = find_task_by_pid_ns(tid, ns);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003422 if (task)
3423 get_task_struct(task);
3424 rcu_read_unlock();
3425 if (!task)
3426 goto out;
Pavel Emelyanovbac0abd2007-10-18 23:40:18 -07003427 if (!same_thread_group(leader, task))
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003428 goto out_drop_task;
3429
Al Viro0168b9e2018-05-03 09:21:05 -04003430 result = proc_task_instantiate(dentry, task, NULL);
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003431out_drop_task:
3432 put_task_struct(task);
3433out:
3434 put_task_struct(leader);
3435out_no_task:
Al Viro0168b9e2018-05-03 09:21:05 -04003436 return result;
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003437}
3438
3439/*
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003440 * Find the first tid of a thread group to return to user space.
3441 *
3442 * Usually this is just the thread group leader, but if the users
3443 * buffer was too small or there was a seek into the middle of the
3444 * directory we have more work todo.
3445 *
3446 * In the case of a short read we start with find_task_by_pid.
3447 *
3448 * In the case of a seek we start with the leader and walk nr
3449 * threads past it.
3450 */
Oleg Nesterov9f6e9632014-01-23 15:55:40 -08003451static struct task_struct *first_tid(struct pid *pid, int tid, loff_t f_pos,
3452 struct pid_namespace *ns)
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003453{
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003454 struct task_struct *pos, *task;
Oleg Nesterov9f6e9632014-01-23 15:55:40 -08003455 unsigned long nr = f_pos;
3456
3457 if (nr != f_pos) /* 32bit overflow? */
3458 return NULL;
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003459
Eric W. Biedermancc288732006-06-26 00:26:01 -07003460 rcu_read_lock();
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003461 task = pid_task(pid, PIDTYPE_PID);
3462 if (!task)
3463 goto fail;
3464
3465 /* Attempt to start with the tid of a thread */
Oleg Nesterov9f6e9632014-01-23 15:55:40 -08003466 if (tid && nr) {
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003467 pos = find_task_by_pid_ns(tid, ns);
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003468 if (pos && same_thread_group(pos, task))
Oleg Nesterova872ff02006-06-26 00:26:01 -07003469 goto found;
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003470 }
3471
3472 /* If nr exceeds the number of threads there is nothing todo */
Oleg Nesterov9f6e9632014-01-23 15:55:40 -08003473 if (nr >= get_nr_threads(task))
Oleg Nesterovc986c142014-01-23 15:55:38 -08003474 goto fail;
Oleg Nesterova872ff02006-06-26 00:26:01 -07003475
3476 /* If we haven't found our starting place yet start
3477 * with the leader and walk nr threads forward.
3478 */
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003479 pos = task = task->group_leader;
Oleg Nesterovc986c142014-01-23 15:55:38 -08003480 do {
Oleg Nesterov9f6e9632014-01-23 15:55:40 -08003481 if (!nr--)
Oleg Nesterovc986c142014-01-23 15:55:38 -08003482 goto found;
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003483 } while_each_thread(task, pos);
Oleg Nesterovc986c142014-01-23 15:55:38 -08003484fail:
3485 pos = NULL;
3486 goto out;
Oleg Nesterova872ff02006-06-26 00:26:01 -07003487found:
3488 get_task_struct(pos);
3489out:
Eric W. Biedermancc288732006-06-26 00:26:01 -07003490 rcu_read_unlock();
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003491 return pos;
3492}
3493
3494/*
3495 * Find the next thread in the thread list.
3496 * Return NULL if there is an error or no next thread.
3497 *
3498 * The reference to the input task_struct is released.
3499 */
3500static struct task_struct *next_tid(struct task_struct *start)
3501{
Oleg Nesterovc1df7fb2006-06-26 00:26:02 -07003502 struct task_struct *pos = NULL;
Eric W. Biedermancc288732006-06-26 00:26:01 -07003503 rcu_read_lock();
Oleg Nesterovc1df7fb2006-06-26 00:26:02 -07003504 if (pid_alive(start)) {
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003505 pos = next_thread(start);
Oleg Nesterovc1df7fb2006-06-26 00:26:02 -07003506 if (thread_group_leader(pos))
3507 pos = NULL;
3508 else
3509 get_task_struct(pos);
3510 }
Eric W. Biedermancc288732006-06-26 00:26:01 -07003511 rcu_read_unlock();
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003512 put_task_struct(start);
3513 return pos;
3514}
3515
Linus Torvalds1da177e2005-04-16 15:20:36 -07003516/* for the /proc/TGID/task/ directories */
Al Virof0c3b502013-05-16 12:07:31 -04003517static int proc_task_readdir(struct file *file, struct dir_context *ctx)
Linus Torvalds1da177e2005-04-16 15:20:36 -07003518{
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003519 struct inode *inode = file_inode(file);
3520 struct task_struct *task;
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003521 struct pid_namespace *ns;
Al Virof0c3b502013-05-16 12:07:31 -04003522 int tid;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003523
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003524 if (proc_inode_is_dead(inode))
Al Virof0c3b502013-05-16 12:07:31 -04003525 return -ENOENT;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003526
Al Virof0c3b502013-05-16 12:07:31 -04003527 if (!dir_emit_dots(file, ctx))
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003528 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003529
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003530 /* f_version caches the tgid value that the last readdir call couldn't
3531 * return. lseek aka telldir automagically resets f_version to 0.
3532 */
Christoph Hellwig76f668b2018-05-16 07:19:01 +02003533 ns = proc_pid_ns(inode);
Al Virof0c3b502013-05-16 12:07:31 -04003534 tid = (int)file->f_version;
3535 file->f_version = 0;
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003536 for (task = first_tid(proc_pid(inode), tid, ctx->pos - 2, ns);
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003537 task;
Al Virof0c3b502013-05-16 12:07:31 -04003538 task = next_tid(task), ctx->pos++) {
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003539 char name[10 + 1];
Alexey Dobriyana4ef3892018-06-07 17:10:10 -07003540 unsigned int len;
Pavel Emelyanovb4888932007-10-18 23:40:14 -07003541 tid = task_pid_nr_ns(task, ns);
Alexey Dobriyane3912ac2018-02-06 15:36:51 -08003542 len = snprintf(name, sizeof(name), "%u", tid);
Al Virof0c3b502013-05-16 12:07:31 -04003543 if (!proc_fill_cache(file, ctx, name, len,
3544 proc_task_instantiate, task, NULL)) {
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003545 /* returning this tgid failed, save it as the first
3546 * pid for the next readir call */
Al Virof0c3b502013-05-16 12:07:31 -04003547 file->f_version = (u64)tid;
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003548 put_task_struct(task);
Linus Torvalds1da177e2005-04-16 15:20:36 -07003549 break;
Eric W. Biederman0bc58a92006-06-26 00:25:50 -07003550 }
Linus Torvalds1da177e2005-04-16 15:20:36 -07003551 }
Oleg Nesterovd855a4b2014-01-23 15:55:39 -08003552
Al Virof0c3b502013-05-16 12:07:31 -04003553 return 0;
Linus Torvalds1da177e2005-04-16 15:20:36 -07003554}
Eric W. Biederman6e66b522006-06-26 00:25:47 -07003555
David Howellsa528d352017-01-31 16:46:22 +00003556static int proc_task_getattr(const struct path *path, struct kstat *stat,
3557 u32 request_mask, unsigned int query_flags)
Eric W. Biederman6e66b522006-06-26 00:25:47 -07003558{
David Howellsa528d352017-01-31 16:46:22 +00003559 struct inode *inode = d_inode(path->dentry);
Eric W. Biederman99f89552006-06-26 00:25:55 -07003560 struct task_struct *p = get_proc_task(inode);
Eric W. Biederman6e66b522006-06-26 00:25:47 -07003561 generic_fillattr(inode, stat);
3562
Eric W. Biederman99f89552006-06-26 00:25:55 -07003563 if (p) {
Eric W. Biederman99f89552006-06-26 00:25:55 -07003564 stat->nlink += get_nr_threads(p);
Eric W. Biederman99f89552006-06-26 00:25:55 -07003565 put_task_struct(p);
Eric W. Biederman6e66b522006-06-26 00:25:47 -07003566 }
3567
3568 return 0;
3569}
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003570
Arjan van de Venc5ef1c42007-02-12 00:55:40 -08003571static const struct inode_operations proc_task_inode_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003572 .lookup = proc_task_lookup,
3573 .getattr = proc_task_getattr,
3574 .setattr = proc_setattr,
Vasiliy Kulikov04996802012-01-10 15:11:31 -08003575 .permission = proc_pid_permission,
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003576};
3577
Arjan van de Ven00977a52007-02-12 00:55:34 -08003578static const struct file_operations proc_task_operations = {
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003579 .read = generic_read_dir,
Al Virof50752e2016-04-20 17:13:54 -04003580 .iterate_shared = proc_task_readdir,
3581 .llseek = generic_file_llseek,
Eric W. Biederman28a6d672006-10-02 02:17:05 -07003582};
Alexey Dobriyan1270dd82016-12-12 16:45:32 -08003583
3584void __init set_proc_pid_nlink(void)
3585{
3586 nlink_tid = pid_entry_nlink(tid_base_stuff, ARRAY_SIZE(tid_base_stuff));
3587 nlink_tgid = pid_entry_nlink(tgid_base_stuff, ARRAY_SIZE(tgid_base_stuff));
3588}