Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 1 | // SPDX-License-Identifier: GPL-2.0 |
| 2 | /* |
| 3 | * linux/fs/proc/array.c |
| 4 | * |
| 5 | * Copyright (C) 1992 by Linus Torvalds |
| 6 | * based on ideas by Darren Senn |
| 7 | * |
| 8 | * Fixes: |
| 9 | * Michael. K. Johnson: stat,statm extensions. |
| 10 | * <johnsonm@stolaf.edu> |
| 11 | * |
| 12 | * Pauline Middelink : Made cmdline,envline only break at '\0's, to |
| 13 | * make sure SET_PROCTITLE works. Also removed |
| 14 | * bad '!' which forced address recalculation for |
| 15 | * EVERY character on the current page. |
| 16 | * <middelin@polyware.iaf.nl> |
| 17 | * |
| 18 | * Danny ter Haar : added cpuinfo |
| 19 | * <dth@cistron.nl> |
| 20 | * |
| 21 | * Alessandro Rubini : profile extension. |
| 22 | * <rubini@ipvvis.unipv.it> |
| 23 | * |
| 24 | * Jeff Tranter : added BogoMips field to cpuinfo |
| 25 | * <Jeff_Tranter@Mitel.COM> |
| 26 | * |
| 27 | * Bruno Haible : remove 4K limit for the maps file |
| 28 | * <haible@ma2s2.mathematik.uni-karlsruhe.de> |
| 29 | * |
| 30 | * Yves Arrouye : remove removal of trailing spaces in get_array. |
| 31 | * <Yves.Arrouye@marin.fdn.fr> |
| 32 | * |
| 33 | * Jerome Forissier : added per-CPU time information to /proc/stat |
| 34 | * and /proc/<pid>/cpu extension |
| 35 | * <forissier@isia.cma.fr> |
| 36 | * - Incorporation and non-SMP safe operation |
| 37 | * of forissier patch in 2.1.78 by |
| 38 | * Hans Marcus <crowbar@concepts.nl> |
| 39 | * |
| 40 | * aeb@cwi.nl : /proc/partitions |
| 41 | * |
| 42 | * |
| 43 | * Alan Cox : security fixes. |
| 44 | * <alan@lxorguk.ukuu.org.uk> |
| 45 | * |
| 46 | * Al Viro : safe handling of mm_struct |
| 47 | * |
| 48 | * Gerhard Wichert : added BIGMEM support |
| 49 | * Siemens AG <Gerhard.Wichert@pdb.siemens.de> |
| 50 | * |
| 51 | * Al Viro & Jeff Garzik : moved most of the thing into base.c and |
| 52 | * : proc_misc.c. The rest may eventually go into |
| 53 | * : base.c too. |
| 54 | */ |
| 55 | |
| 56 | #include <linux/types.h> |
| 57 | #include <linux/errno.h> |
| 58 | #include <linux/time.h> |
| 59 | #include <linux/kernel.h> |
| 60 | #include <linux/kernel_stat.h> |
| 61 | #include <linux/tty.h> |
| 62 | #include <linux/string.h> |
| 63 | #include <linux/mman.h> |
| 64 | #include <linux/sched/mm.h> |
| 65 | #include <linux/sched/numa_balancing.h> |
| 66 | #include <linux/sched/task_stack.h> |
| 67 | #include <linux/sched/task.h> |
| 68 | #include <linux/sched/cputime.h> |
| 69 | #include <linux/proc_fs.h> |
| 70 | #include <linux/ioport.h> |
| 71 | #include <linux/uaccess.h> |
| 72 | #include <linux/io.h> |
| 73 | #include <linux/mm.h> |
| 74 | #include <linux/hugetlb.h> |
| 75 | #include <linux/pagemap.h> |
| 76 | #include <linux/swap.h> |
| 77 | #include <linux/smp.h> |
| 78 | #include <linux/signal.h> |
| 79 | #include <linux/highmem.h> |
| 80 | #include <linux/file.h> |
| 81 | #include <linux/fdtable.h> |
| 82 | #include <linux/times.h> |
| 83 | #include <linux/cpuset.h> |
| 84 | #include <linux/rcupdate.h> |
| 85 | #include <linux/delayacct.h> |
| 86 | #include <linux/seq_file.h> |
| 87 | #include <linux/pid_namespace.h> |
| 88 | #include <linux/prctl.h> |
| 89 | #include <linux/ptrace.h> |
| 90 | #include <linux/tracehook.h> |
| 91 | #include <linux/string_helpers.h> |
| 92 | #include <linux/user_namespace.h> |
| 93 | #include <linux/fs_struct.h> |
| 94 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 95 | #include <asm/processor.h> |
| 96 | #include "internal.h" |
| 97 | |
| 98 | void proc_task_name(struct seq_file *m, struct task_struct *p, bool escape) |
| 99 | { |
| 100 | char *buf; |
| 101 | size_t size; |
| 102 | char tcomm[64]; |
| 103 | int ret; |
| 104 | |
| 105 | if (p->flags & PF_WQ_WORKER) |
| 106 | wq_worker_comm(tcomm, sizeof(tcomm), p); |
| 107 | else |
| 108 | __get_task_comm(tcomm, sizeof(tcomm), p); |
| 109 | |
| 110 | size = seq_get_buf(m, &buf); |
| 111 | if (escape) { |
| 112 | ret = string_escape_str(tcomm, buf, size, |
| 113 | ESCAPE_SPACE | ESCAPE_SPECIAL, "\n\\"); |
| 114 | if (ret >= size) |
| 115 | ret = -1; |
| 116 | } else { |
| 117 | ret = strscpy(buf, tcomm, size); |
| 118 | } |
| 119 | |
| 120 | seq_commit(m, ret); |
| 121 | } |
| 122 | |
| 123 | /* |
| 124 | * The task state array is a strange "bitmap" of |
| 125 | * reasons to sleep. Thus "running" is zero, and |
| 126 | * you can test for combinations of others with |
| 127 | * simple bit tests. |
| 128 | */ |
| 129 | static const char * const task_state_array[] = { |
| 130 | |
| 131 | /* states in TASK_REPORT: */ |
| 132 | "R (running)", /* 0x00 */ |
| 133 | "S (sleeping)", /* 0x01 */ |
| 134 | "D (disk sleep)", /* 0x02 */ |
| 135 | "T (stopped)", /* 0x04 */ |
| 136 | "t (tracing stop)", /* 0x08 */ |
| 137 | "X (dead)", /* 0x10 */ |
| 138 | "Z (zombie)", /* 0x20 */ |
| 139 | "P (parked)", /* 0x40 */ |
| 140 | |
| 141 | /* states beyond TASK_REPORT: */ |
| 142 | "I (idle)", /* 0x80 */ |
| 143 | }; |
| 144 | |
| 145 | static inline const char *get_task_state(struct task_struct *tsk) |
| 146 | { |
| 147 | BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != ARRAY_SIZE(task_state_array)); |
| 148 | return task_state_array[task_state_index(tsk)]; |
| 149 | } |
| 150 | |
| 151 | static inline void task_state(struct seq_file *m, struct pid_namespace *ns, |
| 152 | struct pid *pid, struct task_struct *p) |
| 153 | { |
| 154 | struct user_namespace *user_ns = seq_user_ns(m); |
| 155 | struct group_info *group_info; |
| 156 | int g, umask = -1; |
| 157 | struct task_struct *tracer; |
| 158 | const struct cred *cred; |
| 159 | pid_t ppid, tpid = 0, tgid, ngid; |
| 160 | unsigned int max_fds = 0; |
| 161 | |
| 162 | rcu_read_lock(); |
| 163 | ppid = pid_alive(p) ? |
| 164 | task_tgid_nr_ns(rcu_dereference(p->real_parent), ns) : 0; |
| 165 | |
| 166 | tracer = ptrace_parent(p); |
| 167 | if (tracer) |
| 168 | tpid = task_pid_nr_ns(tracer, ns); |
| 169 | |
| 170 | tgid = task_tgid_nr_ns(p, ns); |
| 171 | ngid = task_numa_group_id(p); |
| 172 | cred = get_task_cred(p); |
| 173 | |
| 174 | task_lock(p); |
| 175 | if (p->fs) |
| 176 | umask = p->fs->umask; |
| 177 | if (p->files) |
| 178 | max_fds = files_fdtable(p->files)->max_fds; |
| 179 | task_unlock(p); |
| 180 | rcu_read_unlock(); |
| 181 | |
| 182 | if (umask >= 0) |
| 183 | seq_printf(m, "Umask:\t%#04o\n", umask); |
| 184 | seq_puts(m, "State:\t"); |
| 185 | seq_puts(m, get_task_state(p)); |
| 186 | |
| 187 | seq_put_decimal_ull(m, "\nTgid:\t", tgid); |
| 188 | seq_put_decimal_ull(m, "\nNgid:\t", ngid); |
| 189 | seq_put_decimal_ull(m, "\nPid:\t", pid_nr_ns(pid, ns)); |
| 190 | seq_put_decimal_ull(m, "\nPPid:\t", ppid); |
| 191 | seq_put_decimal_ull(m, "\nTracerPid:\t", tpid); |
| 192 | seq_put_decimal_ull(m, "\nUid:\t", from_kuid_munged(user_ns, cred->uid)); |
| 193 | seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->euid)); |
| 194 | seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->suid)); |
| 195 | seq_put_decimal_ull(m, "\t", from_kuid_munged(user_ns, cred->fsuid)); |
| 196 | seq_put_decimal_ull(m, "\nGid:\t", from_kgid_munged(user_ns, cred->gid)); |
| 197 | seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->egid)); |
| 198 | seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->sgid)); |
| 199 | seq_put_decimal_ull(m, "\t", from_kgid_munged(user_ns, cred->fsgid)); |
| 200 | seq_put_decimal_ull(m, "\nFDSize:\t", max_fds); |
| 201 | |
| 202 | seq_puts(m, "\nGroups:\t"); |
| 203 | group_info = cred->group_info; |
| 204 | for (g = 0; g < group_info->ngroups; g++) |
| 205 | seq_put_decimal_ull(m, g ? " " : "", |
| 206 | from_kgid_munged(user_ns, group_info->gid[g])); |
| 207 | put_cred(cred); |
| 208 | /* Trailing space shouldn't have been added in the first place. */ |
| 209 | seq_putc(m, ' '); |
| 210 | |
| 211 | #ifdef CONFIG_PID_NS |
| 212 | seq_puts(m, "\nNStgid:"); |
| 213 | for (g = ns->level; g <= pid->level; g++) |
| 214 | seq_put_decimal_ull(m, "\t", task_tgid_nr_ns(p, pid->numbers[g].ns)); |
| 215 | seq_puts(m, "\nNSpid:"); |
| 216 | for (g = ns->level; g <= pid->level; g++) |
| 217 | seq_put_decimal_ull(m, "\t", task_pid_nr_ns(p, pid->numbers[g].ns)); |
| 218 | seq_puts(m, "\nNSpgid:"); |
| 219 | for (g = ns->level; g <= pid->level; g++) |
| 220 | seq_put_decimal_ull(m, "\t", task_pgrp_nr_ns(p, pid->numbers[g].ns)); |
| 221 | seq_puts(m, "\nNSsid:"); |
| 222 | for (g = ns->level; g <= pid->level; g++) |
| 223 | seq_put_decimal_ull(m, "\t", task_session_nr_ns(p, pid->numbers[g].ns)); |
| 224 | #endif |
| 225 | seq_putc(m, '\n'); |
| 226 | } |
| 227 | |
| 228 | void render_sigset_t(struct seq_file *m, const char *header, |
| 229 | sigset_t *set) |
| 230 | { |
| 231 | int i; |
| 232 | |
| 233 | seq_puts(m, header); |
| 234 | |
| 235 | i = _NSIG; |
| 236 | do { |
| 237 | int x = 0; |
| 238 | |
| 239 | i -= 4; |
| 240 | if (sigismember(set, i+1)) x |= 1; |
| 241 | if (sigismember(set, i+2)) x |= 2; |
| 242 | if (sigismember(set, i+3)) x |= 4; |
| 243 | if (sigismember(set, i+4)) x |= 8; |
| 244 | seq_putc(m, hex_asc[x]); |
| 245 | } while (i >= 4); |
| 246 | |
| 247 | seq_putc(m, '\n'); |
| 248 | } |
| 249 | |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 250 | static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *sigign, |
| 251 | sigset_t *sigcatch) |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 252 | { |
| 253 | struct k_sigaction *k; |
| 254 | int i; |
| 255 | |
| 256 | k = p->sighand->action; |
| 257 | for (i = 1; i <= _NSIG; ++i, ++k) { |
| 258 | if (k->sa.sa_handler == SIG_IGN) |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 259 | sigaddset(sigign, i); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 260 | else if (k->sa.sa_handler != SIG_DFL) |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 261 | sigaddset(sigcatch, i); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 262 | } |
| 263 | } |
| 264 | |
| 265 | static inline void task_sig(struct seq_file *m, struct task_struct *p) |
| 266 | { |
| 267 | unsigned long flags; |
| 268 | sigset_t pending, shpending, blocked, ignored, caught; |
| 269 | int num_threads = 0; |
| 270 | unsigned int qsize = 0; |
| 271 | unsigned long qlim = 0; |
| 272 | |
| 273 | sigemptyset(&pending); |
| 274 | sigemptyset(&shpending); |
| 275 | sigemptyset(&blocked); |
| 276 | sigemptyset(&ignored); |
| 277 | sigemptyset(&caught); |
| 278 | |
| 279 | if (lock_task_sighand(p, &flags)) { |
| 280 | pending = p->pending.signal; |
| 281 | shpending = p->signal->shared_pending.signal; |
| 282 | blocked = p->blocked; |
| 283 | collect_sigign_sigcatch(p, &ignored, &caught); |
| 284 | num_threads = get_nr_threads(p); |
| 285 | rcu_read_lock(); /* FIXME: is this correct? */ |
| 286 | qsize = atomic_read(&__task_cred(p)->user->sigpending); |
| 287 | rcu_read_unlock(); |
| 288 | qlim = task_rlimit(p, RLIMIT_SIGPENDING); |
| 289 | unlock_task_sighand(p, &flags); |
| 290 | } |
| 291 | |
| 292 | seq_put_decimal_ull(m, "Threads:\t", num_threads); |
| 293 | seq_put_decimal_ull(m, "\nSigQ:\t", qsize); |
| 294 | seq_put_decimal_ull(m, "/", qlim); |
| 295 | |
| 296 | /* render them all */ |
| 297 | render_sigset_t(m, "\nSigPnd:\t", &pending); |
| 298 | render_sigset_t(m, "ShdPnd:\t", &shpending); |
| 299 | render_sigset_t(m, "SigBlk:\t", &blocked); |
| 300 | render_sigset_t(m, "SigIgn:\t", &ignored); |
| 301 | render_sigset_t(m, "SigCgt:\t", &caught); |
| 302 | } |
| 303 | |
| 304 | static void render_cap_t(struct seq_file *m, const char *header, |
| 305 | kernel_cap_t *a) |
| 306 | { |
| 307 | unsigned __capi; |
| 308 | |
| 309 | seq_puts(m, header); |
| 310 | CAP_FOR_EACH_U32(__capi) { |
| 311 | seq_put_hex_ll(m, NULL, |
| 312 | a->cap[CAP_LAST_U32 - __capi], 8); |
| 313 | } |
| 314 | seq_putc(m, '\n'); |
| 315 | } |
| 316 | |
| 317 | static inline void task_cap(struct seq_file *m, struct task_struct *p) |
| 318 | { |
| 319 | const struct cred *cred; |
| 320 | kernel_cap_t cap_inheritable, cap_permitted, cap_effective, |
| 321 | cap_bset, cap_ambient; |
| 322 | |
| 323 | rcu_read_lock(); |
| 324 | cred = __task_cred(p); |
| 325 | cap_inheritable = cred->cap_inheritable; |
| 326 | cap_permitted = cred->cap_permitted; |
| 327 | cap_effective = cred->cap_effective; |
| 328 | cap_bset = cred->cap_bset; |
| 329 | cap_ambient = cred->cap_ambient; |
| 330 | rcu_read_unlock(); |
| 331 | |
| 332 | render_cap_t(m, "CapInh:\t", &cap_inheritable); |
| 333 | render_cap_t(m, "CapPrm:\t", &cap_permitted); |
| 334 | render_cap_t(m, "CapEff:\t", &cap_effective); |
| 335 | render_cap_t(m, "CapBnd:\t", &cap_bset); |
| 336 | render_cap_t(m, "CapAmb:\t", &cap_ambient); |
| 337 | } |
| 338 | |
| 339 | static inline void task_seccomp(struct seq_file *m, struct task_struct *p) |
| 340 | { |
| 341 | seq_put_decimal_ull(m, "NoNewPrivs:\t", task_no_new_privs(p)); |
| 342 | #ifdef CONFIG_SECCOMP |
| 343 | seq_put_decimal_ull(m, "\nSeccomp:\t", p->seccomp.mode); |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 344 | #ifdef CONFIG_SECCOMP_FILTER |
| 345 | seq_put_decimal_ull(m, "\nSeccomp_filters:\t", |
| 346 | atomic_read(&p->seccomp.filter_count)); |
| 347 | #endif |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 348 | #endif |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 349 | seq_puts(m, "\nSpeculation_Store_Bypass:\t"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 350 | switch (arch_prctl_spec_ctrl_get(p, PR_SPEC_STORE_BYPASS)) { |
| 351 | case -EINVAL: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 352 | seq_puts(m, "unknown"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 353 | break; |
| 354 | case PR_SPEC_NOT_AFFECTED: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 355 | seq_puts(m, "not vulnerable"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 356 | break; |
| 357 | case PR_SPEC_PRCTL | PR_SPEC_FORCE_DISABLE: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 358 | seq_puts(m, "thread force mitigated"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 359 | break; |
| 360 | case PR_SPEC_PRCTL | PR_SPEC_DISABLE: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 361 | seq_puts(m, "thread mitigated"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 362 | break; |
| 363 | case PR_SPEC_PRCTL | PR_SPEC_ENABLE: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 364 | seq_puts(m, "thread vulnerable"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 365 | break; |
| 366 | case PR_SPEC_DISABLE: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 367 | seq_puts(m, "globally mitigated"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 368 | break; |
| 369 | default: |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 370 | seq_puts(m, "vulnerable"); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 371 | break; |
| 372 | } |
| 373 | seq_putc(m, '\n'); |
| 374 | } |
| 375 | |
| 376 | static inline void task_context_switch_counts(struct seq_file *m, |
| 377 | struct task_struct *p) |
| 378 | { |
| 379 | seq_put_decimal_ull(m, "voluntary_ctxt_switches:\t", p->nvcsw); |
| 380 | seq_put_decimal_ull(m, "\nnonvoluntary_ctxt_switches:\t", p->nivcsw); |
| 381 | seq_putc(m, '\n'); |
| 382 | } |
| 383 | |
| 384 | static void task_cpus_allowed(struct seq_file *m, struct task_struct *task) |
| 385 | { |
| 386 | seq_printf(m, "Cpus_allowed:\t%*pb\n", |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 387 | cpumask_pr_args(task->cpus_ptr)); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 388 | seq_printf(m, "Cpus_allowed_list:\t%*pbl\n", |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 389 | cpumask_pr_args(task->cpus_ptr)); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 390 | } |
| 391 | |
| 392 | static inline void task_core_dumping(struct seq_file *m, struct mm_struct *mm) |
| 393 | { |
| 394 | seq_put_decimal_ull(m, "CoreDumping:\t", !!mm->core_state); |
| 395 | seq_putc(m, '\n'); |
| 396 | } |
| 397 | |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 398 | static inline void task_thp_status(struct seq_file *m, struct mm_struct *mm) |
| 399 | { |
| 400 | bool thp_enabled = IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE); |
| 401 | |
| 402 | if (thp_enabled) |
| 403 | thp_enabled = !test_bit(MMF_DISABLE_THP, &mm->flags); |
| 404 | seq_printf(m, "THP_enabled:\t%d\n", thp_enabled); |
| 405 | } |
| 406 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 407 | int proc_pid_status(struct seq_file *m, struct pid_namespace *ns, |
| 408 | struct pid *pid, struct task_struct *task) |
| 409 | { |
| 410 | struct mm_struct *mm = get_task_mm(task); |
| 411 | |
| 412 | seq_puts(m, "Name:\t"); |
| 413 | proc_task_name(m, task, true); |
| 414 | seq_putc(m, '\n'); |
| 415 | |
| 416 | task_state(m, ns, pid, task); |
| 417 | |
| 418 | if (mm) { |
| 419 | task_mem(m, mm); |
| 420 | task_core_dumping(m, mm); |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 421 | task_thp_status(m, mm); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 422 | mmput(mm); |
| 423 | } |
| 424 | task_sig(m, task); |
| 425 | task_cap(m, task); |
| 426 | task_seccomp(m, task); |
| 427 | task_cpus_allowed(m, task); |
| 428 | cpuset_task_status_allowed(m, task); |
| 429 | task_context_switch_counts(m, task); |
| 430 | return 0; |
| 431 | } |
| 432 | |
| 433 | static int do_task_stat(struct seq_file *m, struct pid_namespace *ns, |
| 434 | struct pid *pid, struct task_struct *task, int whole) |
| 435 | { |
| 436 | unsigned long vsize, eip, esp, wchan = 0; |
| 437 | int priority, nice; |
| 438 | int tty_pgrp = -1, tty_nr = 0; |
| 439 | sigset_t sigign, sigcatch; |
| 440 | char state; |
| 441 | pid_t ppid = 0, pgid = -1, sid = -1; |
| 442 | int num_threads = 0; |
| 443 | int permitted; |
| 444 | struct mm_struct *mm; |
| 445 | unsigned long long start_time; |
| 446 | unsigned long cmin_flt = 0, cmaj_flt = 0; |
| 447 | unsigned long min_flt = 0, maj_flt = 0; |
| 448 | u64 cutime, cstime, utime, stime; |
| 449 | u64 cgtime, gtime; |
| 450 | unsigned long rsslim = 0; |
| 451 | unsigned long flags; |
| 452 | |
| 453 | state = *get_task_state(task); |
| 454 | vsize = eip = esp = 0; |
| 455 | permitted = ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS | PTRACE_MODE_NOAUDIT); |
| 456 | mm = get_task_mm(task); |
| 457 | if (mm) { |
| 458 | vsize = task_vsize(mm); |
| 459 | /* |
| 460 | * esp and eip are intentionally zeroed out. There is no |
| 461 | * non-racy way to read them without freezing the task. |
| 462 | * Programs that need reliable values can use ptrace(2). |
| 463 | * |
| 464 | * The only exception is if the task is core dumping because |
| 465 | * a program is not able to use ptrace(2) in that case. It is |
| 466 | * safe because the task has stopped executing permanently. |
| 467 | */ |
David Brazdil | 0f672f6 | 2019-12-10 10:32:29 +0000 | [diff] [blame] | 468 | if (permitted && (task->flags & (PF_EXITING|PF_DUMPCORE))) { |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 469 | if (try_get_task_stack(task)) { |
| 470 | eip = KSTK_EIP(task); |
| 471 | esp = KSTK_ESP(task); |
| 472 | put_task_stack(task); |
| 473 | } |
| 474 | } |
| 475 | } |
| 476 | |
| 477 | sigemptyset(&sigign); |
| 478 | sigemptyset(&sigcatch); |
| 479 | cutime = cstime = utime = stime = 0; |
| 480 | cgtime = gtime = 0; |
| 481 | |
| 482 | if (lock_task_sighand(task, &flags)) { |
| 483 | struct signal_struct *sig = task->signal; |
| 484 | |
| 485 | if (sig->tty) { |
| 486 | struct pid *pgrp = tty_get_pgrp(sig->tty); |
| 487 | tty_pgrp = pid_nr_ns(pgrp, ns); |
| 488 | put_pid(pgrp); |
| 489 | tty_nr = new_encode_dev(tty_devnum(sig->tty)); |
| 490 | } |
| 491 | |
| 492 | num_threads = get_nr_threads(task); |
| 493 | collect_sigign_sigcatch(task, &sigign, &sigcatch); |
| 494 | |
| 495 | cmin_flt = sig->cmin_flt; |
| 496 | cmaj_flt = sig->cmaj_flt; |
| 497 | cutime = sig->cutime; |
| 498 | cstime = sig->cstime; |
| 499 | cgtime = sig->cgtime; |
| 500 | rsslim = READ_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur); |
| 501 | |
| 502 | /* add up live thread stats at the group level */ |
| 503 | if (whole) { |
| 504 | struct task_struct *t = task; |
| 505 | do { |
| 506 | min_flt += t->min_flt; |
| 507 | maj_flt += t->maj_flt; |
| 508 | gtime += task_gtime(t); |
| 509 | } while_each_thread(task, t); |
| 510 | |
| 511 | min_flt += sig->min_flt; |
| 512 | maj_flt += sig->maj_flt; |
| 513 | thread_group_cputime_adjusted(task, &utime, &stime); |
| 514 | gtime += sig->gtime; |
| 515 | } |
| 516 | |
| 517 | sid = task_session_nr_ns(task, ns); |
| 518 | ppid = task_tgid_nr_ns(task->real_parent, ns); |
| 519 | pgid = task_pgrp_nr_ns(task, ns); |
| 520 | |
| 521 | unlock_task_sighand(task, &flags); |
| 522 | } |
| 523 | |
| 524 | if (permitted && (!whole || num_threads < 2)) |
| 525 | wchan = get_wchan(task); |
| 526 | if (!whole) { |
| 527 | min_flt = task->min_flt; |
| 528 | maj_flt = task->maj_flt; |
| 529 | task_cputime_adjusted(task, &utime, &stime); |
| 530 | gtime = task_gtime(task); |
| 531 | } |
| 532 | |
| 533 | /* scale priority and nice values from timeslices to -20..20 */ |
| 534 | /* to make it look like a "normal" Unix priority/nice value */ |
| 535 | priority = task_prio(task); |
| 536 | nice = task_nice(task); |
| 537 | |
| 538 | /* convert nsec -> ticks */ |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 539 | start_time = nsec_to_clock_t(task->start_boottime); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 540 | |
| 541 | seq_put_decimal_ull(m, "", pid_nr_ns(pid, ns)); |
| 542 | seq_puts(m, " ("); |
| 543 | proc_task_name(m, task, false); |
| 544 | seq_puts(m, ") "); |
| 545 | seq_putc(m, state); |
| 546 | seq_put_decimal_ll(m, " ", ppid); |
| 547 | seq_put_decimal_ll(m, " ", pgid); |
| 548 | seq_put_decimal_ll(m, " ", sid); |
| 549 | seq_put_decimal_ll(m, " ", tty_nr); |
| 550 | seq_put_decimal_ll(m, " ", tty_pgrp); |
| 551 | seq_put_decimal_ull(m, " ", task->flags); |
| 552 | seq_put_decimal_ull(m, " ", min_flt); |
| 553 | seq_put_decimal_ull(m, " ", cmin_flt); |
| 554 | seq_put_decimal_ull(m, " ", maj_flt); |
| 555 | seq_put_decimal_ull(m, " ", cmaj_flt); |
| 556 | seq_put_decimal_ull(m, " ", nsec_to_clock_t(utime)); |
| 557 | seq_put_decimal_ull(m, " ", nsec_to_clock_t(stime)); |
| 558 | seq_put_decimal_ll(m, " ", nsec_to_clock_t(cutime)); |
| 559 | seq_put_decimal_ll(m, " ", nsec_to_clock_t(cstime)); |
| 560 | seq_put_decimal_ll(m, " ", priority); |
| 561 | seq_put_decimal_ll(m, " ", nice); |
| 562 | seq_put_decimal_ll(m, " ", num_threads); |
| 563 | seq_put_decimal_ull(m, " ", 0); |
| 564 | seq_put_decimal_ull(m, " ", start_time); |
| 565 | seq_put_decimal_ull(m, " ", vsize); |
| 566 | seq_put_decimal_ull(m, " ", mm ? get_mm_rss(mm) : 0); |
| 567 | seq_put_decimal_ull(m, " ", rsslim); |
| 568 | seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->start_code : 1) : 0); |
| 569 | seq_put_decimal_ull(m, " ", mm ? (permitted ? mm->end_code : 1) : 0); |
| 570 | seq_put_decimal_ull(m, " ", (permitted && mm) ? mm->start_stack : 0); |
| 571 | seq_put_decimal_ull(m, " ", esp); |
| 572 | seq_put_decimal_ull(m, " ", eip); |
| 573 | /* The signal information here is obsolete. |
| 574 | * It must be decimal for Linux 2.0 compatibility. |
| 575 | * Use /proc/#/status for real-time signals. |
| 576 | */ |
| 577 | seq_put_decimal_ull(m, " ", task->pending.signal.sig[0] & 0x7fffffffUL); |
| 578 | seq_put_decimal_ull(m, " ", task->blocked.sig[0] & 0x7fffffffUL); |
| 579 | seq_put_decimal_ull(m, " ", sigign.sig[0] & 0x7fffffffUL); |
| 580 | seq_put_decimal_ull(m, " ", sigcatch.sig[0] & 0x7fffffffUL); |
| 581 | |
| 582 | /* |
| 583 | * We used to output the absolute kernel address, but that's an |
| 584 | * information leak - so instead we show a 0/1 flag here, to signal |
| 585 | * to user-space whether there's a wchan field in /proc/PID/wchan. |
| 586 | * |
| 587 | * This works with older implementations of procps as well. |
| 588 | */ |
| 589 | if (wchan) |
| 590 | seq_puts(m, " 1"); |
| 591 | else |
| 592 | seq_puts(m, " 0"); |
| 593 | |
| 594 | seq_put_decimal_ull(m, " ", 0); |
| 595 | seq_put_decimal_ull(m, " ", 0); |
| 596 | seq_put_decimal_ll(m, " ", task->exit_signal); |
| 597 | seq_put_decimal_ll(m, " ", task_cpu(task)); |
| 598 | seq_put_decimal_ull(m, " ", task->rt_priority); |
| 599 | seq_put_decimal_ull(m, " ", task->policy); |
| 600 | seq_put_decimal_ull(m, " ", delayacct_blkio_ticks(task)); |
| 601 | seq_put_decimal_ull(m, " ", nsec_to_clock_t(gtime)); |
| 602 | seq_put_decimal_ll(m, " ", nsec_to_clock_t(cgtime)); |
| 603 | |
| 604 | if (mm && permitted) { |
| 605 | seq_put_decimal_ull(m, " ", mm->start_data); |
| 606 | seq_put_decimal_ull(m, " ", mm->end_data); |
| 607 | seq_put_decimal_ull(m, " ", mm->start_brk); |
| 608 | seq_put_decimal_ull(m, " ", mm->arg_start); |
| 609 | seq_put_decimal_ull(m, " ", mm->arg_end); |
| 610 | seq_put_decimal_ull(m, " ", mm->env_start); |
| 611 | seq_put_decimal_ull(m, " ", mm->env_end); |
| 612 | } else |
| 613 | seq_puts(m, " 0 0 0 0 0 0 0"); |
| 614 | |
| 615 | if (permitted) |
| 616 | seq_put_decimal_ll(m, " ", task->exit_code); |
| 617 | else |
| 618 | seq_puts(m, " 0"); |
| 619 | |
| 620 | seq_putc(m, '\n'); |
| 621 | if (mm) |
| 622 | mmput(mm); |
| 623 | return 0; |
| 624 | } |
| 625 | |
| 626 | int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns, |
| 627 | struct pid *pid, struct task_struct *task) |
| 628 | { |
| 629 | return do_task_stat(m, ns, pid, task, 0); |
| 630 | } |
| 631 | |
| 632 | int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns, |
| 633 | struct pid *pid, struct task_struct *task) |
| 634 | { |
| 635 | return do_task_stat(m, ns, pid, task, 1); |
| 636 | } |
| 637 | |
| 638 | int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns, |
| 639 | struct pid *pid, struct task_struct *task) |
| 640 | { |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 641 | struct mm_struct *mm = get_task_mm(task); |
| 642 | |
| 643 | if (mm) { |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 644 | unsigned long size; |
| 645 | unsigned long resident = 0; |
| 646 | unsigned long shared = 0; |
| 647 | unsigned long text = 0; |
| 648 | unsigned long data = 0; |
| 649 | |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 650 | size = task_statm(mm, &shared, &text, &data, &resident); |
| 651 | mmput(mm); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 652 | |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 653 | /* |
| 654 | * For quick read, open code by putting numbers directly |
| 655 | * expected format is |
| 656 | * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n", |
| 657 | * size, resident, shared, text, data); |
| 658 | */ |
| 659 | seq_put_decimal_ull(m, "", size); |
| 660 | seq_put_decimal_ull(m, " ", resident); |
| 661 | seq_put_decimal_ull(m, " ", shared); |
| 662 | seq_put_decimal_ull(m, " ", text); |
| 663 | seq_put_decimal_ull(m, " ", 0); |
| 664 | seq_put_decimal_ull(m, " ", data); |
| 665 | seq_put_decimal_ull(m, " ", 0); |
| 666 | seq_putc(m, '\n'); |
| 667 | } else { |
| 668 | seq_write(m, "0 0 0 0 0 0 0\n", 14); |
| 669 | } |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 670 | return 0; |
| 671 | } |
| 672 | |
| 673 | #ifdef CONFIG_PROC_CHILDREN |
| 674 | static struct pid * |
| 675 | get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos) |
| 676 | { |
| 677 | struct task_struct *start, *task; |
| 678 | struct pid *pid = NULL; |
| 679 | |
| 680 | read_lock(&tasklist_lock); |
| 681 | |
| 682 | start = pid_task(proc_pid(inode), PIDTYPE_PID); |
| 683 | if (!start) |
| 684 | goto out; |
| 685 | |
| 686 | /* |
| 687 | * Lets try to continue searching first, this gives |
| 688 | * us significant speedup on children-rich processes. |
| 689 | */ |
| 690 | if (pid_prev) { |
| 691 | task = pid_task(pid_prev, PIDTYPE_PID); |
| 692 | if (task && task->real_parent == start && |
| 693 | !(list_empty(&task->sibling))) { |
| 694 | if (list_is_last(&task->sibling, &start->children)) |
| 695 | goto out; |
| 696 | task = list_first_entry(&task->sibling, |
| 697 | struct task_struct, sibling); |
| 698 | pid = get_pid(task_pid(task)); |
| 699 | goto out; |
| 700 | } |
| 701 | } |
| 702 | |
| 703 | /* |
| 704 | * Slow search case. |
| 705 | * |
| 706 | * We might miss some children here if children |
| 707 | * are exited while we were not holding the lock, |
| 708 | * but it was never promised to be accurate that |
| 709 | * much. |
| 710 | * |
| 711 | * "Just suppose that the parent sleeps, but N children |
| 712 | * exit after we printed their tids. Now the slow paths |
| 713 | * skips N extra children, we miss N tasks." (c) |
| 714 | * |
| 715 | * So one need to stop or freeze the leader and all |
| 716 | * its children to get a precise result. |
| 717 | */ |
| 718 | list_for_each_entry(task, &start->children, sibling) { |
| 719 | if (pos-- == 0) { |
| 720 | pid = get_pid(task_pid(task)); |
| 721 | break; |
| 722 | } |
| 723 | } |
| 724 | |
| 725 | out: |
| 726 | read_unlock(&tasklist_lock); |
| 727 | return pid; |
| 728 | } |
| 729 | |
| 730 | static int children_seq_show(struct seq_file *seq, void *v) |
| 731 | { |
| 732 | struct inode *inode = file_inode(seq->file); |
| 733 | |
Olivier Deprez | 157378f | 2022-04-04 15:47:50 +0200 | [diff] [blame^] | 734 | seq_printf(seq, "%d ", pid_nr_ns(v, proc_pid_ns(inode->i_sb))); |
Andrew Scull | b4b6d4a | 2019-01-02 15:54:55 +0000 | [diff] [blame] | 735 | return 0; |
| 736 | } |
| 737 | |
| 738 | static void *children_seq_start(struct seq_file *seq, loff_t *pos) |
| 739 | { |
| 740 | return get_children_pid(file_inode(seq->file), NULL, *pos); |
| 741 | } |
| 742 | |
| 743 | static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos) |
| 744 | { |
| 745 | struct pid *pid; |
| 746 | |
| 747 | pid = get_children_pid(file_inode(seq->file), v, *pos + 1); |
| 748 | put_pid(v); |
| 749 | |
| 750 | ++*pos; |
| 751 | return pid; |
| 752 | } |
| 753 | |
| 754 | static void children_seq_stop(struct seq_file *seq, void *v) |
| 755 | { |
| 756 | put_pid(v); |
| 757 | } |
| 758 | |
| 759 | static const struct seq_operations children_seq_ops = { |
| 760 | .start = children_seq_start, |
| 761 | .next = children_seq_next, |
| 762 | .stop = children_seq_stop, |
| 763 | .show = children_seq_show, |
| 764 | }; |
| 765 | |
| 766 | static int children_seq_open(struct inode *inode, struct file *file) |
| 767 | { |
| 768 | return seq_open(file, &children_seq_ops); |
| 769 | } |
| 770 | |
| 771 | const struct file_operations proc_tid_children_operations = { |
| 772 | .open = children_seq_open, |
| 773 | .read = seq_read, |
| 774 | .llseek = seq_lseek, |
| 775 | .release = seq_release, |
| 776 | }; |
| 777 | #endif /* CONFIG_PROC_CHILDREN */ |