| 1 | // SPDX-License-Identifier: GPL-2.0 |
| 2 | /* |
| 3 | * linux/fs/proc/array.c |
| 4 | * |
| 5 | * Copyright (C) 1992 by Linus Torvalds |
| 6 | * based on ideas by Darren Senn |
| 7 | * |
| 8 | * Fixes: |
| 9 | * Michael. K. Johnson: stat,statm extensions. |
| 10 | * <johnsonm@stolaf.edu> |
| 11 | * |
| 12 | * Pauline Middelink : Made cmdline,envline only break at '\0's, to |
| 13 | * make sure SET_PROCTITLE works. Also removed |
| 14 | * bad '!' which forced address recalculation for |
| 15 | * EVERY character on the current page. |
| 16 | * <middelin@polyware.iaf.nl> |
| 17 | * |
| 18 | * Danny ter Haar : added cpuinfo |
| 19 | * <dth@cistron.nl> |
| 20 | * |
| 21 | * Alessandro Rubini : profile extension. |
| 22 | * <rubini@ipvvis.unipv.it> |
| 23 | * |
| 24 | * Jeff Tranter : added BogoMips field to cpuinfo |
| 25 | * <Jeff_Tranter@Mitel.COM> |
| 26 | * |
| 27 | * Bruno Haible : remove 4K limit for the maps file |
| 28 | * <haible@ma2s2.mathematik.uni-karlsruhe.de> |
| 29 | * |
| 30 | * Yves Arrouye : remove removal of trailing spaces in get_array. |
| 31 | * <Yves.Arrouye@marin.fdn.fr> |
| 32 | * |
| 33 | * Jerome Forissier : added per-CPU time information to /proc/stat |
| 34 | * and /proc/<pid>/cpu extension |
| 35 | * <forissier@isia.cma.fr> |
| 36 | * - Incorporation and non-SMP safe operation |
| 37 | * of forissier patch in 2.1.78 by |
| 38 | * Hans Marcus <crowbar@concepts.nl> |
| 39 | * |
| 40 | * aeb@cwi.nl : /proc/partitions |
| 41 | * |
| 42 | * |
| 43 | * Alan Cox : security fixes. |
| 44 | * <alan@lxorguk.ukuu.org.uk> |
| 45 | * |
| 46 | * Al Viro : safe handling of mm_struct |
| 47 | * |
| 48 | * Gerhard Wichert : added BIGMEM support |
| 49 | * Siemens AG <Gerhard.Wichert@pdb.siemens.de> |
| 50 | * |
| 51 | * Al Viro & Jeff Garzik : moved most of the thing into base.c and |
| 52 | * : proc_misc.c. The rest may eventually go into |
| 53 | * : base.c too. |
| 54 | */ |
| 55 | |
| 56 | #include <linux/types.h> |
| 57 | #include <linux/errno.h> |
| 58 | #include <linux/time.h> |
| 59 | #include <linux/time_namespace.h> |
| 60 | #include <linux/kernel.h> |
| 61 | #include <linux/kernel_stat.h> |
| 62 | #include <linux/tty.h> |
| 63 | #include <linux/string.h> |
| 64 | #include <linux/mman.h> |
| 65 | #include <linux/sched/mm.h> |
| 66 | #include <linux/sched/numa_balancing.h> |
| 67 | #include <linux/sched/task_stack.h> |
| 68 | #include <linux/sched/task.h> |
| 69 | #include <linux/sched/cputime.h> |
| 70 | #include <linux/proc_fs.h> |
| 71 | #include <linux/ioport.h> |
| 72 | #include <linux/io.h> |
| 73 | #include <linux/mm.h> |
| 74 | #include <linux/hugetlb.h> |
| 75 | #include <linux/pagemap.h> |
| 76 | #include <linux/swap.h> |
| 77 | #include <linux/smp.h> |
| 78 | #include <linux/signal.h> |
| 79 | #include <linux/highmem.h> |
| 80 | #include <linux/file.h> |
| 81 | #include <linux/fdtable.h> |
| 82 | #include <linux/times.h> |
| 83 | #include <linux/cpuset.h> |
| 84 | #include <linux/rcupdate.h> |
| 85 | #include <linux/delayacct.h> |
| 86 | #include <linux/seq_file.h> |
| 87 | #include <linux/pid_namespace.h> |
| 88 | #include <linux/prctl.h> |
| 89 | #include <linux/ptrace.h> |
| 90 | #include <linux/string_helpers.h> |
| 91 | #include <linux/user_namespace.h> |
| 92 | #include <linux/fs_struct.h> |
| 93 | #include <linux/kthread.h> |
| 94 | #include <linux/mmu_context.h> |
| 95 | |
| 96 | #include <asm/processor.h> |
| 97 | #include "internal.h" |
| 98 | |
| 99 | void proc_task_name(struct seq_file *m, struct task_struct *p, bool escape) |
| 100 | { |
| 101 | char tcomm[64]; |
| 102 | |
| 103 | /* |
| 104 | * Test before PF_KTHREAD because all workqueue worker threads are |
| 105 | * kernel threads. |
| 106 | */ |
| 107 | if (p->flags & PF_WQ_WORKER) |
| 108 | wq_worker_comm(buf: tcomm, size: sizeof(tcomm), task: p); |
| 109 | else if (p->flags & PF_KTHREAD) |
| 110 | get_kthread_comm(buf: tcomm, buf_size: sizeof(tcomm), tsk: p); |
| 111 | else |
| 112 | get_task_comm(tcomm, p); |
| 113 | |
| 114 | if (escape) |
| 115 | seq_escape_str(m, src: tcomm, ESCAPE_SPACE | ESCAPE_SPECIAL, esc: "\n\\" ); |
| 116 | else |
| 117 | seq_printf(m, fmt: "%.64s" , tcomm); |
| 118 | } |
| 119 | |
/*
 * Human-readable task state names.
 *
 * Slot 0 is "running"; every following slot stands for one state bit, whose
 * mask is noted next to the entry.  The leading character of each string is
 * the one-letter state code.
 */
static const char * const task_state_array[] = {
	/* states in TASK_REPORT: */
	[0] = "R (running)",		/* 0x00 */
	[1] = "S (sleeping)",		/* 0x01 */
	[2] = "D (disk sleep)",		/* 0x02 */
	[3] = "T (stopped)",		/* 0x04 */
	[4] = "t (tracing stop)",	/* 0x08 */
	[5] = "X (dead)",		/* 0x10 */
	[6] = "Z (zombie)",		/* 0x20 */
	[7] = "P (parked)",		/* 0x40 */

	/* states beyond TASK_REPORT: */
	[8] = "I (idle)",		/* 0x80 */
};
| 141 | |
| 142 | static inline const char *get_task_state(struct task_struct *tsk) |
| 143 | { |
| 144 | BUILD_BUG_ON(1 + ilog2(TASK_REPORT_MAX) != ARRAY_SIZE(task_state_array)); |
| 145 | return task_state_array[task_state_index(tsk)]; |
| 146 | } |
| 147 | |
| 148 | static inline void task_state(struct seq_file *m, struct pid_namespace *ns, |
| 149 | struct pid *pid, struct task_struct *p) |
| 150 | { |
| 151 | struct user_namespace *user_ns = seq_user_ns(seq: m); |
| 152 | struct group_info *group_info; |
| 153 | int g, umask = -1; |
| 154 | struct task_struct *tracer; |
| 155 | const struct cred *cred; |
| 156 | pid_t ppid, tpid = 0, tgid, ngid; |
| 157 | unsigned int max_fds = 0; |
| 158 | |
| 159 | rcu_read_lock(); |
| 160 | tracer = ptrace_parent(task: p); |
| 161 | if (tracer) |
| 162 | tpid = task_pid_nr_ns(tsk: tracer, ns); |
| 163 | |
| 164 | ppid = task_ppid_nr_ns(tsk: p, ns); |
| 165 | tgid = task_tgid_nr_ns(tsk: p, ns); |
| 166 | ngid = task_numa_group_id(p); |
| 167 | cred = get_task_cred(p); |
| 168 | |
| 169 | task_lock(p); |
| 170 | if (p->fs) |
| 171 | umask = p->fs->umask; |
| 172 | if (p->files) |
| 173 | max_fds = files_fdtable(p->files)->max_fds; |
| 174 | task_unlock(p); |
| 175 | rcu_read_unlock(); |
| 176 | |
| 177 | if (umask >= 0) |
| 178 | seq_printf(m, fmt: "Umask:\t%#04o\n" , umask); |
| 179 | seq_puts(m, s: "State:\t" ); |
| 180 | seq_puts(m, s: get_task_state(tsk: p)); |
| 181 | |
| 182 | seq_put_decimal_ull(m, delimiter: "\nTgid:\t" , num: tgid); |
| 183 | seq_put_decimal_ull(m, delimiter: "\nNgid:\t" , num: ngid); |
| 184 | seq_put_decimal_ull(m, delimiter: "\nPid:\t" , num: pid_nr_ns(pid, ns)); |
| 185 | seq_put_decimal_ull(m, delimiter: "\nPPid:\t" , num: ppid); |
| 186 | seq_put_decimal_ull(m, delimiter: "\nTracerPid:\t" , num: tpid); |
| 187 | seq_put_decimal_ull(m, delimiter: "\nUid:\t" , num: from_kuid_munged(to: user_ns, uid: cred->uid)); |
| 188 | seq_put_decimal_ull(m, delimiter: "\t" , num: from_kuid_munged(to: user_ns, uid: cred->euid)); |
| 189 | seq_put_decimal_ull(m, delimiter: "\t" , num: from_kuid_munged(to: user_ns, uid: cred->suid)); |
| 190 | seq_put_decimal_ull(m, delimiter: "\t" , num: from_kuid_munged(to: user_ns, uid: cred->fsuid)); |
| 191 | seq_put_decimal_ull(m, delimiter: "\nGid:\t" , num: from_kgid_munged(to: user_ns, gid: cred->gid)); |
| 192 | seq_put_decimal_ull(m, delimiter: "\t" , num: from_kgid_munged(to: user_ns, gid: cred->egid)); |
| 193 | seq_put_decimal_ull(m, delimiter: "\t" , num: from_kgid_munged(to: user_ns, gid: cred->sgid)); |
| 194 | seq_put_decimal_ull(m, delimiter: "\t" , num: from_kgid_munged(to: user_ns, gid: cred->fsgid)); |
| 195 | seq_put_decimal_ull(m, delimiter: "\nFDSize:\t" , num: max_fds); |
| 196 | |
| 197 | seq_puts(m, s: "\nGroups:\t" ); |
| 198 | group_info = cred->group_info; |
| 199 | for (g = 0; g < group_info->ngroups; g++) |
| 200 | seq_put_decimal_ull(m, delimiter: g ? " " : "" , |
| 201 | num: from_kgid_munged(to: user_ns, gid: group_info->gid[g])); |
| 202 | put_cred(cred); |
| 203 | /* Trailing space shouldn't have been added in the first place. */ |
| 204 | seq_putc(m, c: ' '); |
| 205 | |
| 206 | #ifdef CONFIG_PID_NS |
| 207 | seq_puts(m, s: "\nNStgid:" ); |
| 208 | for (g = ns->level; g <= pid->level; g++) |
| 209 | seq_put_decimal_ull(m, delimiter: "\t" , num: task_tgid_nr_ns(tsk: p, ns: pid->numbers[g].ns)); |
| 210 | seq_puts(m, s: "\nNSpid:" ); |
| 211 | for (g = ns->level; g <= pid->level; g++) |
| 212 | seq_put_decimal_ull(m, delimiter: "\t" , num: task_pid_nr_ns(tsk: p, ns: pid->numbers[g].ns)); |
| 213 | seq_puts(m, s: "\nNSpgid:" ); |
| 214 | for (g = ns->level; g <= pid->level; g++) |
| 215 | seq_put_decimal_ull(m, delimiter: "\t" , num: task_pgrp_nr_ns(tsk: p, ns: pid->numbers[g].ns)); |
| 216 | seq_puts(m, s: "\nNSsid:" ); |
| 217 | for (g = ns->level; g <= pid->level; g++) |
| 218 | seq_put_decimal_ull(m, delimiter: "\t" , num: task_session_nr_ns(tsk: p, ns: pid->numbers[g].ns)); |
| 219 | #endif |
| 220 | seq_putc(m, c: '\n'); |
| 221 | |
| 222 | seq_printf(m, fmt: "Kthread:\t%c\n" , p->flags & PF_KTHREAD ? '1' : '0'); |
| 223 | } |
| 224 | |
| 225 | void render_sigset_t(struct seq_file *m, const char *, |
| 226 | sigset_t *set) |
| 227 | { |
| 228 | int i; |
| 229 | |
| 230 | seq_puts(m, s: header); |
| 231 | |
| 232 | i = _NSIG; |
| 233 | do { |
| 234 | int x = 0; |
| 235 | |
| 236 | i -= 4; |
| 237 | if (sigismember(set, sig: i+1)) x |= 1; |
| 238 | if (sigismember(set, sig: i+2)) x |= 2; |
| 239 | if (sigismember(set, sig: i+3)) x |= 4; |
| 240 | if (sigismember(set, sig: i+4)) x |= 8; |
| 241 | seq_putc(m, c: hex_asc[x]); |
| 242 | } while (i >= 4); |
| 243 | |
| 244 | seq_putc(m, c: '\n'); |
| 245 | } |
| 246 | |
| 247 | static void collect_sigign_sigcatch(struct task_struct *p, sigset_t *sigign, |
| 248 | sigset_t *sigcatch) |
| 249 | { |
| 250 | struct k_sigaction *k; |
| 251 | int i; |
| 252 | |
| 253 | k = p->sighand->action; |
| 254 | for (i = 1; i <= _NSIG; ++i, ++k) { |
| 255 | if (k->sa.sa_handler == SIG_IGN) |
| 256 | sigaddset(set: sigign, sig: i); |
| 257 | else if (k->sa.sa_handler != SIG_DFL) |
| 258 | sigaddset(set: sigcatch, sig: i); |
| 259 | } |
| 260 | } |
| 261 | |
| 262 | static inline void task_sig(struct seq_file *m, struct task_struct *p) |
| 263 | { |
| 264 | unsigned long flags; |
| 265 | sigset_t pending, shpending, blocked, ignored, caught; |
| 266 | int num_threads = 0; |
| 267 | unsigned int qsize = 0; |
| 268 | unsigned long qlim = 0; |
| 269 | |
| 270 | sigemptyset(set: &pending); |
| 271 | sigemptyset(set: &shpending); |
| 272 | sigemptyset(set: &blocked); |
| 273 | sigemptyset(set: &ignored); |
| 274 | sigemptyset(set: &caught); |
| 275 | |
| 276 | if (lock_task_sighand(task: p, flags: &flags)) { |
| 277 | pending = p->pending.signal; |
| 278 | shpending = p->signal->shared_pending.signal; |
| 279 | blocked = p->blocked; |
| 280 | collect_sigign_sigcatch(p, sigign: &ignored, sigcatch: &caught); |
| 281 | num_threads = get_nr_threads(task: p); |
| 282 | rcu_read_lock(); /* FIXME: is this correct? */ |
| 283 | qsize = get_rlimit_value(task_ucounts(p), type: UCOUNT_RLIMIT_SIGPENDING); |
| 284 | rcu_read_unlock(); |
| 285 | qlim = task_rlimit(task: p, RLIMIT_SIGPENDING); |
| 286 | unlock_task_sighand(task: p, flags: &flags); |
| 287 | } |
| 288 | |
| 289 | seq_put_decimal_ull(m, delimiter: "Threads:\t" , num: num_threads); |
| 290 | seq_put_decimal_ull(m, delimiter: "\nSigQ:\t" , num: qsize); |
| 291 | seq_put_decimal_ull(m, delimiter: "/" , num: qlim); |
| 292 | |
| 293 | /* render them all */ |
| 294 | render_sigset_t(m, header: "\nSigPnd:\t" , set: &pending); |
| 295 | render_sigset_t(m, header: "ShdPnd:\t" , set: &shpending); |
| 296 | render_sigset_t(m, header: "SigBlk:\t" , set: &blocked); |
| 297 | render_sigset_t(m, header: "SigIgn:\t" , set: &ignored); |
| 298 | render_sigset_t(m, header: "SigCgt:\t" , set: &caught); |
| 299 | } |
| 300 | |
| 301 | static void render_cap_t(struct seq_file *m, const char *, |
| 302 | kernel_cap_t *a) |
| 303 | { |
| 304 | seq_puts(m, s: header); |
| 305 | seq_put_hex_ll(m, NULL, v: a->val, width: 16); |
| 306 | seq_putc(m, c: '\n'); |
| 307 | } |
| 308 | |
| 309 | static inline void task_cap(struct seq_file *m, struct task_struct *p) |
| 310 | { |
| 311 | const struct cred *cred; |
| 312 | kernel_cap_t cap_inheritable, cap_permitted, cap_effective, |
| 313 | cap_bset, cap_ambient; |
| 314 | |
| 315 | rcu_read_lock(); |
| 316 | cred = __task_cred(p); |
| 317 | cap_inheritable = cred->cap_inheritable; |
| 318 | cap_permitted = cred->cap_permitted; |
| 319 | cap_effective = cred->cap_effective; |
| 320 | cap_bset = cred->cap_bset; |
| 321 | cap_ambient = cred->cap_ambient; |
| 322 | rcu_read_unlock(); |
| 323 | |
| 324 | render_cap_t(m, header: "CapInh:\t" , a: &cap_inheritable); |
| 325 | render_cap_t(m, header: "CapPrm:\t" , a: &cap_permitted); |
| 326 | render_cap_t(m, header: "CapEff:\t" , a: &cap_effective); |
| 327 | render_cap_t(m, header: "CapBnd:\t" , a: &cap_bset); |
| 328 | render_cap_t(m, header: "CapAmb:\t" , a: &cap_ambient); |
| 329 | } |
| 330 | |
| 331 | static inline void task_seccomp(struct seq_file *m, struct task_struct *p) |
| 332 | { |
| 333 | seq_put_decimal_ull(m, delimiter: "NoNewPrivs:\t" , num: task_no_new_privs(p)); |
| 334 | #ifdef CONFIG_SECCOMP |
| 335 | seq_put_decimal_ull(m, delimiter: "\nSeccomp:\t" , num: p->seccomp.mode); |
| 336 | #ifdef CONFIG_SECCOMP_FILTER |
| 337 | seq_put_decimal_ull(m, delimiter: "\nSeccomp_filters:\t" , |
| 338 | num: atomic_read(v: &p->seccomp.filter_count)); |
| 339 | #endif |
| 340 | #endif |
| 341 | seq_puts(m, s: "\nSpeculation_Store_Bypass:\t" ); |
| 342 | switch (arch_prctl_spec_ctrl_get(task: p, PR_SPEC_STORE_BYPASS)) { |
| 343 | case -EINVAL: |
| 344 | seq_puts(m, s: "unknown" ); |
| 345 | break; |
| 346 | case PR_SPEC_NOT_AFFECTED: |
| 347 | seq_puts(m, s: "not vulnerable" ); |
| 348 | break; |
| 349 | case PR_SPEC_PRCTL | PR_SPEC_FORCE_DISABLE: |
| 350 | seq_puts(m, s: "thread force mitigated" ); |
| 351 | break; |
| 352 | case PR_SPEC_PRCTL | PR_SPEC_DISABLE: |
| 353 | seq_puts(m, s: "thread mitigated" ); |
| 354 | break; |
| 355 | case PR_SPEC_PRCTL | PR_SPEC_ENABLE: |
| 356 | seq_puts(m, s: "thread vulnerable" ); |
| 357 | break; |
| 358 | case PR_SPEC_DISABLE: |
| 359 | seq_puts(m, s: "globally mitigated" ); |
| 360 | break; |
| 361 | default: |
| 362 | seq_puts(m, s: "vulnerable" ); |
| 363 | break; |
| 364 | } |
| 365 | |
| 366 | seq_puts(m, s: "\nSpeculationIndirectBranch:\t" ); |
| 367 | switch (arch_prctl_spec_ctrl_get(task: p, PR_SPEC_INDIRECT_BRANCH)) { |
| 368 | case -EINVAL: |
| 369 | seq_puts(m, s: "unsupported" ); |
| 370 | break; |
| 371 | case PR_SPEC_NOT_AFFECTED: |
| 372 | seq_puts(m, s: "not affected" ); |
| 373 | break; |
| 374 | case PR_SPEC_PRCTL | PR_SPEC_FORCE_DISABLE: |
| 375 | seq_puts(m, s: "conditional force disabled" ); |
| 376 | break; |
| 377 | case PR_SPEC_PRCTL | PR_SPEC_DISABLE: |
| 378 | seq_puts(m, s: "conditional disabled" ); |
| 379 | break; |
| 380 | case PR_SPEC_PRCTL | PR_SPEC_ENABLE: |
| 381 | seq_puts(m, s: "conditional enabled" ); |
| 382 | break; |
| 383 | case PR_SPEC_ENABLE: |
| 384 | seq_puts(m, s: "always enabled" ); |
| 385 | break; |
| 386 | case PR_SPEC_DISABLE: |
| 387 | seq_puts(m, s: "always disabled" ); |
| 388 | break; |
| 389 | default: |
| 390 | seq_puts(m, s: "unknown" ); |
| 391 | break; |
| 392 | } |
| 393 | seq_putc(m, c: '\n'); |
| 394 | } |
| 395 | |
| 396 | static inline void task_context_switch_counts(struct seq_file *m, |
| 397 | struct task_struct *p) |
| 398 | { |
| 399 | seq_put_decimal_ull(m, delimiter: "voluntary_ctxt_switches:\t" , num: p->nvcsw); |
| 400 | seq_put_decimal_ull(m, delimiter: "\nnonvoluntary_ctxt_switches:\t" , num: p->nivcsw); |
| 401 | seq_putc(m, c: '\n'); |
| 402 | } |
| 403 | |
| 404 | static void task_cpus_allowed(struct seq_file *m, struct task_struct *task) |
| 405 | { |
| 406 | seq_printf(m, fmt: "Cpus_allowed:\t%*pb\n" , |
| 407 | cpumask_pr_args(&task->cpus_mask)); |
| 408 | seq_printf(m, fmt: "Cpus_allowed_list:\t%*pbl\n" , |
| 409 | cpumask_pr_args(&task->cpus_mask)); |
| 410 | } |
| 411 | |
| 412 | static inline void task_core_dumping(struct seq_file *m, struct task_struct *task) |
| 413 | { |
| 414 | seq_put_decimal_ull(m, delimiter: "CoreDumping:\t" , num: !!task->signal->core_state); |
| 415 | seq_putc(m, c: '\n'); |
| 416 | } |
| 417 | |
| 418 | static inline void task_thp_status(struct seq_file *m, struct mm_struct *mm) |
| 419 | { |
| 420 | bool thp_enabled = IS_ENABLED(CONFIG_TRANSPARENT_HUGEPAGE); |
| 421 | |
| 422 | if (thp_enabled) |
| 423 | thp_enabled = !mm_flags_test(MMF_DISABLE_THP_COMPLETELY, mm); |
| 424 | seq_printf(m, fmt: "THP_enabled:\t%d\n" , thp_enabled); |
| 425 | } |
| 426 | |
/*
 * Emit the untag_mask line into @m: the value of mm_untag_mask(@mm) in
 * 0x-prefixed hexadecimal.
 */
static inline void task_untag_mask(struct seq_file *m, struct mm_struct *mm)
{
	seq_printf(m, "untag_mask:\t%#lx\n", mm_untag_mask(mm));
}
| 431 | |
| 432 | __weak void arch_proc_pid_thread_features(struct seq_file *m, |
| 433 | struct task_struct *task) |
| 434 | { |
| 435 | } |
| 436 | |
| 437 | int proc_pid_status(struct seq_file *m, struct pid_namespace *ns, |
| 438 | struct pid *pid, struct task_struct *task) |
| 439 | { |
| 440 | struct mm_struct *mm = get_task_mm(task); |
| 441 | |
| 442 | seq_puts(m, s: "Name:\t" ); |
| 443 | proc_task_name(m, p: task, escape: true); |
| 444 | seq_putc(m, c: '\n'); |
| 445 | |
| 446 | task_state(m, ns, pid, p: task); |
| 447 | |
| 448 | if (mm) { |
| 449 | task_mem(m, mm); |
| 450 | task_core_dumping(m, task); |
| 451 | task_thp_status(m, mm); |
| 452 | task_untag_mask(m, mm); |
| 453 | mmput(mm); |
| 454 | } |
| 455 | task_sig(m, p: task); |
| 456 | task_cap(m, p: task); |
| 457 | task_seccomp(m, p: task); |
| 458 | task_cpus_allowed(m, task); |
| 459 | cpuset_task_status_allowed(m, task); |
| 460 | task_context_switch_counts(m, p: task); |
| 461 | arch_proc_pid_thread_features(m, task); |
| 462 | return 0; |
| 463 | } |
| 464 | |
| 465 | static int do_task_stat(struct seq_file *m, struct pid_namespace *ns, |
| 466 | struct pid *pid, struct task_struct *task, int whole) |
| 467 | { |
| 468 | unsigned long vsize, eip, esp, wchan = 0; |
| 469 | int priority, nice; |
| 470 | int tty_pgrp = -1, tty_nr = 0; |
| 471 | sigset_t sigign, sigcatch; |
| 472 | char state; |
| 473 | pid_t ppid = 0, pgid = -1, sid = -1; |
| 474 | int num_threads = 0; |
| 475 | int permitted; |
| 476 | struct mm_struct *mm; |
| 477 | unsigned long long start_time; |
| 478 | unsigned long cmin_flt, cmaj_flt, min_flt, maj_flt; |
| 479 | u64 cutime, cstime, cgtime, utime, stime, gtime; |
| 480 | unsigned long = 0; |
| 481 | unsigned long flags; |
| 482 | int exit_code = task->exit_code; |
| 483 | struct signal_struct *sig = task->signal; |
| 484 | |
| 485 | state = *get_task_state(tsk: task); |
| 486 | vsize = eip = esp = 0; |
| 487 | permitted = ptrace_may_access(task, PTRACE_MODE_READ_FSCREDS | PTRACE_MODE_NOAUDIT); |
| 488 | mm = get_task_mm(task); |
| 489 | if (mm) { |
| 490 | vsize = task_vsize(mm); |
| 491 | /* |
| 492 | * esp and eip are intentionally zeroed out. There is no |
| 493 | * non-racy way to read them without freezing the task. |
| 494 | * Programs that need reliable values can use ptrace(2). |
| 495 | * |
| 496 | * The only exception is if the task is core dumping because |
| 497 | * a program is not able to use ptrace(2) in that case. It is |
| 498 | * safe because the task has stopped executing permanently. |
| 499 | */ |
| 500 | if (permitted && (task->flags & (PF_EXITING|PF_DUMPCORE|PF_POSTCOREDUMP))) { |
| 501 | if (try_get_task_stack(tsk: task)) { |
| 502 | eip = KSTK_EIP(task); |
| 503 | esp = KSTK_ESP(task); |
| 504 | put_task_stack(tsk: task); |
| 505 | } |
| 506 | } |
| 507 | } |
| 508 | |
| 509 | sigemptyset(set: &sigign); |
| 510 | sigemptyset(set: &sigcatch); |
| 511 | |
| 512 | if (lock_task_sighand(task, flags: &flags)) { |
| 513 | if (sig->tty) { |
| 514 | struct pid *pgrp = tty_get_pgrp(tty: sig->tty); |
| 515 | tty_pgrp = pid_nr_ns(pid: pgrp, ns); |
| 516 | put_pid(pid: pgrp); |
| 517 | tty_nr = new_encode_dev(dev: tty_devnum(tty: sig->tty)); |
| 518 | } |
| 519 | |
| 520 | num_threads = get_nr_threads(task); |
| 521 | collect_sigign_sigcatch(p: task, sigign: &sigign, sigcatch: &sigcatch); |
| 522 | |
| 523 | rsslim = READ_ONCE(sig->rlim[RLIMIT_RSS].rlim_cur); |
| 524 | |
| 525 | if (whole) { |
| 526 | if (sig->flags & (SIGNAL_GROUP_EXIT | SIGNAL_STOP_STOPPED)) |
| 527 | exit_code = sig->group_exit_code; |
| 528 | } |
| 529 | |
| 530 | sid = task_session_nr_ns(tsk: task, ns); |
| 531 | ppid = task_tgid_nr_ns(tsk: task->real_parent, ns); |
| 532 | pgid = task_pgrp_nr_ns(tsk: task, ns); |
| 533 | |
| 534 | unlock_task_sighand(task, flags: &flags); |
| 535 | } |
| 536 | |
| 537 | if (permitted && (!whole || num_threads < 2)) |
| 538 | wchan = !task_is_running(task); |
| 539 | |
| 540 | scoped_guard(rcu) { |
| 541 | scoped_seqlock_read (&sig->stats_lock, ss_lock_irqsave) { |
| 542 | cmin_flt = sig->cmin_flt; |
| 543 | cmaj_flt = sig->cmaj_flt; |
| 544 | cutime = sig->cutime; |
| 545 | cstime = sig->cstime; |
| 546 | cgtime = sig->cgtime; |
| 547 | |
| 548 | if (whole) { |
| 549 | struct task_struct *t; |
| 550 | |
| 551 | min_flt = sig->min_flt; |
| 552 | maj_flt = sig->maj_flt; |
| 553 | gtime = sig->gtime; |
| 554 | |
| 555 | __for_each_thread(sig, t) { |
| 556 | min_flt += t->min_flt; |
| 557 | maj_flt += t->maj_flt; |
| 558 | gtime += task_gtime(t); |
| 559 | } |
| 560 | } |
| 561 | } |
| 562 | } |
| 563 | |
| 564 | if (whole) { |
| 565 | thread_group_cputime_adjusted(p: task, ut: &utime, st: &stime); |
| 566 | } else { |
| 567 | task_cputime_adjusted(p: task, ut: &utime, st: &stime); |
| 568 | min_flt = task->min_flt; |
| 569 | maj_flt = task->maj_flt; |
| 570 | gtime = task_gtime(t: task); |
| 571 | } |
| 572 | |
| 573 | /* scale priority and nice values from timeslices to -20..20 */ |
| 574 | /* to make it look like a "normal" Unix priority/nice value */ |
| 575 | priority = task_prio(p: task); |
| 576 | nice = task_nice(p: task); |
| 577 | |
| 578 | /* apply timens offset for boottime and convert nsec -> ticks */ |
| 579 | start_time = |
| 580 | nsec_to_clock_t(x: timens_add_boottime_ns(nsec: task->start_boottime)); |
| 581 | |
| 582 | seq_put_decimal_ull(m, delimiter: "" , num: pid_nr_ns(pid, ns)); |
| 583 | seq_puts(m, s: " (" ); |
| 584 | proc_task_name(m, p: task, escape: false); |
| 585 | seq_puts(m, s: ") " ); |
| 586 | seq_putc(m, c: state); |
| 587 | seq_put_decimal_ll(m, delimiter: " " , num: ppid); |
| 588 | seq_put_decimal_ll(m, delimiter: " " , num: pgid); |
| 589 | seq_put_decimal_ll(m, delimiter: " " , num: sid); |
| 590 | seq_put_decimal_ll(m, delimiter: " " , num: tty_nr); |
| 591 | seq_put_decimal_ll(m, delimiter: " " , num: tty_pgrp); |
| 592 | seq_put_decimal_ull(m, delimiter: " " , num: task->flags); |
| 593 | seq_put_decimal_ull(m, delimiter: " " , num: min_flt); |
| 594 | seq_put_decimal_ull(m, delimiter: " " , num: cmin_flt); |
| 595 | seq_put_decimal_ull(m, delimiter: " " , num: maj_flt); |
| 596 | seq_put_decimal_ull(m, delimiter: " " , num: cmaj_flt); |
| 597 | seq_put_decimal_ull(m, delimiter: " " , num: nsec_to_clock_t(x: utime)); |
| 598 | seq_put_decimal_ull(m, delimiter: " " , num: nsec_to_clock_t(x: stime)); |
| 599 | seq_put_decimal_ll(m, delimiter: " " , num: nsec_to_clock_t(x: cutime)); |
| 600 | seq_put_decimal_ll(m, delimiter: " " , num: nsec_to_clock_t(x: cstime)); |
| 601 | seq_put_decimal_ll(m, delimiter: " " , num: priority); |
| 602 | seq_put_decimal_ll(m, delimiter: " " , num: nice); |
| 603 | seq_put_decimal_ll(m, delimiter: " " , num: num_threads); |
| 604 | seq_put_decimal_ull(m, delimiter: " " , num: 0); |
| 605 | seq_put_decimal_ull(m, delimiter: " " , num: start_time); |
| 606 | seq_put_decimal_ull(m, delimiter: " " , num: vsize); |
| 607 | seq_put_decimal_ull(m, delimiter: " " , num: mm ? get_mm_rss(mm) : 0); |
| 608 | seq_put_decimal_ull(m, delimiter: " " , num: rsslim); |
| 609 | seq_put_decimal_ull(m, delimiter: " " , num: mm ? (permitted ? mm->start_code : 1) : 0); |
| 610 | seq_put_decimal_ull(m, delimiter: " " , num: mm ? (permitted ? mm->end_code : 1) : 0); |
| 611 | seq_put_decimal_ull(m, delimiter: " " , num: (permitted && mm) ? mm->start_stack : 0); |
| 612 | seq_put_decimal_ull(m, delimiter: " " , num: esp); |
| 613 | seq_put_decimal_ull(m, delimiter: " " , num: eip); |
| 614 | /* The signal information here is obsolete. |
| 615 | * It must be decimal for Linux 2.0 compatibility. |
| 616 | * Use /proc/#/status for real-time signals. |
| 617 | */ |
| 618 | seq_put_decimal_ull(m, delimiter: " " , num: task->pending.signal.sig[0] & 0x7fffffffUL); |
| 619 | seq_put_decimal_ull(m, delimiter: " " , num: task->blocked.sig[0] & 0x7fffffffUL); |
| 620 | seq_put_decimal_ull(m, delimiter: " " , num: sigign.sig[0] & 0x7fffffffUL); |
| 621 | seq_put_decimal_ull(m, delimiter: " " , num: sigcatch.sig[0] & 0x7fffffffUL); |
| 622 | |
| 623 | /* |
| 624 | * We used to output the absolute kernel address, but that's an |
| 625 | * information leak - so instead we show a 0/1 flag here, to signal |
| 626 | * to user-space whether there's a wchan field in /proc/PID/wchan. |
| 627 | * |
| 628 | * This works with older implementations of procps as well. |
| 629 | */ |
| 630 | seq_put_decimal_ull(m, delimiter: " " , num: wchan); |
| 631 | |
| 632 | seq_put_decimal_ull(m, delimiter: " " , num: 0); |
| 633 | seq_put_decimal_ull(m, delimiter: " " , num: 0); |
| 634 | seq_put_decimal_ll(m, delimiter: " " , num: task->exit_signal); |
| 635 | seq_put_decimal_ll(m, delimiter: " " , num: task_cpu(p: task)); |
| 636 | seq_put_decimal_ull(m, delimiter: " " , num: task->rt_priority); |
| 637 | seq_put_decimal_ull(m, delimiter: " " , num: task->policy); |
| 638 | seq_put_decimal_ull(m, delimiter: " " , num: delayacct_blkio_ticks(tsk: task)); |
| 639 | seq_put_decimal_ull(m, delimiter: " " , num: nsec_to_clock_t(x: gtime)); |
| 640 | seq_put_decimal_ll(m, delimiter: " " , num: nsec_to_clock_t(x: cgtime)); |
| 641 | |
| 642 | if (mm && permitted) { |
| 643 | seq_put_decimal_ull(m, delimiter: " " , num: mm->start_data); |
| 644 | seq_put_decimal_ull(m, delimiter: " " , num: mm->end_data); |
| 645 | seq_put_decimal_ull(m, delimiter: " " , num: mm->start_brk); |
| 646 | seq_put_decimal_ull(m, delimiter: " " , num: mm->arg_start); |
| 647 | seq_put_decimal_ull(m, delimiter: " " , num: mm->arg_end); |
| 648 | seq_put_decimal_ull(m, delimiter: " " , num: mm->env_start); |
| 649 | seq_put_decimal_ull(m, delimiter: " " , num: mm->env_end); |
| 650 | } else |
| 651 | seq_puts(m, s: " 0 0 0 0 0 0 0" ); |
| 652 | |
| 653 | if (permitted) |
| 654 | seq_put_decimal_ll(m, delimiter: " " , num: exit_code); |
| 655 | else |
| 656 | seq_puts(m, s: " 0" ); |
| 657 | |
| 658 | seq_putc(m, c: '\n'); |
| 659 | if (mm) |
| 660 | mmput(mm); |
| 661 | return 0; |
| 662 | } |
| 663 | |
/*
 * Per-thread stat record: do_task_stat() with whole == 0, so values
 * describe @task alone.
 */
int proc_tid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 0);
}
| 669 | |
/*
 * Thread-group stat record: do_task_stat() with whole == 1, so counters
 * are aggregated over the thread group.
 */
int proc_tgid_stat(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	return do_task_stat(m, ns, pid, task, 1);
}
| 675 | |
/*
 * Produce the statm record for @task into @m: seven space-separated
 * numbers (size, resident, shared, text, 0, data, 0) and a newline.
 *
 * When the task has no mm, a line of seven zeros is written instead.
 * Always returns 0.
 */
int proc_pid_statm(struct seq_file *m, struct pid_namespace *ns,
			struct pid *pid, struct task_struct *task)
{
	struct mm_struct *mm = get_task_mm(task);

	if (mm) {
		unsigned long size;
		unsigned long resident = 0;
		unsigned long shared = 0;
		unsigned long text = 0;
		unsigned long data = 0;

		size = task_statm(mm, &shared, &text, &data, &resident);
		/* Values are already copied out; the mm is not needed to print. */
		mmput(mm);

		/*
		 * For quick read, open code by putting numbers directly
		 * expected format is
		 * seq_printf(m, "%lu %lu %lu %lu 0 %lu 0\n",
		 *               size, resident, shared, text, data);
		 */
		seq_put_decimal_ull(m, "", size);
		seq_put_decimal_ull(m, " ", resident);
		seq_put_decimal_ull(m, " ", shared);
		seq_put_decimal_ull(m, " ", text);
		seq_put_decimal_ull(m, " ", 0);
		seq_put_decimal_ull(m, " ", data);
		seq_put_decimal_ull(m, " ", 0);
		seq_putc(m, '\n');
	} else {
		seq_write(m, "0 0 0 0 0 0 0\n", 14);
	}
	return 0;
}
| 710 | |
| 711 | #ifdef CONFIG_PROC_CHILDREN |
| 712 | static struct pid * |
| 713 | get_children_pid(struct inode *inode, struct pid *pid_prev, loff_t pos) |
| 714 | { |
| 715 | struct task_struct *start, *task; |
| 716 | struct pid *pid = NULL; |
| 717 | |
| 718 | read_lock(&tasklist_lock); |
| 719 | |
| 720 | start = pid_task(pid: proc_pid(inode), PIDTYPE_PID); |
| 721 | if (!start) |
| 722 | goto out; |
| 723 | |
| 724 | /* |
| 725 | * Lets try to continue searching first, this gives |
| 726 | * us significant speedup on children-rich processes. |
| 727 | */ |
| 728 | if (pid_prev) { |
| 729 | task = pid_task(pid: pid_prev, PIDTYPE_PID); |
| 730 | if (task && task->real_parent == start && |
| 731 | !(list_empty(head: &task->sibling))) { |
| 732 | if (list_is_last(list: &task->sibling, head: &start->children)) |
| 733 | goto out; |
| 734 | task = list_first_entry(&task->sibling, |
| 735 | struct task_struct, sibling); |
| 736 | pid = get_pid(pid: task_pid(task)); |
| 737 | goto out; |
| 738 | } |
| 739 | } |
| 740 | |
| 741 | /* |
| 742 | * Slow search case. |
| 743 | * |
| 744 | * We might miss some children here if children |
| 745 | * are exited while we were not holding the lock, |
| 746 | * but it was never promised to be accurate that |
| 747 | * much. |
| 748 | * |
| 749 | * "Just suppose that the parent sleeps, but N children |
| 750 | * exit after we printed their tids. Now the slow paths |
| 751 | * skips N extra children, we miss N tasks." (c) |
| 752 | * |
| 753 | * So one need to stop or freeze the leader and all |
| 754 | * its children to get a precise result. |
| 755 | */ |
| 756 | list_for_each_entry(task, &start->children, sibling) { |
| 757 | if (pos-- == 0) { |
| 758 | pid = get_pid(pid: task_pid(task)); |
| 759 | break; |
| 760 | } |
| 761 | } |
| 762 | |
| 763 | out: |
| 764 | read_unlock(&tasklist_lock); |
| 765 | return pid; |
| 766 | } |
| 767 | |
| 768 | static int children_seq_show(struct seq_file *seq, void *v) |
| 769 | { |
| 770 | struct inode *inode = file_inode(f: seq->file); |
| 771 | |
| 772 | seq_printf(m: seq, fmt: "%d " , pid_nr_ns(pid: v, ns: proc_pid_ns(sb: inode->i_sb))); |
| 773 | return 0; |
| 774 | } |
| 775 | |
| 776 | static void *children_seq_start(struct seq_file *seq, loff_t *pos) |
| 777 | { |
| 778 | return get_children_pid(inode: file_inode(f: seq->file), NULL, pos: *pos); |
| 779 | } |
| 780 | |
| 781 | static void *children_seq_next(struct seq_file *seq, void *v, loff_t *pos) |
| 782 | { |
| 783 | struct pid *pid; |
| 784 | |
| 785 | pid = get_children_pid(inode: file_inode(f: seq->file), pid_prev: v, pos: *pos + 1); |
| 786 | put_pid(pid: v); |
| 787 | |
| 788 | ++*pos; |
| 789 | return pid; |
| 790 | } |
| 791 | |
/* seq_file ->stop: drop the reference held on the current pid @v. */
static void children_seq_stop(struct seq_file *seq, void *v)
{
	put_pid(v);
}
| 796 | |
| 797 | static const struct seq_operations children_seq_ops = { |
| 798 | .start = children_seq_start, |
| 799 | .next = children_seq_next, |
| 800 | .stop = children_seq_stop, |
| 801 | .show = children_seq_show, |
| 802 | }; |
| 803 | |
| 804 | static int children_seq_open(struct inode *inode, struct file *file) |
| 805 | { |
| 806 | return seq_open(file, &children_seq_ops); |
| 807 | } |
| 808 | |
| 809 | const struct file_operations proc_tid_children_operations = { |
| 810 | .open = children_seq_open, |
| 811 | .read = seq_read, |
| 812 | .llseek = seq_lseek, |
| 813 | .release = seq_release, |
| 814 | }; |
| 815 | #endif /* CONFIG_PROC_CHILDREN */ |
| 816 | |