2 * linux/fs/proc/array.c
4 * Copyright (C) 1992 by Linus Torvalds
5 * based on ideas by Darren Senn
8 * Michael. K. Johnson: stat,statm extensions.
9 * <johnsonm@stolaf.edu>
11 * Pauline Middelink : Made cmdline,envline only break at '\0's, to
12 * make sure SET_PROCTITLE works. Also removed
13 * bad '!' which forced address recalculation for
14 * EVERY character on the current page.
15 * <middelin@polyware.iaf.nl>
17 * Danny ter Haar : added cpuinfo
20 * Alessandro Rubini : profile extension.
21 * <rubini@ipvvis.unipv.it>
23 * Jeff Tranter : added BogoMips field to cpuinfo
24 * <Jeff_Tranter@Mitel.COM>
26 * Bruno Haible : remove 4K limit for the maps file
27 * <haible@ma2s2.mathematik.uni-karlsruhe.de>
29 * Yves Arrouye : remove removal of trailing spaces in get_array.
30 * <Yves.Arrouye@marin.fdn.fr>
32 * Jerome Forissier : added per-CPU time information to /proc/stat
33 * and /proc/<pid>/cpu extension
34 * <forissier@isia.cma.fr>
35 * - Incorporation and non-SMP safe operation
36 * of forissier patch in 2.1.78 by
37 * Hans Marcus <crowbar@concepts.nl>
39 * aeb@cwi.nl : /proc/partitions
42 * Alan Cox : security fixes.
43 * <alan@lxorguk.ukuu.org.uk>
45 * Al Viro : safe handling of mm_struct
47 * Gerhard Wichert : added BIGMEM support
48 * Siemens AG <Gerhard.Wichert@pdb.siemens.de>
50 * Al Viro & Jeff Garzik : moved most of the thing into base.c and
51 * : proc_misc.c. The rest may eventually go into
55 #include <linux/types.h>
56 #include <linux/errno.h>
57 #include <linux/time.h>
58 #include <linux/kernel.h>
59 #include <linux/kernel_stat.h>
60 #include <linux/tty.h>
61 #include <linux/string.h>
62 #include <linux/mman.h>
63 #include <linux/proc_fs.h>
64 #include <linux/ioport.h>
65 #include <linux/uaccess.h>
68 #include <linux/hugetlb.h>
69 #include <linux/pagemap.h>
70 #include <linux/swap.h>
71 #include <linux/slab.h>
72 #include <linux/smp.h>
73 #include <linux/signal.h>
74 #include <linux/highmem.h>
75 #include <linux/file.h>
76 #include <linux/fdtable.h>
77 #include <linux/times.h>
78 #include <linux/cpuset.h>
79 #include <linux/rcupdate.h>
80 #include <linux/delayacct.h>
81 #include <linux/seq_file.h>
82 #include <linux/pid_namespace.h>
83 #include <linux/ptrace.h>
84 #include <linux/tracehook.h>
85 #include <linux/swapops.h>
87 #include <asm/pgtable.h>
88 #include <asm/processor.h>
91 static inline void task_name(struct seq_file
*m
, struct task_struct
*p
)
96 char tcomm
[sizeof(p
->comm
)];
98 get_task_comm(tcomm
, p
);
100 seq_printf(m
, "Name:\t");
101 end
= m
->buf
+ m
->size
;
102 buf
= m
->buf
+ m
->count
;
105 while (i
&& (buf
< end
)) {
106 unsigned char c
= *name
;
126 m
->count
= buf
- m
->buf
;
131 * The task state array is a strange "bitmap" of
132 * reasons to sleep. Thus "running" is zero, and
133 * you can test for combinations of others with
136 static const char *task_state_array
[] = {
137 "R (running)", /* 0 */
138 "S (sleeping)", /* 1 */
139 "D (disk sleep)", /* 2 */
140 "T (stopped)", /* 4 */
141 "T (tracing stop)", /* 8 */
142 "Z (zombie)", /* 16 */
146 static inline const char *get_task_state(struct task_struct
*tsk
)
148 unsigned int state
= (tsk
->state
& TASK_REPORT
) | tsk
->exit_state
;
149 const char **p
= &task_state_array
[0];
158 static inline void task_state(struct seq_file
*m
, struct pid_namespace
*ns
,
159 struct pid
*pid
, struct task_struct
*p
)
161 struct group_info
*group_info
;
163 struct fdtable
*fdt
= NULL
;
164 const struct cred
*cred
;
168 ppid
= pid_alive(p
) ?
169 task_tgid_nr_ns(rcu_dereference(p
->real_parent
), ns
) : 0;
172 struct task_struct
*tracer
= tracehook_tracer_task(p
);
174 tpid
= task_pid_nr_ns(tracer
, ns
);
176 cred
= get_cred((struct cred
*) __task_cred(p
));
183 "Uid:\t%d\t%d\t%d\t%d\n"
184 "Gid:\t%d\t%d\t%d\t%d\n",
186 task_tgid_nr_ns(p
, ns
),
189 cred
->uid
, cred
->euid
, cred
->suid
, cred
->fsuid
,
190 cred
->gid
, cred
->egid
, cred
->sgid
, cred
->fsgid
);
194 fdt
= files_fdtable(p
->files
);
198 fdt
? fdt
->max_fds
: 0);
201 group_info
= cred
->group_info
;
204 for (g
= 0; g
< min(group_info
->ngroups
, NGROUPS_SMALL
); g
++)
205 seq_printf(m
, "%d ", GROUP_AT(group_info
, g
));
211 static void render_sigset_t(struct seq_file
*m
, const char *header
,
216 seq_printf(m
, "%s", header
);
223 if (sigismember(set
, i
+1)) x
|= 1;
224 if (sigismember(set
, i
+2)) x
|= 2;
225 if (sigismember(set
, i
+3)) x
|= 4;
226 if (sigismember(set
, i
+4)) x
|= 8;
227 seq_printf(m
, "%x", x
);
233 static void collect_sigign_sigcatch(struct task_struct
*p
, sigset_t
*ign
,
236 struct k_sigaction
*k
;
239 k
= p
->sighand
->action
;
240 for (i
= 1; i
<= _NSIG
; ++i
, ++k
) {
241 if (k
->sa
.sa_handler
== SIG_IGN
)
243 else if (k
->sa
.sa_handler
!= SIG_DFL
)
248 static inline void task_sig(struct seq_file
*m
, struct task_struct
*p
)
251 sigset_t pending
, shpending
, blocked
, ignored
, caught
;
253 unsigned long qsize
= 0;
254 unsigned long qlim
= 0;
256 sigemptyset(&pending
);
257 sigemptyset(&shpending
);
258 sigemptyset(&blocked
);
259 sigemptyset(&ignored
);
260 sigemptyset(&caught
);
262 if (lock_task_sighand(p
, &flags
)) {
263 pending
= p
->pending
.signal
;
264 shpending
= p
->signal
->shared_pending
.signal
;
265 blocked
= p
->blocked
;
266 collect_sigign_sigcatch(p
, &ignored
, &caught
);
267 num_threads
= atomic_read(&p
->signal
->count
);
268 qsize
= atomic_read(&__task_cred(p
)->user
->sigpending
);
269 qlim
= p
->signal
->rlim
[RLIMIT_SIGPENDING
].rlim_cur
;
270 unlock_task_sighand(p
, &flags
);
273 seq_printf(m
, "Threads:\t%d\n", num_threads
);
274 seq_printf(m
, "SigQ:\t%lu/%lu\n", qsize
, qlim
);
276 /* render them all */
277 render_sigset_t(m
, "SigPnd:\t", &pending
);
278 render_sigset_t(m
, "ShdPnd:\t", &shpending
);
279 render_sigset_t(m
, "SigBlk:\t", &blocked
);
280 render_sigset_t(m
, "SigIgn:\t", &ignored
);
281 render_sigset_t(m
, "SigCgt:\t", &caught
);
284 static void render_cap_t(struct seq_file
*m
, const char *header
,
289 seq_printf(m
, "%s", header
);
290 CAP_FOR_EACH_U32(__capi
) {
291 seq_printf(m
, "%08x",
292 a
->cap
[(_KERNEL_CAPABILITY_U32S
-1) - __capi
]);
297 static inline void task_cap(struct seq_file
*m
, struct task_struct
*p
)
299 const struct cred
*cred
;
300 kernel_cap_t cap_inheritable
, cap_permitted
, cap_effective
, cap_bset
;
303 cred
= __task_cred(p
);
304 cap_inheritable
= cred
->cap_inheritable
;
305 cap_permitted
= cred
->cap_permitted
;
306 cap_effective
= cred
->cap_effective
;
307 cap_bset
= cred
->cap_bset
;
310 render_cap_t(m
, "CapInh:\t", &cap_inheritable
);
311 render_cap_t(m
, "CapPrm:\t", &cap_permitted
);
312 render_cap_t(m
, "CapEff:\t", &cap_effective
);
313 render_cap_t(m
, "CapBnd:\t", &cap_bset
);
316 static inline void task_context_switch_counts(struct seq_file
*m
,
317 struct task_struct
*p
)
319 seq_printf(m
, "voluntary_ctxt_switches:\t%lu\n"
320 "nonvoluntary_ctxt_switches:\t%lu\n",
326 struct vm_area_struct
*vma
;
327 unsigned long startpage
;
331 static int stack_usage_pte_range(pmd_t
*pmd
, unsigned long addr
,
332 unsigned long end
, struct mm_walk
*walk
)
334 struct stack_stats
*ss
= walk
->private;
335 struct vm_area_struct
*vma
= ss
->vma
;
340 pte
= pte_offset_map_lock(vma
->vm_mm
, pmd
, addr
, &ptl
);
341 for (; addr
!= end
; pte
++, addr
+= PAGE_SIZE
) {
344 #ifdef CONFIG_STACK_GROWSUP
345 if (pte_present(ptent
) || is_swap_pte(ptent
))
346 ss
->usage
= addr
- ss
->startpage
+ PAGE_SIZE
;
348 if (pte_present(ptent
) || is_swap_pte(ptent
)) {
349 ss
->usage
= ss
->startpage
- addr
+ PAGE_SIZE
;
356 pte_unmap_unlock(pte
- 1, ptl
);
361 static inline unsigned long get_stack_usage_in_bytes(struct vm_area_struct
*vma
,
362 struct task_struct
*task
)
364 struct stack_stats ss
;
365 struct mm_walk stack_walk
= {
366 .pmd_entry
= stack_usage_pte_range
,
371 if (!vma
->vm_mm
|| is_vm_hugetlb_page(vma
))
375 ss
.startpage
= task
->stack_start
& PAGE_MASK
;
378 #ifdef CONFIG_STACK_GROWSUP
379 walk_page_range(KSTK_ESP(task
) & PAGE_MASK
, vma
->vm_end
,
382 walk_page_range(vma
->vm_start
, (KSTK_ESP(task
) & PAGE_MASK
) + PAGE_SIZE
,
388 static inline void task_show_stack_usage(struct seq_file
*m
,
389 struct task_struct
*task
)
391 struct vm_area_struct
*vma
;
392 struct mm_struct
*mm
= get_task_mm(task
);
395 down_read(&mm
->mmap_sem
);
396 vma
= find_vma(mm
, task
->stack_start
);
398 seq_printf(m
, "Stack usage:\t%lu kB\n",
399 get_stack_usage_in_bytes(vma
, task
) >> 10);
401 up_read(&mm
->mmap_sem
);
406 int proc_pid_status(struct seq_file
*m
, struct pid_namespace
*ns
,
407 struct pid
*pid
, struct task_struct
*task
)
409 struct mm_struct
*mm
= get_task_mm(task
);
412 task_state(m
, ns
, pid
, task
);
420 cpuset_task_status_allowed(m
, task
);
421 #if defined(CONFIG_S390)
422 task_show_regs(m
, task
);
424 task_context_switch_counts(m
, task
);
425 task_show_stack_usage(m
, task
);
429 static int do_task_stat(struct seq_file
*m
, struct pid_namespace
*ns
,
430 struct pid
*pid
, struct task_struct
*task
, int whole
)
432 unsigned long vsize
, eip
, esp
, wchan
= ~0UL;
434 int tty_pgrp
= -1, tty_nr
= 0;
435 sigset_t sigign
, sigcatch
;
437 pid_t ppid
= 0, pgid
= -1, sid
= -1;
440 struct mm_struct
*mm
;
441 unsigned long long start_time
;
442 unsigned long cmin_flt
= 0, cmaj_flt
= 0;
443 unsigned long min_flt
= 0, maj_flt
= 0;
444 cputime_t cutime
, cstime
, utime
, stime
;
445 cputime_t cgtime
, gtime
;
446 unsigned long rsslim
= 0;
447 char tcomm
[sizeof(task
->comm
)];
450 state
= *get_task_state(task
);
451 vsize
= eip
= esp
= 0;
452 permitted
= ptrace_may_access(task
, PTRACE_MODE_READ
);
453 mm
= get_task_mm(task
);
455 vsize
= task_vsize(mm
);
457 eip
= KSTK_EIP(task
);
458 esp
= KSTK_ESP(task
);
462 get_task_comm(tcomm
, task
);
464 sigemptyset(&sigign
);
465 sigemptyset(&sigcatch
);
466 cutime
= cstime
= utime
= stime
= cputime_zero
;
467 cgtime
= gtime
= cputime_zero
;
469 if (lock_task_sighand(task
, &flags
)) {
470 struct signal_struct
*sig
= task
->signal
;
473 struct pid
*pgrp
= tty_get_pgrp(sig
->tty
);
474 tty_pgrp
= pid_nr_ns(pgrp
, ns
);
476 tty_nr
= new_encode_dev(tty_devnum(sig
->tty
));
479 num_threads
= atomic_read(&sig
->count
);
480 collect_sigign_sigcatch(task
, &sigign
, &sigcatch
);
482 cmin_flt
= sig
->cmin_flt
;
483 cmaj_flt
= sig
->cmaj_flt
;
484 cutime
= sig
->cutime
;
485 cstime
= sig
->cstime
;
486 cgtime
= sig
->cgtime
;
487 rsslim
= sig
->rlim
[RLIMIT_RSS
].rlim_cur
;
489 /* add up live thread stats at the group level */
491 struct task_cputime cputime
;
492 struct task_struct
*t
= task
;
494 min_flt
+= t
->min_flt
;
495 maj_flt
+= t
->maj_flt
;
496 gtime
= cputime_add(gtime
, task_gtime(t
));
500 min_flt
+= sig
->min_flt
;
501 maj_flt
+= sig
->maj_flt
;
502 thread_group_cputime(task
, &cputime
);
503 utime
= cputime
.utime
;
504 stime
= cputime
.stime
;
505 gtime
= cputime_add(gtime
, sig
->gtime
);
508 sid
= task_session_nr_ns(task
, ns
);
509 ppid
= task_tgid_nr_ns(task
->real_parent
, ns
);
510 pgid
= task_pgrp_nr_ns(task
, ns
);
512 unlock_task_sighand(task
, &flags
);
515 if (permitted
&& (!whole
|| num_threads
< 2))
516 wchan
= get_wchan(task
);
518 min_flt
= task
->min_flt
;
519 maj_flt
= task
->maj_flt
;
520 utime
= task_utime(task
);
521 stime
= task_stime(task
);
522 gtime
= task_gtime(task
);
525 /* scale priority and nice values from timeslices to -20..20 */
526 /* to make it look like a "normal" Unix priority/nice value */
527 priority
= task_prio(task
);
528 nice
= task_nice(task
);
530 /* Temporary variable needed for gcc-2.96 */
531 /* convert timespec -> nsec*/
533 (unsigned long long)task
->real_start_time
.tv_sec
* NSEC_PER_SEC
534 + task
->real_start_time
.tv_nsec
;
535 /* convert nsec -> ticks */
536 start_time
= nsec_to_clock_t(start_time
);
538 seq_printf(m
, "%d (%s) %c %d %d %d %d %d %u %lu \
539 %lu %lu %lu %lu %lu %ld %ld %ld %ld %d 0 %llu %lu %ld %lu %lu %lu %lu %lu \
540 %lu %lu %lu %lu %lu %lu %lu %lu %d %d %u %u %llu %lu %ld\n",
554 cputime_to_clock_t(utime
),
555 cputime_to_clock_t(stime
),
556 cputime_to_clock_t(cutime
),
557 cputime_to_clock_t(cstime
),
563 mm
? get_mm_rss(mm
) : 0,
565 mm
? mm
->start_code
: 0,
566 mm
? mm
->end_code
: 0,
567 (permitted
) ? task
->stack_start
: 0,
570 /* The signal information here is obsolete.
571 * It must be decimal for Linux 2.0 compatibility.
572 * Use /proc/#/status for real-time signals.
574 task
->pending
.signal
.sig
[0] & 0x7fffffffUL
,
575 task
->blocked
.sig
[0] & 0x7fffffffUL
,
576 sigign
.sig
[0] & 0x7fffffffUL
,
577 sigcatch
.sig
[0] & 0x7fffffffUL
,
585 (unsigned long long)delayacct_blkio_ticks(task
),
586 cputime_to_clock_t(gtime
),
587 cputime_to_clock_t(cgtime
));
593 int proc_tid_stat(struct seq_file
*m
, struct pid_namespace
*ns
,
594 struct pid
*pid
, struct task_struct
*task
)
596 return do_task_stat(m
, ns
, pid
, task
, 0);
599 int proc_tgid_stat(struct seq_file
*m
, struct pid_namespace
*ns
,
600 struct pid
*pid
, struct task_struct
*task
)
602 return do_task_stat(m
, ns
, pid
, task
, 1);
605 int proc_pid_statm(struct seq_file
*m
, struct pid_namespace
*ns
,
606 struct pid
*pid
, struct task_struct
*task
)
608 int size
= 0, resident
= 0, shared
= 0, text
= 0, lib
= 0, data
= 0;
609 struct mm_struct
*mm
= get_task_mm(task
);
612 size
= task_statm(mm
, &shared
, &text
, &data
, &resident
);
615 seq_printf(m
, "%d %d %d %d %d %d %d\n",
616 size
, resident
, shared
, text
, lib
, data
, 0);