/*
 * linux/kernel/ptrace.c
 *
 * (C) Copyright 1999 Linus Torvalds
 *
 * Common interfaces for "ptrace()" which we do not want
 * to continually duplicate across every architecture.
 */
10 #include <linux/capability.h>
11 #include <linux/module.h>
12 #include <linux/sched.h>
13 #include <linux/errno.h>
15 #include <linux/highmem.h>
16 #include <linux/pagemap.h>
17 #include <linux/smp_lock.h>
18 #include <linux/ptrace.h>
19 #include <linux/security.h>
20 #include <linux/signal.h>
21 #include <linux/audit.h>
22 #include <linux/pid_namespace.h>
23 #include <linux/syscalls.h>
24 #include <linux/uaccess.h>
28 * ptrace a task: make the debugger its new parent and
29 * move it to the ptrace list.
31 * Must be called with the tasklist lock write-held.
33 void __ptrace_link(struct task_struct
*child
, struct task_struct
*new_parent
)
35 BUG_ON(!list_empty(&child
->ptrace_entry
));
36 list_add(&child
->ptrace_entry
, &new_parent
->ptraced
);
37 child
->parent
= new_parent
;
41 * Turn a tracing stop into a normal stop now, since with no tracer there
42 * would be no way to wake it up with SIGCONT or SIGKILL. If there was a
43 * signal sent that would resume the child, but didn't because it was in
44 * TASK_TRACED, resume it now.
45 * Requires that irqs be disabled.
47 static void ptrace_untrace(struct task_struct
*child
)
49 spin_lock(&child
->sighand
->siglock
);
50 if (task_is_traced(child
)) {
52 * If the group stop is completed or in progress,
53 * this thread was already counted as stopped.
55 if (child
->signal
->flags
& SIGNAL_STOP_STOPPED
||
56 child
->signal
->group_stop_count
)
57 __set_task_state(child
, TASK_STOPPED
);
59 signal_wake_up(child
, 1);
61 spin_unlock(&child
->sighand
->siglock
);
/*
 * unptrace a task: move it back to its original parent and
 * remove it from the ptrace list.
 *
 * Must be called with the tasklist lock write-held.
 */
70 void __ptrace_unlink(struct task_struct
*child
)
72 BUG_ON(!child
->ptrace
);
75 child
->parent
= child
->real_parent
;
76 list_del_init(&child
->ptrace_entry
);
78 arch_ptrace_untrace(child
);
79 if (task_is_traced(child
))
80 ptrace_untrace(child
);
84 * Check that we have indeed attached to the thing..
86 int ptrace_check_attach(struct task_struct
*child
, int kill
)
91 * We take the read lock around doing both checks to close a
92 * possible race where someone else was tracing our child and
93 * detached between these two checks. After this locked check,
94 * we are sure that this is our traced child and that can only
95 * be changed by us so it's not changing right after this.
97 read_lock(&tasklist_lock
);
98 if ((child
->ptrace
& PT_PTRACED
) && child
->parent
== current
) {
101 * child->sighand can't be NULL, release_task()
102 * does ptrace_unlink() before __exit_signal().
104 spin_lock_irq(&child
->sighand
->siglock
);
105 if (task_is_stopped(child
))
106 child
->state
= TASK_TRACED
;
107 else if (!task_is_traced(child
) && !kill
)
109 spin_unlock_irq(&child
->sighand
->siglock
);
111 read_unlock(&tasklist_lock
);
114 ret
= wait_task_inactive(child
, TASK_TRACED
) ? 0 : -ESRCH
;
116 /* All systems go.. */
120 int __ptrace_may_access(struct task_struct
*task
, unsigned int mode
)
122 const struct cred
*cred
= current_cred(), *tcred
;
124 /* May we inspect the given task?
125 * This check is used both for attaching with ptrace
126 * and for allowing access to sensitive information in /proc.
128 * ptrace_attach denies several cases that /proc allows
129 * because setting up the necessary parent/child relationship
130 * or halting the specified task is impossible.
133 /* Don't let security modules deny introspection */
137 tcred
= __task_cred(task
);
138 if ((cred
->uid
!= tcred
->euid
||
139 cred
->uid
!= tcred
->suid
||
140 cred
->uid
!= tcred
->uid
||
141 cred
->gid
!= tcred
->egid
||
142 cred
->gid
!= tcred
->sgid
||
143 cred
->gid
!= tcred
->gid
) &&
144 !capable(CAP_SYS_PTRACE
)) {
151 dumpable
= get_dumpable(task
->mm
);
152 if (!dumpable
&& !capable(CAP_SYS_PTRACE
))
155 return security_ptrace_may_access(task
, mode
);
158 bool ptrace_may_access(struct task_struct
*task
, unsigned int mode
)
162 err
= __ptrace_may_access(task
, mode
);
167 int ptrace_attach(struct task_struct
*task
)
175 if (same_thread_group(task
, current
))
178 /* Protect the target's credential calculations against our
179 * interference; SUID, SGID and LSM creds get determined differently
182 retval
= mutex_lock_interruptible(&task
->cred_guard_mutex
);
191 * We want to hold both the task-lock and the
192 * tasklist_lock for writing at the same time.
193 * But that's against the rules (tasklist_lock
194 * is taken for reading by interrupts on other
195 * cpu's that may have task_lock).
198 if (!write_trylock_irqsave(&tasklist_lock
, flags
)) {
202 } while (!write_can_lock(&tasklist_lock
));
208 /* the same process cannot be attached many times */
209 if (task
->ptrace
& PT_PTRACED
)
211 retval
= __ptrace_may_access(task
, PTRACE_MODE_ATTACH
);
216 task
->ptrace
|= PT_PTRACED
;
217 if (capable(CAP_SYS_PTRACE
))
218 task
->ptrace
|= PT_PTRACE_CAP
;
220 __ptrace_link(task
, current
);
222 send_sig_info(SIGSTOP
, SEND_SIG_FORCED
, task
);
224 write_unlock_irqrestore(&tasklist_lock
, flags
);
226 mutex_unlock(&task
->cred_guard_mutex
);
232 * Called with irqs disabled, returns true if childs should reap themselves.
234 static int ignoring_children(struct sighand_struct
*sigh
)
237 spin_lock(&sigh
->siglock
);
238 ret
= (sigh
->action
[SIGCHLD
-1].sa
.sa_handler
== SIG_IGN
) ||
239 (sigh
->action
[SIGCHLD
-1].sa
.sa_flags
& SA_NOCLDWAIT
);
240 spin_unlock(&sigh
->siglock
);
/*
 * Called with tasklist_lock held for writing.
 * Unlink a traced task, and clean it up if it was a traced zombie.
 * Return true if it needs to be reaped with release_task().
 * (We can't call release_task() here because we already hold tasklist_lock.)
 *
 * If it's a zombie, our attachedness prevented normal parent notification
 * or self-reaping.  Do notification now if it would have happened earlier.
 * If it should reap itself, return true.
 *
 * If it's our own child, there is no notification to do.
 * But if our normal children self-reap, then this child
 * was prevented by ptrace and we must reap it now.
 */
258 static bool __ptrace_detach(struct task_struct
*tracer
, struct task_struct
*p
)
262 if (p
->exit_state
== EXIT_ZOMBIE
) {
263 if (!task_detached(p
) && thread_group_empty(p
)) {
264 if (!same_thread_group(p
->real_parent
, tracer
))
265 do_notify_parent(p
, p
->exit_signal
);
266 else if (ignoring_children(tracer
->sighand
))
269 if (task_detached(p
)) {
270 /* Mark it as in the process of being reaped. */
271 p
->exit_state
= EXIT_DEAD
;
279 int ptrace_detach(struct task_struct
*child
, unsigned int data
)
283 if (!valid_signal(data
))
286 /* Architecture-specific hardware disable .. */
287 ptrace_disable(child
);
288 clear_tsk_thread_flag(child
, TIF_SYSCALL_TRACE
);
290 write_lock_irq(&tasklist_lock
);
292 * This child can be already killed. Make sure de_thread() or
293 * our sub-thread doing do_wait() didn't do release_task() yet.
296 child
->exit_code
= data
;
297 dead
= __ptrace_detach(current
, child
);
298 if (!child
->exit_state
)
299 wake_up_process(child
);
301 write_unlock_irq(&tasklist_lock
);
/*
 * Detach all tasks we were using ptrace on.
 */
312 void exit_ptrace(struct task_struct
*tracer
)
314 struct task_struct
*p
, *n
;
315 LIST_HEAD(ptrace_dead
);
317 write_lock_irq(&tasklist_lock
);
318 list_for_each_entry_safe(p
, n
, &tracer
->ptraced
, ptrace_entry
) {
319 if (__ptrace_detach(tracer
, p
))
320 list_add(&p
->ptrace_entry
, &ptrace_dead
);
322 write_unlock_irq(&tasklist_lock
);
324 BUG_ON(!list_empty(&tracer
->ptraced
));
326 list_for_each_entry_safe(p
, n
, &ptrace_dead
, ptrace_entry
) {
327 list_del_init(&p
->ptrace_entry
);
332 int ptrace_readdata(struct task_struct
*tsk
, unsigned long src
, char __user
*dst
, int len
)
338 int this_len
, retval
;
340 this_len
= (len
> sizeof(buf
)) ? sizeof(buf
) : len
;
341 retval
= access_process_vm(tsk
, src
, buf
, this_len
, 0);
347 if (copy_to_user(dst
, buf
, retval
))
357 int ptrace_writedata(struct task_struct
*tsk
, char __user
*src
, unsigned long dst
, int len
)
363 int this_len
, retval
;
365 this_len
= (len
> sizeof(buf
)) ? sizeof(buf
) : len
;
366 if (copy_from_user(buf
, src
, this_len
))
368 retval
= access_process_vm(tsk
, dst
, buf
, this_len
, 1);
382 static int ptrace_setoptions(struct task_struct
*child
, long data
)
384 child
->ptrace
&= ~PT_TRACE_MASK
;
386 if (data
& PTRACE_O_TRACESYSGOOD
)
387 child
->ptrace
|= PT_TRACESYSGOOD
;
389 if (data
& PTRACE_O_TRACEFORK
)
390 child
->ptrace
|= PT_TRACE_FORK
;
392 if (data
& PTRACE_O_TRACEVFORK
)
393 child
->ptrace
|= PT_TRACE_VFORK
;
395 if (data
& PTRACE_O_TRACECLONE
)
396 child
->ptrace
|= PT_TRACE_CLONE
;
398 if (data
& PTRACE_O_TRACEEXEC
)
399 child
->ptrace
|= PT_TRACE_EXEC
;
401 if (data
& PTRACE_O_TRACEVFORKDONE
)
402 child
->ptrace
|= PT_TRACE_VFORK_DONE
;
404 if (data
& PTRACE_O_TRACEEXIT
)
405 child
->ptrace
|= PT_TRACE_EXIT
;
407 return (data
& ~PTRACE_O_MASK
) ? -EINVAL
: 0;
410 static int ptrace_getsiginfo(struct task_struct
*child
, siginfo_t
*info
)
414 read_lock(&tasklist_lock
);
415 if (likely(child
->sighand
!= NULL
)) {
417 spin_lock_irq(&child
->sighand
->siglock
);
418 if (likely(child
->last_siginfo
!= NULL
)) {
419 *info
= *child
->last_siginfo
;
422 spin_unlock_irq(&child
->sighand
->siglock
);
424 read_unlock(&tasklist_lock
);
428 static int ptrace_setsiginfo(struct task_struct
*child
, const siginfo_t
*info
)
432 read_lock(&tasklist_lock
);
433 if (likely(child
->sighand
!= NULL
)) {
435 spin_lock_irq(&child
->sighand
->siglock
);
436 if (likely(child
->last_siginfo
!= NULL
)) {
437 *child
->last_siginfo
= *info
;
440 spin_unlock_irq(&child
->sighand
->siglock
);
442 read_unlock(&tasklist_lock
);
447 #ifdef PTRACE_SINGLESTEP
448 #define is_singlestep(request) ((request) == PTRACE_SINGLESTEP)
450 #define is_singlestep(request) 0
453 #ifdef PTRACE_SINGLEBLOCK
454 #define is_singleblock(request) ((request) == PTRACE_SINGLEBLOCK)
456 #define is_singleblock(request) 0
460 #define is_sysemu_singlestep(request) ((request) == PTRACE_SYSEMU_SINGLESTEP)
462 #define is_sysemu_singlestep(request) 0
465 static int ptrace_resume(struct task_struct
*child
, long request
, long data
)
467 if (!valid_signal(data
))
470 if (request
== PTRACE_SYSCALL
)
471 set_tsk_thread_flag(child
, TIF_SYSCALL_TRACE
);
473 clear_tsk_thread_flag(child
, TIF_SYSCALL_TRACE
);
475 #ifdef TIF_SYSCALL_EMU
476 if (request
== PTRACE_SYSEMU
|| request
== PTRACE_SYSEMU_SINGLESTEP
)
477 set_tsk_thread_flag(child
, TIF_SYSCALL_EMU
);
479 clear_tsk_thread_flag(child
, TIF_SYSCALL_EMU
);
482 if (is_singleblock(request
)) {
483 if (unlikely(!arch_has_block_step()))
485 user_enable_block_step(child
);
486 } else if (is_singlestep(request
) || is_sysemu_singlestep(request
)) {
487 if (unlikely(!arch_has_single_step()))
489 user_enable_single_step(child
);
491 user_disable_single_step(child
);
494 child
->exit_code
= data
;
495 wake_up_process(child
);
500 int ptrace_request(struct task_struct
*child
, long request
,
501 long addr
, long data
)
507 case PTRACE_PEEKTEXT
:
508 case PTRACE_PEEKDATA
:
509 return generic_ptrace_peekdata(child
, addr
, data
);
510 case PTRACE_POKETEXT
:
511 case PTRACE_POKEDATA
:
512 return generic_ptrace_pokedata(child
, addr
, data
);
514 #ifdef PTRACE_OLDSETOPTIONS
515 case PTRACE_OLDSETOPTIONS
:
517 case PTRACE_SETOPTIONS
:
518 ret
= ptrace_setoptions(child
, data
);
520 case PTRACE_GETEVENTMSG
:
521 ret
= put_user(child
->ptrace_message
, (unsigned long __user
*) data
);
524 case PTRACE_GETSIGINFO
:
525 ret
= ptrace_getsiginfo(child
, &siginfo
);
527 ret
= copy_siginfo_to_user((siginfo_t __user
*) data
,
531 case PTRACE_SETSIGINFO
:
532 if (copy_from_user(&siginfo
, (siginfo_t __user
*) data
,
536 ret
= ptrace_setsiginfo(child
, &siginfo
);
539 case PTRACE_DETACH
: /* detach a process that was attached. */
540 ret
= ptrace_detach(child
, data
);
543 #ifdef PTRACE_SINGLESTEP
544 case PTRACE_SINGLESTEP
:
546 #ifdef PTRACE_SINGLEBLOCK
547 case PTRACE_SINGLEBLOCK
:
551 case PTRACE_SYSEMU_SINGLESTEP
:
555 return ptrace_resume(child
, request
, data
);
558 if (child
->exit_state
) /* already dead */
560 return ptrace_resume(child
, request
, SIGKILL
);
/**
 * ptrace_traceme  --  helper for PTRACE_TRACEME
 *
 * Performs checks and sets PT_PTRACED.
 * Should be used by all ptrace implementations for PTRACE_TRACEME.
 */
575 int ptrace_traceme(void)
580 * Are we already being traced?
584 if (!(current
->ptrace
& PT_PTRACED
)) {
586 * See ptrace_attach() comments about the locking here.
589 if (!write_trylock_irqsave(&tasklist_lock
, flags
)) {
590 task_unlock(current
);
593 } while (!write_can_lock(&tasklist_lock
));
597 ret
= security_ptrace_traceme(current
->parent
);
600 * Check PF_EXITING to ensure ->real_parent has not passed
601 * exit_ptrace(). Otherwise we don't report the error but
602 * pretend ->real_parent untraces us right after return.
604 if (!ret
&& !(current
->real_parent
->flags
& PF_EXITING
)) {
605 current
->ptrace
|= PT_PTRACED
;
606 __ptrace_link(current
, current
->real_parent
);
609 write_unlock_irqrestore(&tasklist_lock
, flags
);
611 task_unlock(current
);
/**
 * ptrace_get_task_struct  --  grab a task struct reference for ptrace
 * @pid:       process id to grab a task_struct reference of
 *
 * This function is a helper for ptrace implementations.  It checks
 * permissions and then grabs a task struct for use of the actual
 * ptrace implementation.
 *
 * Returns the task_struct for @pid or an ERR_PTR() on failure.
 */
625 struct task_struct
*ptrace_get_task_struct(pid_t pid
)
627 struct task_struct
*child
;
629 read_lock(&tasklist_lock
);
630 child
= find_task_by_vpid(pid
);
632 get_task_struct(child
);
634 read_unlock(&tasklist_lock
);
636 return ERR_PTR(-ESRCH
);
640 #ifndef arch_ptrace_attach
641 #define arch_ptrace_attach(child) do { } while (0)
644 SYSCALL_DEFINE4(ptrace
, long, request
, long, pid
, long, addr
, long, data
)
646 struct task_struct
*child
;
650 * This lock_kernel fixes a subtle race with suid exec
653 if (request
== PTRACE_TRACEME
) {
654 ret
= ptrace_traceme();
656 arch_ptrace_attach(current
);
660 child
= ptrace_get_task_struct(pid
);
662 ret
= PTR_ERR(child
);
666 if (request
== PTRACE_ATTACH
) {
667 ret
= ptrace_attach(child
);
669 * Some architectures need to do book-keeping after
673 arch_ptrace_attach(child
);
674 goto out_put_task_struct
;
677 ret
= ptrace_check_attach(child
, request
== PTRACE_KILL
);
679 goto out_put_task_struct
;
681 ret
= arch_ptrace(child
, request
, addr
, data
);
684 put_task_struct(child
);
690 int generic_ptrace_peekdata(struct task_struct
*tsk
, long addr
, long data
)
695 copied
= access_process_vm(tsk
, addr
, &tmp
, sizeof(tmp
), 0);
696 if (copied
!= sizeof(tmp
))
698 return put_user(tmp
, (unsigned long __user
*)data
);
701 int generic_ptrace_pokedata(struct task_struct
*tsk
, long addr
, long data
)
705 copied
= access_process_vm(tsk
, addr
, &data
, sizeof(data
), 1);
706 return (copied
== sizeof(data
)) ? 0 : -EIO
;
709 #if defined CONFIG_COMPAT
710 #include <linux/compat.h>
712 int compat_ptrace_request(struct task_struct
*child
, compat_long_t request
,
713 compat_ulong_t addr
, compat_ulong_t data
)
715 compat_ulong_t __user
*datap
= compat_ptr(data
);
721 case PTRACE_PEEKTEXT
:
722 case PTRACE_PEEKDATA
:
723 ret
= access_process_vm(child
, addr
, &word
, sizeof(word
), 0);
724 if (ret
!= sizeof(word
))
727 ret
= put_user(word
, datap
);
730 case PTRACE_POKETEXT
:
731 case PTRACE_POKEDATA
:
732 ret
= access_process_vm(child
, addr
, &data
, sizeof(data
), 1);
733 ret
= (ret
!= sizeof(data
) ? -EIO
: 0);
736 case PTRACE_GETEVENTMSG
:
737 ret
= put_user((compat_ulong_t
) child
->ptrace_message
, datap
);
740 case PTRACE_GETSIGINFO
:
741 ret
= ptrace_getsiginfo(child
, &siginfo
);
743 ret
= copy_siginfo_to_user32(
744 (struct compat_siginfo __user
*) datap
,
748 case PTRACE_SETSIGINFO
:
749 memset(&siginfo
, 0, sizeof siginfo
);
750 if (copy_siginfo_from_user32(
751 &siginfo
, (struct compat_siginfo __user
*) datap
))
754 ret
= ptrace_setsiginfo(child
, &siginfo
);
758 ret
= ptrace_request(child
, request
, addr
, data
);
764 asmlinkage
long compat_sys_ptrace(compat_long_t request
, compat_long_t pid
,
765 compat_long_t addr
, compat_long_t data
)
767 struct task_struct
*child
;
771 * This lock_kernel fixes a subtle race with suid exec
774 if (request
== PTRACE_TRACEME
) {
775 ret
= ptrace_traceme();
779 child
= ptrace_get_task_struct(pid
);
781 ret
= PTR_ERR(child
);
785 if (request
== PTRACE_ATTACH
) {
786 ret
= ptrace_attach(child
);
788 * Some architectures need to do book-keeping after
792 arch_ptrace_attach(child
);
793 goto out_put_task_struct
;
796 ret
= ptrace_check_attach(child
, request
== PTRACE_KILL
);
798 ret
= compat_arch_ptrace(child
, request
, addr
, data
);
801 put_task_struct(child
);
806 #endif /* CONFIG_COMPAT */