/* By Ross Biro 1/23/92 */
/*
 * Pentium III FXSR, SSE support
 *	Gareth Hughes <gareth@valinux.com>, May 2000
 *
 * x86-64 port 2000-2002 Andi Kleen
 */
#include <linux/kernel.h>
#include <linux/sched.h>
#include <linux/smp.h>
#include <linux/smp_lock.h>
#include <linux/errno.h>
#include <linux/ptrace.h>
#include <linux/user.h>
#include <linux/security.h>
#include <linux/audit.h>
#include <linux/seccomp.h>

#include <asm/uaccess.h>
#include <asm/pgtable.h>
#include <asm/system.h>
#include <asm/processor.h>
#include <asm/debugreg.h>
#include <asm/proto.h>
/*
 * does not yet catch signals sent when the child dies.
 * in exit.c or in signal.c.
 */
/*
 * Mask of the EFLAGS bits a tracer is allowed to change in the child:
 * a set bit means the flag is user-accessible, a clear bit means it is not.
 */
#define FLAG_MASK 0x44dd5UL

/* The EFLAGS bit that sets the trap (single-step) flag. */
#define TRAP_FLAG 0x100UL

/*
 * EFLAGS is the offset of eflags inside struct pt_regs.  EFL_OFFSET is the
 * same slot expressed relative to the end of struct pt_regs (hence a
 * negative value), which is the form the stack accessors are called with.
 */
#define EFLAGS offsetof(struct pt_regs, eflags)
#define EFL_OFFSET ((int)(EFLAGS-sizeof(struct pt_regs)))
52 * this routine will get a word off of the processes privileged stack.
53 * the offset is how far from the base addr as stored in the TSS.
54 * this routine assumes that all the privileged stacks are in our
57 static inline unsigned long get_stack_long(struct task_struct
*task
, int offset
)
61 stack
= (unsigned char *)task
->thread
.rsp0
;
63 return (*((unsigned long *)stack
));
67 * this routine will put a word on the processes privileged stack.
68 * the offset is how far from the base addr as stored in the TSS.
69 * this routine assumes that all the privileged stacks are in our
72 static inline long put_stack_long(struct task_struct
*task
, int offset
,
75 unsigned char * stack
;
77 stack
= (unsigned char *) task
->thread
.rsp0
;
79 *(unsigned long *) stack
= data
;
84 * Called by kernel/ptrace.c when detaching..
86 * Make sure the single step bit is not set.
88 void ptrace_disable(struct task_struct
*child
)
92 clear_tsk_thread_flag(child
, TIF_SINGLESTEP
);
93 tmp
= get_stack_long(child
, EFL_OFFSET
) & ~TRAP_FLAG
;
94 put_stack_long(child
, EFL_OFFSET
, tmp
);
97 static int putreg(struct task_struct
*child
,
98 unsigned long regno
, unsigned long value
)
102 /* Some code in the 64bit emulation may not be 64bit clean.
103 Don't take any chances. */
104 if (test_tsk_thread_flag(child
, TIF_IA32
))
107 case offsetof(struct user_regs_struct
,fs
):
108 if (value
&& (value
& 3) != 3)
110 child
->thread
.fsindex
= value
& 0xffff;
112 case offsetof(struct user_regs_struct
,gs
):
113 if (value
&& (value
& 3) != 3)
115 child
->thread
.gsindex
= value
& 0xffff;
117 case offsetof(struct user_regs_struct
,ds
):
118 if (value
&& (value
& 3) != 3)
120 child
->thread
.ds
= value
& 0xffff;
122 case offsetof(struct user_regs_struct
,es
):
123 if (value
&& (value
& 3) != 3)
125 child
->thread
.es
= value
& 0xffff;
127 case offsetof(struct user_regs_struct
,ss
):
128 if ((value
& 3) != 3)
132 case offsetof(struct user_regs_struct
,fs_base
):
133 if (!((value
>> 48) == 0 || (value
>> 48) == 0xffff))
135 child
->thread
.fs
= value
;
137 case offsetof(struct user_regs_struct
,gs_base
):
138 if (!((value
>> 48) == 0 || (value
>> 48) == 0xffff))
140 child
->thread
.gs
= value
;
142 case offsetof(struct user_regs_struct
, eflags
):
144 tmp
= get_stack_long(child
, EFL_OFFSET
);
148 case offsetof(struct user_regs_struct
,cs
):
149 if ((value
& 3) != 3)
154 put_stack_long(child
, regno
- sizeof(struct pt_regs
), value
);
158 static unsigned long getreg(struct task_struct
*child
, unsigned long regno
)
162 case offsetof(struct user_regs_struct
, fs
):
163 return child
->thread
.fsindex
;
164 case offsetof(struct user_regs_struct
, gs
):
165 return child
->thread
.gsindex
;
166 case offsetof(struct user_regs_struct
, ds
):
167 return child
->thread
.ds
;
168 case offsetof(struct user_regs_struct
, es
):
169 return child
->thread
.es
;
170 case offsetof(struct user_regs_struct
, fs_base
):
171 return child
->thread
.fs
;
172 case offsetof(struct user_regs_struct
, gs_base
):
173 return child
->thread
.gs
;
175 regno
= regno
- sizeof(struct pt_regs
);
176 val
= get_stack_long(child
, regno
);
177 if (test_tsk_thread_flag(child
, TIF_IA32
))
184 asmlinkage
long sys_ptrace(long request
, long pid
, unsigned long addr
, long data
)
186 struct task_struct
*child
;
190 /* This lock_kernel fixes a subtle race with suid exec */
193 if (request
== PTRACE_TRACEME
) {
194 /* are we already being traced? */
195 if (current
->ptrace
& PT_PTRACED
)
197 ret
= security_ptrace(current
->parent
, current
);
200 /* set the ptrace bit in the process flags. */
201 current
->ptrace
|= PT_PTRACED
;
206 read_lock(&tasklist_lock
);
207 child
= find_task_by_pid(pid
);
209 get_task_struct(child
);
210 read_unlock(&tasklist_lock
);
215 if (pid
== 1) /* you may not mess with init */
218 if (request
== PTRACE_ATTACH
) {
219 ret
= ptrace_attach(child
);
222 ret
= ptrace_check_attach(child
, request
== PTRACE_KILL
);
227 /* when I and D space are separate, these will need to be fixed. */
228 case PTRACE_PEEKTEXT
: /* read word at location addr. */
229 case PTRACE_PEEKDATA
: {
233 copied
= access_process_vm(child
, addr
, &tmp
, sizeof(tmp
), 0);
235 if (copied
!= sizeof(tmp
))
237 ret
= put_user(tmp
,(unsigned long __user
*) data
);
241 /* read the word at location addr in the USER area. */
242 case PTRACE_PEEKUSR
: {
247 addr
> sizeof(struct user
) - 7)
251 case 0 ... sizeof(struct user_regs_struct
):
252 tmp
= getreg(child
, addr
);
254 case offsetof(struct user
, u_debugreg
[0]):
255 tmp
= child
->thread
.debugreg0
;
257 case offsetof(struct user
, u_debugreg
[1]):
258 tmp
= child
->thread
.debugreg1
;
260 case offsetof(struct user
, u_debugreg
[2]):
261 tmp
= child
->thread
.debugreg2
;
263 case offsetof(struct user
, u_debugreg
[3]):
264 tmp
= child
->thread
.debugreg3
;
266 case offsetof(struct user
, u_debugreg
[6]):
267 tmp
= child
->thread
.debugreg6
;
269 case offsetof(struct user
, u_debugreg
[7]):
270 tmp
= child
->thread
.debugreg7
;
276 ret
= put_user(tmp
,(unsigned long __user
*) data
);
280 /* when I and D space are separate, this will have to be fixed. */
281 case PTRACE_POKETEXT
: /* write the word at location addr. */
282 case PTRACE_POKEDATA
:
284 if (access_process_vm(child
, addr
, &data
, sizeof(data
), 1) == sizeof(data
))
289 case PTRACE_POKEUSR
: /* write the word at location addr in the USER area */
292 addr
> sizeof(struct user
) - 7)
296 case 0 ... sizeof(struct user_regs_struct
):
297 ret
= putreg(child
, addr
, data
);
299 /* Disallows to set a breakpoint into the vsyscall */
300 case offsetof(struct user
, u_debugreg
[0]):
301 if (data
>= TASK_SIZE
-7) break;
302 child
->thread
.debugreg0
= data
;
305 case offsetof(struct user
, u_debugreg
[1]):
306 if (data
>= TASK_SIZE
-7) break;
307 child
->thread
.debugreg1
= data
;
310 case offsetof(struct user
, u_debugreg
[2]):
311 if (data
>= TASK_SIZE
-7) break;
312 child
->thread
.debugreg2
= data
;
315 case offsetof(struct user
, u_debugreg
[3]):
316 if (data
>= TASK_SIZE
-7) break;
317 child
->thread
.debugreg3
= data
;
320 case offsetof(struct user
, u_debugreg
[6]):
323 child
->thread
.debugreg6
= data
;
326 case offsetof(struct user
, u_debugreg
[7]):
327 /* See arch/i386/kernel/ptrace.c for an explanation of
328 * this awkward check.*/
329 data
&= ~DR_CONTROL_RESERVED
;
331 if ((0x5454 >> ((data
>> (16 + 4*i
)) & 0xf)) & 1)
334 child
->thread
.debugreg7
= data
;
340 case PTRACE_SYSCALL
: /* continue and stop at next (return from) syscall */
341 case PTRACE_CONT
: { /* restart after signal. */
345 if ((unsigned long) data
> _NSIG
)
347 if (request
== PTRACE_SYSCALL
)
348 set_tsk_thread_flag(child
,TIF_SYSCALL_TRACE
);
350 clear_tsk_thread_flag(child
,TIF_SYSCALL_TRACE
);
351 clear_tsk_thread_flag(child
, TIF_SINGLESTEP
);
352 child
->exit_code
= data
;
353 /* make sure the single step bit is not set. */
354 tmp
= get_stack_long(child
, EFL_OFFSET
);
356 put_stack_long(child
, EFL_OFFSET
,tmp
);
357 wake_up_process(child
);
362 #ifdef CONFIG_IA32_EMULATION
363 /* This makes only sense with 32bit programs. Allow a
364 64bit debugger to fully examine them too. Better
365 don't use it against 64bit processes, use
366 PTRACE_ARCH_PRCTL instead. */
367 case PTRACE_SET_THREAD_AREA
: {
368 struct user_desc __user
*p
;
370 p
= (struct user_desc __user
*)data
;
371 get_user(old
, &p
->entry_number
);
372 put_user(addr
, &p
->entry_number
);
373 ret
= do_set_thread_area(&child
->thread
, p
);
374 put_user(old
, &p
->entry_number
);
376 case PTRACE_GET_THREAD_AREA
:
377 p
= (struct user_desc __user
*)data
;
378 get_user(old
, &p
->entry_number
);
379 put_user(addr
, &p
->entry_number
);
380 ret
= do_get_thread_area(&child
->thread
, p
);
381 put_user(old
, &p
->entry_number
);
385 /* normal 64bit interface to access TLS data.
386 Works just like arch_prctl, except that the arguments
388 case PTRACE_ARCH_PRCTL
:
389 ret
= do_arch_prctl(child
, data
, addr
);
393 * make the child exit. Best I can do is send it a sigkill.
394 * perhaps it should be put in the status that it wants to
401 if (child
->exit_state
== EXIT_ZOMBIE
) /* already dead */
403 clear_tsk_thread_flag(child
, TIF_SINGLESTEP
);
404 child
->exit_code
= SIGKILL
;
405 /* make sure the single step bit is not set. */
406 tmp
= get_stack_long(child
, EFL_OFFSET
) & ~TRAP_FLAG
;
407 put_stack_long(child
, EFL_OFFSET
, tmp
);
408 wake_up_process(child
);
412 case PTRACE_SINGLESTEP
: { /* set the trap flag. */
416 if ((unsigned long) data
> _NSIG
)
418 clear_tsk_thread_flag(child
,TIF_SYSCALL_TRACE
);
419 if ((child
->ptrace
& PT_DTRACE
) == 0) {
420 /* Spurious delayed TF traps may occur */
421 child
->ptrace
|= PT_DTRACE
;
423 tmp
= get_stack_long(child
, EFL_OFFSET
) | TRAP_FLAG
;
424 put_stack_long(child
, EFL_OFFSET
, tmp
);
425 set_tsk_thread_flag(child
, TIF_SINGLESTEP
);
426 child
->exit_code
= data
;
427 /* give it a chance to run. */
428 wake_up_process(child
);
434 /* detach a process that was attached. */
435 ret
= ptrace_detach(child
, data
);
438 case PTRACE_GETREGS
: { /* Get all gp regs from the child. */
439 if (!access_ok(VERIFY_WRITE
, (unsigned __user
*)data
,
440 sizeof(struct user_regs_struct
))) {
445 for (ui
= 0; ui
< sizeof(struct user_regs_struct
); ui
+= sizeof(long)) {
446 ret
|= __put_user(getreg(child
, ui
),(unsigned long __user
*) data
);
447 data
+= sizeof(long);
452 case PTRACE_SETREGS
: { /* Set all gp regs in the child. */
454 if (!access_ok(VERIFY_READ
, (unsigned __user
*)data
,
455 sizeof(struct user_regs_struct
))) {
460 for (ui
= 0; ui
< sizeof(struct user_regs_struct
); ui
+= sizeof(long)) {
461 ret
|= __get_user(tmp
, (unsigned long __user
*) data
);
462 putreg(child
, ui
, tmp
);
463 data
+= sizeof(long);
468 case PTRACE_GETFPREGS
: { /* Get the child extended FPU state. */
469 if (!access_ok(VERIFY_WRITE
, (unsigned __user
*)data
,
470 sizeof(struct user_i387_struct
))) {
474 ret
= get_fpregs((struct user_i387_struct __user
*)data
, child
);
478 case PTRACE_SETFPREGS
: { /* Set the child extended FPU state. */
479 if (!access_ok(VERIFY_READ
, (unsigned __user
*)data
,
480 sizeof(struct user_i387_struct
))) {
484 set_stopped_child_used_math(child
);
485 ret
= set_fpregs(child
, (struct user_i387_struct __user
*)data
);
490 ret
= ptrace_request(child
, request
, addr
, data
);
494 put_task_struct(child
);
500 static void syscall_trace(struct pt_regs
*regs
)
504 printk("trace %s rip %lx rsp %lx rax %d origrax %d caller %lx tiflags %x ptrace %x\n",
506 regs
->rip
, regs
->rsp
, regs
->rax
, regs
->orig_rax
, __builtin_return_address(0),
507 current_thread_info()->flags
, current
->ptrace
);
510 ptrace_notify(SIGTRAP
| ((current
->ptrace
& PT_TRACESYSGOOD
)
513 * this isn't the same as continuing with a signal, but it will do
514 * for normal use. strace only continues with a signal if the
515 * stopping signal is not SIGTRAP. -brl
517 if (current
->exit_code
) {
518 send_sig(current
->exit_code
, current
, 1);
519 current
->exit_code
= 0;
523 asmlinkage
void syscall_trace_enter(struct pt_regs
*regs
)
525 /* do the secure computing check first */
526 secure_computing(regs
->orig_rax
);
528 if (unlikely(current
->audit_context
))
529 audit_syscall_entry(current
, regs
->orig_rax
,
530 regs
->rdi
, regs
->rsi
,
531 regs
->rdx
, regs
->r10
);
533 if (test_thread_flag(TIF_SYSCALL_TRACE
)
534 && (current
->ptrace
& PT_PTRACED
))
538 asmlinkage
void syscall_trace_leave(struct pt_regs
*regs
)
540 if (unlikely(current
->audit_context
))
541 audit_syscall_exit(current
, regs
->rax
);
543 if ((test_thread_flag(TIF_SYSCALL_TRACE
)
544 || test_thread_flag(TIF_SINGLESTEP
))
545 && (current
->ptrace
& PT_PTRACED
))