2 * linux/kernel/signal.c
4 * Copyright (C) 1991, 1992 Linus Torvalds
6 * 1997-11-02 Modified for POSIX.1b signals by Richard Henderson
8 * 2003-06-02 Jim Houston - Concurrent Computer Corp.
9 * Changes to use preallocated sigqueue structures
10 * to allow signals to be sent reliably.
13 #include <linux/slab.h>
14 #include <linux/export.h>
15 #include <linux/init.h>
16 #include <linux/sched.h>
18 #include <linux/tty.h>
19 #include <linux/binfmts.h>
20 #include <linux/security.h>
21 #include <linux/syscalls.h>
22 #include <linux/ptrace.h>
23 #include <linux/signal.h>
24 #include <linux/signalfd.h>
25 #include <linux/ratelimit.h>
26 #include <linux/tracehook.h>
27 #include <linux/capability.h>
28 #include <linux/freezer.h>
29 #include <linux/pid_namespace.h>
30 #include <linux/nsproxy.h>
31 #include <linux/user_namespace.h>
32 #define CREATE_TRACE_POINTS
33 #include <trace/events/signal.h>
35 #include <asm/param.h>
36 #include <asm/uaccess.h>
37 #include <asm/unistd.h>
38 #include <asm/siginfo.h>
39 #include "audit.h" /* audit_signal_info() */
42 * SLAB caches for signal bits.
45 static struct kmem_cache
*sigqueue_cachep
;
47 int print_fatal_signals __read_mostly
;
49 static void __user
*sig_handler(struct task_struct
*t
, int sig
)
51 return t
->sighand
->action
[sig
- 1].sa
.sa_handler
;
54 static int sig_handler_ignored(void __user
*handler
, int sig
)
56 /* Is it explicitly or implicitly ignored? */
57 return handler
== SIG_IGN
||
58 (handler
== SIG_DFL
&& sig_kernel_ignore(sig
));
61 static int sig_task_ignored(struct task_struct
*t
, int sig
,
66 handler
= sig_handler(t
, sig
);
68 if (unlikely(t
->signal
->flags
& SIGNAL_UNKILLABLE
) &&
69 handler
== SIG_DFL
&& !from_ancestor_ns
)
72 return sig_handler_ignored(handler
, sig
);
75 static int sig_ignored(struct task_struct
*t
, int sig
, int from_ancestor_ns
)
78 * Blocked signals are never ignored, since the
79 * signal handler may change by the time it is
82 if (sigismember(&t
->blocked
, sig
) || sigismember(&t
->real_blocked
, sig
))
85 if (!sig_task_ignored(t
, sig
, from_ancestor_ns
))
89 * Tracers may want to know about even ignored signals.
95 * Re-calculate pending state from the set of locally pending
96 * signals, globally pending signals, and blocked signals.
98 static inline int has_pending_signals(sigset_t
*signal
, sigset_t
*blocked
)
103 switch (_NSIG_WORDS
) {
105 for (i
= _NSIG_WORDS
, ready
= 0; --i
>= 0 ;)
106 ready
|= signal
->sig
[i
] &~ blocked
->sig
[i
];
109 case 4: ready
= signal
->sig
[3] &~ blocked
->sig
[3];
110 ready
|= signal
->sig
[2] &~ blocked
->sig
[2];
111 ready
|= signal
->sig
[1] &~ blocked
->sig
[1];
112 ready
|= signal
->sig
[0] &~ blocked
->sig
[0];
115 case 2: ready
= signal
->sig
[1] &~ blocked
->sig
[1];
116 ready
|= signal
->sig
[0] &~ blocked
->sig
[0];
119 case 1: ready
= signal
->sig
[0] &~ blocked
->sig
[0];
124 #define PENDING(p,b) has_pending_signals(&(p)->signal, (b))
126 static int recalc_sigpending_tsk(struct task_struct
*t
)
128 if ((t
->jobctl
& JOBCTL_PENDING_MASK
) ||
129 PENDING(&t
->pending
, &t
->blocked
) ||
130 PENDING(&t
->signal
->shared_pending
, &t
->blocked
)) {
131 set_tsk_thread_flag(t
, TIF_SIGPENDING
);
135 * We must never clear the flag in another thread, or in current
136 * when it's possible the current syscall is returning -ERESTART*.
137 * So we don't clear it here, and only callers who know they should do.
143 * After recalculating TIF_SIGPENDING, we need to make sure the task wakes up.
144 * This is superfluous when called on current, the wakeup is a harmless no-op.
/*
 * Recompute the pending state of @t and, when recalc_sigpending_tsk()
 * reports a non-zero result, wake the task with signal_wake_up(t, 0).
 */
void recalc_sigpending_and_wake(struct task_struct *t)
{
	if (!recalc_sigpending_tsk(t))
		return;

	signal_wake_up(t, 0);
}
152 void recalc_sigpending(void)
154 if (!recalc_sigpending_tsk(current
) && !freezing(current
))
155 clear_thread_flag(TIF_SIGPENDING
);
159 /* Given the mask, find the first available signal that should be serviced. */
161 #define SYNCHRONOUS_MASK \
162 (sigmask(SIGSEGV) | sigmask(SIGBUS) | sigmask(SIGILL) | \
163 sigmask(SIGTRAP) | sigmask(SIGFPE))
165 int next_signal(struct sigpending
*pending
, sigset_t
*mask
)
167 unsigned long i
, *s
, *m
, x
;
170 s
= pending
->signal
.sig
;
174 * Handle the first word specially: it contains the
175 * synchronous signals that need to be dequeued first.
179 if (x
& SYNCHRONOUS_MASK
)
180 x
&= SYNCHRONOUS_MASK
;
185 switch (_NSIG_WORDS
) {
187 for (i
= 1; i
< _NSIG_WORDS
; ++i
) {
191 sig
= ffz(~x
) + i
*_NSIG_BPW
+ 1;
200 sig
= ffz(~x
) + _NSIG_BPW
+ 1;
211 static inline void print_dropped_signal(int sig
)
213 static DEFINE_RATELIMIT_STATE(ratelimit_state
, 5 * HZ
, 10);
215 if (!print_fatal_signals
)
218 if (!__ratelimit(&ratelimit_state
))
221 printk(KERN_INFO
"%s/%d: reached RLIMIT_SIGPENDING, dropped signal %d\n",
222 current
->comm
, current
->pid
, sig
);
226 * task_set_jobctl_pending - set jobctl pending bits
228 * @mask: pending bits to set
230 * Set @mask in @task->jobctl. @mask must be subset of
231 * %JOBCTL_PENDING_MASK | %JOBCTL_STOP_CONSUME | %JOBCTL_STOP_SIGMASK |
232 * %JOBCTL_TRAPPING. If stop signo is being set, the existing signo is
233 * cleared. If @task is already being killed or exiting, this function
237 * Must be called with @task->sighand->siglock held.
240 * %true if @mask is set, %false if made noop because @task was dying.
242 bool task_set_jobctl_pending(struct task_struct
*task
, unsigned int mask
)
244 BUG_ON(mask
& ~(JOBCTL_PENDING_MASK
| JOBCTL_STOP_CONSUME
|
245 JOBCTL_STOP_SIGMASK
| JOBCTL_TRAPPING
));
246 BUG_ON((mask
& JOBCTL_TRAPPING
) && !(mask
& JOBCTL_PENDING_MASK
));
248 if (unlikely(fatal_signal_pending(task
) || (task
->flags
& PF_EXITING
)))
251 if (mask
& JOBCTL_STOP_SIGMASK
)
252 task
->jobctl
&= ~JOBCTL_STOP_SIGMASK
;
254 task
->jobctl
|= mask
;
259 * task_clear_jobctl_trapping - clear jobctl trapping bit
262 * If JOBCTL_TRAPPING is set, a ptracer is waiting for us to enter TRACED.
263 * Clear it and wake up the ptracer. Note that we don't need any further
264 * locking. @task->siglock guarantees that @task->parent points to the
268 * Must be called with @task->sighand->siglock held.
270 void task_clear_jobctl_trapping(struct task_struct
*task
)
272 if (unlikely(task
->jobctl
& JOBCTL_TRAPPING
)) {
273 task
->jobctl
&= ~JOBCTL_TRAPPING
;
274 wake_up_bit(&task
->jobctl
, JOBCTL_TRAPPING_BIT
);
279 * task_clear_jobctl_pending - clear jobctl pending bits
281 * @mask: pending bits to clear
283 * Clear @mask from @task->jobctl. @mask must be subset of
284 * %JOBCTL_PENDING_MASK. If %JOBCTL_STOP_PENDING is being cleared, other
285 * STOP bits are cleared together.
287 * If clearing of @mask leaves no stop or trap pending, this function calls
288 * task_clear_jobctl_trapping().
291 * Must be called with @task->sighand->siglock held.
293 void task_clear_jobctl_pending(struct task_struct
*task
, unsigned int mask
)
295 BUG_ON(mask
& ~JOBCTL_PENDING_MASK
);
297 if (mask
& JOBCTL_STOP_PENDING
)
298 mask
|= JOBCTL_STOP_CONSUME
| JOBCTL_STOP_DEQUEUED
;
300 task
->jobctl
&= ~mask
;
302 if (!(task
->jobctl
& JOBCTL_PENDING_MASK
))
303 task_clear_jobctl_trapping(task
);
307 * task_participate_group_stop - participate in a group stop
308 * @task: task participating in a group stop
310 * @task has %JOBCTL_STOP_PENDING set and is participating in a group stop.
311 * Group stop states are cleared and the group stop count is consumed if
312 * %JOBCTL_STOP_CONSUME was set. If the consumption completes the group
313 * stop, the appropriate %SIGNAL_* flags are set.
316 * Must be called with @task->sighand->siglock held.
319 * %true if group stop completion should be notified to the parent, %false
322 static bool task_participate_group_stop(struct task_struct
*task
)
324 struct signal_struct
*sig
= task
->signal
;
325 bool consume
= task
->jobctl
& JOBCTL_STOP_CONSUME
;
327 WARN_ON_ONCE(!(task
->jobctl
& JOBCTL_STOP_PENDING
));
329 task_clear_jobctl_pending(task
, JOBCTL_STOP_PENDING
);
334 if (!WARN_ON_ONCE(sig
->group_stop_count
== 0))
335 sig
->group_stop_count
--;
338 * Tell the caller to notify completion iff we are entering into a
339 * fresh group stop. Read comment in do_signal_stop() for details.
341 if (!sig
->group_stop_count
&& !(sig
->flags
& SIGNAL_STOP_STOPPED
)) {
342 sig
->flags
= SIGNAL_STOP_STOPPED
;
349 * allocate a new signal queue record
350 * - this may be called without locks if and only if t == current, otherwise an
351 * appropriate lock must be held to stop the target task from exiting
353 static struct sigqueue
*
354 __sigqueue_alloc(int sig
, struct task_struct
*t
, gfp_t flags
, int override_rlimit
)
356 struct sigqueue
*q
= NULL
;
357 struct user_struct
*user
;
360 * Protect access to @t credentials. This can go away when all
361 * callers hold rcu read lock.
364 user
= get_uid(__task_cred(t
)->user
);
365 atomic_inc(&user
->sigpending
);
368 if (override_rlimit
||
369 atomic_read(&user
->sigpending
) <=
370 task_rlimit(t
, RLIMIT_SIGPENDING
)) {
371 q
= kmem_cache_alloc(sigqueue_cachep
, flags
);
373 print_dropped_signal(sig
);
376 if (unlikely(q
== NULL
)) {
377 atomic_dec(&user
->sigpending
);
380 INIT_LIST_HEAD(&q
->list
);
388 static void __sigqueue_free(struct sigqueue
*q
)
390 if (q
->flags
& SIGQUEUE_PREALLOC
)
392 atomic_dec(&q
->user
->sigpending
);
394 kmem_cache_free(sigqueue_cachep
, q
);
397 void flush_sigqueue(struct sigpending
*queue
)
401 sigemptyset(&queue
->signal
);
402 while (!list_empty(&queue
->list
)) {
403 q
= list_entry(queue
->list
.next
, struct sigqueue
, list
);
404 list_del_init(&q
->list
);
410 * Flush all pending signals for a task.
412 void __flush_signals(struct task_struct
*t
)
414 clear_tsk_thread_flag(t
, TIF_SIGPENDING
);
415 flush_sigqueue(&t
->pending
);
416 flush_sigqueue(&t
->signal
->shared_pending
);
419 void flush_signals(struct task_struct
*t
)
423 spin_lock_irqsave(&t
->sighand
->siglock
, flags
);
425 spin_unlock_irqrestore(&t
->sighand
->siglock
, flags
);
428 static void __flush_itimer_signals(struct sigpending
*pending
)
430 sigset_t signal
, retain
;
431 struct sigqueue
*q
, *n
;
433 signal
= pending
->signal
;
434 sigemptyset(&retain
);
436 list_for_each_entry_safe(q
, n
, &pending
->list
, list
) {
437 int sig
= q
->info
.si_signo
;
439 if (likely(q
->info
.si_code
!= SI_TIMER
)) {
440 sigaddset(&retain
, sig
);
442 sigdelset(&signal
, sig
);
443 list_del_init(&q
->list
);
448 sigorsets(&pending
->signal
, &signal
, &retain
);
451 void flush_itimer_signals(void)
453 struct task_struct
*tsk
= current
;
456 spin_lock_irqsave(&tsk
->sighand
->siglock
, flags
);
457 __flush_itimer_signals(&tsk
->pending
);
458 __flush_itimer_signals(&tsk
->signal
->shared_pending
);
459 spin_unlock_irqrestore(&tsk
->sighand
->siglock
, flags
);
462 void ignore_signals(struct task_struct
*t
)
466 for (i
= 0; i
< _NSIG
; ++i
)
467 t
->sighand
->action
[i
].sa
.sa_handler
= SIG_IGN
;
473 * Flush all handlers for a task.
477 flush_signal_handlers(struct task_struct
*t
, int force_default
)
480 struct k_sigaction
*ka
= &t
->sighand
->action
[0];
481 for (i
= _NSIG
; i
!= 0 ; i
--) {
482 if (force_default
|| ka
->sa
.sa_handler
!= SIG_IGN
)
483 ka
->sa
.sa_handler
= SIG_DFL
;
485 sigemptyset(&ka
->sa
.sa_mask
);
490 int unhandled_signal(struct task_struct
*tsk
, int sig
)
492 void __user
*handler
= tsk
->sighand
->action
[sig
-1].sa
.sa_handler
;
493 if (is_global_init(tsk
))
495 if (handler
!= SIG_IGN
&& handler
!= SIG_DFL
)
497 /* if ptraced, let the tracer determine */
502 * Notify the system that a driver wants to block all signals for this
503 * process, and wants to be notified if any signals at all were to be
504 * sent/acted upon. If the notifier routine returns non-zero, then the
505 * signal will be acted upon after all. If the notifier routine returns 0,
506 * then the signal will be blocked. Only one block per process is
507 * allowed. priv is a pointer to private data that the notifier routine
508 * can use to determine if the signal should be blocked or not.
511 block_all_signals(int (*notifier
)(void *priv
), void *priv
, sigset_t
*mask
)
515 spin_lock_irqsave(¤t
->sighand
->siglock
, flags
);
516 current
->notifier_mask
= mask
;
517 current
->notifier_data
= priv
;
518 current
->notifier
= notifier
;
519 spin_unlock_irqrestore(¤t
->sighand
->siglock
, flags
);
522 /* Notify the system that blocking has ended. */
525 unblock_all_signals(void)
529 spin_lock_irqsave(¤t
->sighand
->siglock
, flags
);
530 current
->notifier
= NULL
;
531 current
->notifier_data
= NULL
;
533 spin_unlock_irqrestore(¤t
->sighand
->siglock
, flags
);
536 static void collect_signal(int sig
, struct sigpending
*list
, siginfo_t
*info
)
538 struct sigqueue
*q
, *first
= NULL
;
541 * Collect the siginfo appropriate to this signal. Check if
542 * there is another siginfo for the same signal.
544 list_for_each_entry(q
, &list
->list
, list
) {
545 if (q
->info
.si_signo
== sig
) {
552 sigdelset(&list
->signal
, sig
);
556 list_del_init(&first
->list
);
557 copy_siginfo(info
, &first
->info
);
558 __sigqueue_free(first
);
561 * Ok, it wasn't in the queue. This must be
562 * a fast-pathed signal or we must have been
563 * out of queue space. So zero out the info.
565 info
->si_signo
= sig
;
567 info
->si_code
= SI_USER
;
573 static int __dequeue_signal(struct sigpending
*pending
, sigset_t
*mask
,
576 int sig
= next_signal(pending
, mask
);
579 if (current
->notifier
) {
580 if (sigismember(current
->notifier_mask
, sig
)) {
581 if (!(current
->notifier
)(current
->notifier_data
)) {
582 clear_thread_flag(TIF_SIGPENDING
);
588 collect_signal(sig
, pending
, info
);
595 * Dequeue a signal and return the element to the caller, which is
596 * expected to free it.
598 * All callers have to hold the siglock.
600 int dequeue_signal(struct task_struct
*tsk
, sigset_t
*mask
, siginfo_t
*info
)
604 /* We only dequeue private signals from ourselves, we don't let
605 * signalfd steal them
607 signr
= __dequeue_signal(&tsk
->pending
, mask
, info
);
609 signr
= __dequeue_signal(&tsk
->signal
->shared_pending
,
614 * itimers are process shared and we restart periodic
615 * itimers in the signal delivery path to prevent DoS
616 * attacks in the high resolution timer case. This is
617 * compliant with the old way of self-restarting
618 * itimers, as the SIGALRM is a legacy signal and only
619 * queued once. Changing the restart behaviour to
620 * restart the timer in the signal dequeue path is
621 * reducing the timer noise on heavy loaded !highres
624 if (unlikely(signr
== SIGALRM
)) {
625 struct hrtimer
*tmr
= &tsk
->signal
->real_timer
;
627 if (!hrtimer_is_queued(tmr
) &&
628 tsk
->signal
->it_real_incr
.tv64
!= 0) {
629 hrtimer_forward(tmr
, tmr
->base
->get_time(),
630 tsk
->signal
->it_real_incr
);
631 hrtimer_restart(tmr
);
640 if (unlikely(sig_kernel_stop(signr
))) {
642 * Set a marker that we have dequeued a stop signal. Our
643 * caller might release the siglock and then the pending
644 * stop signal it is about to process is no longer in the
645 * pending bitmasks, but must still be cleared by a SIGCONT
646 * (and overruled by a SIGKILL). So those cases clear this
647 * shared flag after we've set it. Note that this flag may
648 * remain set after the signal we return is ignored or
649 * handled. That doesn't matter because its only purpose
650 * is to alert stop-signal processing code when another
651 * processor has come along and cleared the flag.
653 current
->jobctl
|= JOBCTL_STOP_DEQUEUED
;
655 if ((info
->si_code
& __SI_MASK
) == __SI_TIMER
&& info
->si_sys_private
) {
657 * Release the siglock to ensure proper locking order
658 * of timer locks outside of siglocks. Note, we leave
659 * irqs disabled here, since the posix-timers code is
660 * about to disable them again anyway.
662 spin_unlock(&tsk
->sighand
->siglock
);
663 do_schedule_next_timer(info
);
664 spin_lock(&tsk
->sighand
->siglock
);
670 * Tell a process that it has a new active signal..
672 * NOTE! we rely on the previous spin_lock to
673 * lock interrupts for us! We can only be called with
674 * "siglock" held, and the local interrupt must
675 * have been disabled when that got acquired!
677 * No need to set need_resched since signal event passing
678 * goes through ->blocked
680 void signal_wake_up(struct task_struct
*t
, int resume
)
684 set_tsk_thread_flag(t
, TIF_SIGPENDING
);
687 * For SIGKILL, we want to wake it up in the stopped/traced/killable
688 * case. We don't check t->state here because there is a race with it
689 * executing on another processor and just now entering stopped state.
690 * By using wake_up_state, we ensure the process will wake up and
691 * handle its death signal.
693 mask
= TASK_INTERRUPTIBLE
;
695 mask
|= TASK_WAKEKILL
;
696 if (!wake_up_state(t
, mask
))
701 * Remove signals in mask from the pending set and queue.
702 * Returns 1 if any signals were found.
704 * All callers must be holding the siglock.
706 * This version takes a sigset mask and looks at all signals,
707 * not just those in the first mask word.
709 static int rm_from_queue_full(sigset_t
*mask
, struct sigpending
*s
)
711 struct sigqueue
*q
, *n
;
714 sigandsets(&m
, mask
, &s
->signal
);
715 if (sigisemptyset(&m
))
718 sigandnsets(&s
->signal
, &s
->signal
, mask
);
719 list_for_each_entry_safe(q
, n
, &s
->list
, list
) {
720 if (sigismember(mask
, q
->info
.si_signo
)) {
721 list_del_init(&q
->list
);
728 * Remove signals in mask from the pending set and queue.
729 * Returns 1 if any signals were found.
731 * All callers must be holding the siglock.
733 static int rm_from_queue(unsigned long mask
, struct sigpending
*s
)
735 struct sigqueue
*q
, *n
;
737 if (!sigtestsetmask(&s
->signal
, mask
))
740 sigdelsetmask(&s
->signal
, mask
);
741 list_for_each_entry_safe(q
, n
, &s
->list
, list
) {
742 if (q
->info
.si_signo
< SIGRTMIN
&&
743 (mask
& sigmask(q
->info
.si_signo
))) {
744 list_del_init(&q
->list
);
751 static inline int is_si_special(const struct siginfo
*info
)
753 return info
<= SEND_SIG_FORCED
;
756 static inline bool si_fromuser(const struct siginfo
*info
)
758 return info
== SEND_SIG_NOINFO
||
759 (!is_si_special(info
) && SI_FROMUSER(info
));
763 * called with RCU read lock from check_kill_permission()
765 static int kill_ok_by_cred(struct task_struct
*t
)
767 const struct cred
*cred
= current_cred();
768 const struct cred
*tcred
= __task_cred(t
);
770 if (cred
->user
->user_ns
== tcred
->user
->user_ns
&&
771 (cred
->euid
== tcred
->suid
||
772 cred
->euid
== tcred
->uid
||
773 cred
->uid
== tcred
->suid
||
774 cred
->uid
== tcred
->uid
))
777 if (ns_capable(tcred
->user
->user_ns
, CAP_KILL
))
784 * Bad permissions for sending the signal
785 * - the caller must hold the RCU read lock
787 static int check_kill_permission(int sig
, struct siginfo
*info
,
788 struct task_struct
*t
)
793 if (!valid_signal(sig
))
796 if (!si_fromuser(info
))
799 error
= audit_signal_info(sig
, t
); /* Let audit system see the signal */
803 if (!same_thread_group(current
, t
) &&
804 !kill_ok_by_cred(t
)) {
807 sid
= task_session(t
);
809 * We don't return the error if sid == NULL. The
810 * task was unhashed, the caller must notice this.
812 if (!sid
|| sid
== task_session(current
))
819 return security_task_kill(t
, info
, sig
, 0);
823 * ptrace_trap_notify - schedule trap to notify ptracer
824 * @t: tracee wanting to notify tracer
826 * This function schedules sticky ptrace trap which is cleared on the next
827 * TRAP_STOP to notify ptracer of an event. @t must have been seized by
830 * If @t is running, STOP trap will be taken. If trapped for STOP and
831 * ptracer is listening for events, tracee is woken up so that it can
832 * re-trap for the new event. If trapped otherwise, STOP trap will be
833 * eventually taken without returning to userland after the existing traps
834 * are finished by PTRACE_CONT.
837 * Must be called with @task->sighand->siglock held.
839 static void ptrace_trap_notify(struct task_struct
*t
)
841 WARN_ON_ONCE(!(t
->ptrace
& PT_SEIZED
));
842 assert_spin_locked(&t
->sighand
->siglock
);
844 task_set_jobctl_pending(t
, JOBCTL_TRAP_NOTIFY
);
845 signal_wake_up(t
, t
->jobctl
& JOBCTL_LISTENING
);
849 * Handle magic process-wide effects of stop/continue signals. Unlike
850 * the signal actions, these happen immediately at signal-generation
851 * time regardless of blocking, ignoring, or handling. This does the
852 * actual continuing for SIGCONT, but not the actual stopping for stop
853 * signals. The process stop is done as a signal action for SIG_DFL.
855 * Returns true if the signal should be actually delivered, otherwise
856 * it should be dropped.
858 static int prepare_signal(int sig
, struct task_struct
*p
, int from_ancestor_ns
)
860 struct signal_struct
*signal
= p
->signal
;
861 struct task_struct
*t
;
863 if (unlikely(signal
->flags
& SIGNAL_GROUP_EXIT
)) {
865 * The process is in the middle of dying, nothing to do.
867 } else if (sig_kernel_stop(sig
)) {
869 * This is a stop signal. Remove SIGCONT from all queues.
871 rm_from_queue(sigmask(SIGCONT
), &signal
->shared_pending
);
874 rm_from_queue(sigmask(SIGCONT
), &t
->pending
);
875 } while_each_thread(p
, t
);
876 } else if (sig
== SIGCONT
) {
879 * Remove all stop signals from all queues, wake all threads.
881 rm_from_queue(SIG_KERNEL_STOP_MASK
, &signal
->shared_pending
);
884 task_clear_jobctl_pending(t
, JOBCTL_STOP_PENDING
);
885 rm_from_queue(SIG_KERNEL_STOP_MASK
, &t
->pending
);
886 if (likely(!(t
->ptrace
& PT_SEIZED
)))
887 wake_up_state(t
, __TASK_STOPPED
);
889 ptrace_trap_notify(t
);
890 } while_each_thread(p
, t
);
893 * Notify the parent with CLD_CONTINUED if we were stopped.
895 * If we were in the middle of a group stop, we pretend it
896 * was already finished, and then continued. Since SIGCHLD
897 * doesn't queue we report only CLD_STOPPED, as if the next
898 * CLD_CONTINUED was dropped.
901 if (signal
->flags
& SIGNAL_STOP_STOPPED
)
902 why
|= SIGNAL_CLD_CONTINUED
;
903 else if (signal
->group_stop_count
)
904 why
|= SIGNAL_CLD_STOPPED
;
908 * The first thread which returns from do_signal_stop()
909 * will take ->siglock, notice SIGNAL_CLD_MASK, and
910 * notify its parent. See get_signal_to_deliver().
912 signal
->flags
= why
| SIGNAL_STOP_CONTINUED
;
913 signal
->group_stop_count
= 0;
914 signal
->group_exit_code
= 0;
918 return !sig_ignored(p
, sig
, from_ancestor_ns
);
922 * Test if P wants to take SIG. After we've checked all threads with this,
923 * it's equivalent to finding no threads not blocking SIG. Any threads not
924 * blocking SIG were ruled out because they are not running and already
925 * have pending signals. Such threads will dequeue from the shared queue
926 * as soon as they're available, so putting the signal on the shared queue
927 * will be equivalent to sending it to one such thread.
929 static inline int wants_signal(int sig
, struct task_struct
*p
)
931 if (sigismember(&p
->blocked
, sig
))
933 if (p
->flags
& PF_EXITING
)
937 if (task_is_stopped_or_traced(p
))
939 return task_curr(p
) || !signal_pending(p
);
942 static void complete_signal(int sig
, struct task_struct
*p
, int group
)
944 struct signal_struct
*signal
= p
->signal
;
945 struct task_struct
*t
;
948 * Now find a thread we can wake up to take the signal off the queue.
950 * If the main thread wants the signal, it gets first crack.
951 * Probably the least surprising to the average bear.
953 if (wants_signal(sig
, p
))
955 else if (!group
|| thread_group_empty(p
))
957 * There is just one thread and it does not need to be woken.
958 * It will dequeue unblocked signals before it runs again.
963 * Otherwise try to find a suitable thread.
965 t
= signal
->curr_target
;
966 while (!wants_signal(sig
, t
)) {
968 if (t
== signal
->curr_target
)
970 * No thread needs to be woken.
971 * Any eligible threads will see
972 * the signal in the queue soon.
976 signal
->curr_target
= t
;
980 * Found a killable thread. If the signal will be fatal,
981 * then start taking the whole group down immediately.
983 if (sig_fatal(p
, sig
) &&
984 !(signal
->flags
& (SIGNAL_UNKILLABLE
| SIGNAL_GROUP_EXIT
)) &&
985 !sigismember(&t
->real_blocked
, sig
) &&
986 (sig
== SIGKILL
|| !t
->ptrace
)) {
988 * This signal will be fatal to the whole group.
990 if (!sig_kernel_coredump(sig
)) {
992 * Start a group exit and wake everybody up.
993 * This way we don't have other threads
994 * running and doing things after a slower
995 * thread has the fatal signal pending.
997 signal
->flags
= SIGNAL_GROUP_EXIT
;
998 signal
->group_exit_code
= sig
;
999 signal
->group_stop_count
= 0;
1002 task_clear_jobctl_pending(t
, JOBCTL_PENDING_MASK
);
1003 sigaddset(&t
->pending
.signal
, SIGKILL
);
1004 signal_wake_up(t
, 1);
1005 } while_each_thread(p
, t
);
1011 * The signal is already in the shared-pending queue.
1012 * Tell the chosen thread to wake up and dequeue it.
1014 signal_wake_up(t
, sig
== SIGKILL
);
1018 static inline int legacy_queue(struct sigpending
*signals
, int sig
)
1020 return (sig
< SIGRTMIN
) && sigismember(&signals
->signal
, sig
);
1024 * map the uid in struct cred into user namespace *ns
1026 static inline uid_t
map_cred_ns(const struct cred
*cred
,
1027 struct user_namespace
*ns
)
1029 return user_ns_map_uid(ns
, cred
, cred
->uid
);
1032 #ifdef CONFIG_USER_NS
1033 static inline void userns_fixup_signal_uid(struct siginfo
*info
, struct task_struct
*t
)
1035 if (current_user_ns() == task_cred_xxx(t
, user_ns
))
1038 if (SI_FROMKERNEL(info
))
1041 info
->si_uid
= user_ns_map_uid(task_cred_xxx(t
, user_ns
),
1042 current_cred(), info
->si_uid
);
1045 static inline void userns_fixup_signal_uid(struct siginfo
*info
, struct task_struct
*t
)
1051 static int __send_signal(int sig
, struct siginfo
*info
, struct task_struct
*t
,
1052 int group
, int from_ancestor_ns
)
1054 struct sigpending
*pending
;
1056 int override_rlimit
;
1058 trace_signal_generate(sig
, info
, t
);
1060 assert_spin_locked(&t
->sighand
->siglock
);
1062 if (!prepare_signal(sig
, t
, from_ancestor_ns
))
1065 pending
= group
? &t
->signal
->shared_pending
: &t
->pending
;
1067 * Short-circuit ignored signals and support queuing
1068 * exactly one non-rt signal, so that we can get more
1069 * detailed information about the cause of the signal.
1071 if (legacy_queue(pending
, sig
))
1074 * fast-pathed signals for kernel-internal things like SIGSTOP
1077 if (info
== SEND_SIG_FORCED
)
1081 * Real-time signals must be queued if sent by sigqueue, or
1082 * some other real-time mechanism. It is implementation
1083 * defined whether kill() does so. We attempt to do so, on
1084 * the principle of least surprise, but since kill is not
1085 * allowed to fail with EAGAIN when low on memory we just
1086 * make sure at least one signal gets delivered and don't
1087 * pass on the info struct.
1090 override_rlimit
= (is_si_special(info
) || info
->si_code
>= 0);
1092 override_rlimit
= 0;
1094 q
= __sigqueue_alloc(sig
, t
, GFP_ATOMIC
| __GFP_NOTRACK_FALSE_POSITIVE
,
1097 list_add_tail(&q
->list
, &pending
->list
);
1098 switch ((unsigned long) info
) {
1099 case (unsigned long) SEND_SIG_NOINFO
:
1100 q
->info
.si_signo
= sig
;
1101 q
->info
.si_errno
= 0;
1102 q
->info
.si_code
= SI_USER
;
1103 q
->info
.si_pid
= task_tgid_nr_ns(current
,
1104 task_active_pid_ns(t
));
1105 q
->info
.si_uid
= current_uid();
1107 case (unsigned long) SEND_SIG_PRIV
:
1108 q
->info
.si_signo
= sig
;
1109 q
->info
.si_errno
= 0;
1110 q
->info
.si_code
= SI_KERNEL
;
1115 copy_siginfo(&q
->info
, info
);
1116 if (from_ancestor_ns
)
1121 userns_fixup_signal_uid(&q
->info
, t
);
1123 } else if (!is_si_special(info
)) {
1124 if (sig
>= SIGRTMIN
&& info
->si_code
!= SI_USER
) {
1126 * Queue overflow, abort. We may abort if the
1127 * signal was rt and sent by user using something
1128 * other than kill().
1130 trace_signal_overflow_fail(sig
, group
, info
);
1134 * This is a silent loss of information. We still
1135 * send the signal, but the *info bits are lost.
1137 trace_signal_lose_info(sig
, group
, info
);
1142 signalfd_notify(t
, sig
);
1143 sigaddset(&pending
->signal
, sig
);
1144 complete_signal(sig
, t
, group
);
1148 static int send_signal(int sig
, struct siginfo
*info
, struct task_struct
*t
,
1151 int from_ancestor_ns
= 0;
1153 #ifdef CONFIG_PID_NS
1154 from_ancestor_ns
= si_fromuser(info
) &&
1155 !task_pid_nr_ns(current
, task_active_pid_ns(t
));
1158 return __send_signal(sig
, info
, t
, group
, from_ancestor_ns
);
1161 static void print_fatal_signal(struct pt_regs
*regs
, int signr
)
1163 printk("%s/%d: potentially unexpected fatal signal %d.\n",
1164 current
->comm
, task_pid_nr(current
), signr
);
1166 #if defined(__i386__) && !defined(__arch_um__)
1167 printk("code at %08lx: ", regs
->ip
);
1170 for (i
= 0; i
< 16; i
++) {
1173 if (get_user(insn
, (unsigned char *)(regs
->ip
+ i
)))
1175 printk("%02x ", insn
);
1185 static int __init
setup_print_fatal_signals(char *str
)
1187 get_option (&str
, &print_fatal_signals
);
1192 __setup("print-fatal-signals=", setup_print_fatal_signals
);
1195 __group_send_sig_info(int sig
, struct siginfo
*info
, struct task_struct
*p
)
1197 return send_signal(sig
, info
, p
, 1);
1201 specific_send_sig_info(int sig
, struct siginfo
*info
, struct task_struct
*t
)
1203 return send_signal(sig
, info
, t
, 0);
1206 int do_send_sig_info(int sig
, struct siginfo
*info
, struct task_struct
*p
,
1209 unsigned long flags
;
1212 if (lock_task_sighand(p
, &flags
)) {
1213 ret
= send_signal(sig
, info
, p
, group
);
1214 unlock_task_sighand(p
, &flags
);
1221 * Force a signal that the process can't ignore: if necessary
1222 * we unblock the signal and change any SIG_IGN to SIG_DFL.
1224 * Note: If we unblock the signal, we always reset it to SIG_DFL,
1225 * since we do not want to have a signal handler that was blocked
1226 * be invoked when user space had explicitly blocked it.
1228 * We don't want to have recursive SIGSEGV's etc, for example,
1229 * that is why we also clear SIGNAL_UNKILLABLE.
1232 force_sig_info(int sig
, struct siginfo
*info
, struct task_struct
*t
)
1234 unsigned long int flags
;
1235 int ret
, blocked
, ignored
;
1236 struct k_sigaction
*action
;
1238 spin_lock_irqsave(&t
->sighand
->siglock
, flags
);
1239 action
= &t
->sighand
->action
[sig
-1];
1240 ignored
= action
->sa
.sa_handler
== SIG_IGN
;
1241 blocked
= sigismember(&t
->blocked
, sig
);
1242 if (blocked
|| ignored
) {
1243 action
->sa
.sa_handler
= SIG_DFL
;
1245 sigdelset(&t
->blocked
, sig
);
1246 recalc_sigpending_and_wake(t
);
1249 if (action
->sa
.sa_handler
== SIG_DFL
)
1250 t
->signal
->flags
&= ~SIGNAL_UNKILLABLE
;
1251 ret
= specific_send_sig_info(sig
, info
, t
);
1252 spin_unlock_irqrestore(&t
->sighand
->siglock
, flags
);
1258 * Nuke all other threads in the group.
1260 int zap_other_threads(struct task_struct
*p
)
1262 struct task_struct
*t
= p
;
1265 p
->signal
->group_stop_count
= 0;
1267 while_each_thread(p
, t
) {
1268 task_clear_jobctl_pending(t
, JOBCTL_PENDING_MASK
);
1271 /* Don't bother with already dead threads */
1274 sigaddset(&t
->pending
.signal
, SIGKILL
);
1275 signal_wake_up(t
, 1);
1281 struct sighand_struct
*__lock_task_sighand(struct task_struct
*tsk
,
1282 unsigned long *flags
)
1284 struct sighand_struct
*sighand
;
1287 local_irq_save(*flags
);
1289 sighand
= rcu_dereference(tsk
->sighand
);
1290 if (unlikely(sighand
== NULL
)) {
1292 local_irq_restore(*flags
);
1296 spin_lock(&sighand
->siglock
);
1297 if (likely(sighand
== tsk
->sighand
)) {
1301 spin_unlock(&sighand
->siglock
);
1303 local_irq_restore(*flags
);
1310 * send signal info to all the members of a group
1312 int group_send_sig_info(int sig
, struct siginfo
*info
, struct task_struct
*p
)
1317 ret
= check_kill_permission(sig
, info
, p
);
1321 ret
= do_send_sig_info(sig
, info
, p
, true);
1327 * __kill_pgrp_info() sends a signal to a process group: this is what the tty
1328 * control characters do (^C, ^Z etc)
1329 * - the caller must hold at least a readlock on tasklist_lock
1331 int __kill_pgrp_info(int sig
, struct siginfo
*info
, struct pid
*pgrp
)
1333 struct task_struct
*p
= NULL
;
1334 int retval
, success
;
1338 do_each_pid_task(pgrp
, PIDTYPE_PGID
, p
) {
1339 int err
= group_send_sig_info(sig
, info
, p
);
1342 } while_each_pid_task(pgrp
, PIDTYPE_PGID
, p
);
1343 return success
? 0 : retval
;
1346 int kill_pid_info(int sig
, struct siginfo
*info
, struct pid
*pid
)
1349 struct task_struct
*p
;
1353 p
= pid_task(pid
, PIDTYPE_PID
);
1355 error
= group_send_sig_info(sig
, info
, p
);
1356 if (unlikely(error
== -ESRCH
))
1358 * The task was unhashed in between, try again.
1359 * If it is dead, pid_task() will return NULL,
1360 * if we race with de_thread() it will find the
1370 int kill_proc_info(int sig
, struct siginfo
*info
, pid_t pid
)
1374 error
= kill_pid_info(sig
, info
, find_vpid(pid
));
1379 static int kill_as_cred_perm(const struct cred
*cred
,
1380 struct task_struct
*target
)
1382 const struct cred
*pcred
= __task_cred(target
);
1383 if (cred
->user_ns
!= pcred
->user_ns
)
1385 if (cred
->euid
!= pcred
->suid
&& cred
->euid
!= pcred
->uid
&&
1386 cred
->uid
!= pcred
->suid
&& cred
->uid
!= pcred
->uid
)
1391 /* like kill_pid_info(), but doesn't use uid/euid of "current" */
1392 int kill_pid_info_as_cred(int sig
, struct siginfo
*info
, struct pid
*pid
,
1393 const struct cred
*cred
, u32 secid
)
1396 struct task_struct
*p
;
1397 unsigned long flags
;
1399 if (!valid_signal(sig
))
1403 p
= pid_task(pid
, PIDTYPE_PID
);
1408 if (si_fromuser(info
) && !kill_as_cred_perm(cred
, p
)) {
1412 ret
= security_task_kill(p
, info
, sig
, secid
);
1417 if (lock_task_sighand(p
, &flags
)) {
1418 ret
= __send_signal(sig
, info
, p
, 1, 0);
1419 unlock_task_sighand(p
, &flags
);
1427 EXPORT_SYMBOL_GPL(kill_pid_info_as_cred
);
1430 * kill_something_info() interprets pid in interesting ways just like kill(2).
1432 * POSIX specifies that kill(-1,sig) is unspecified, but what we have
1433 * is probably wrong. Should make it like BSD or SYSV.
1436 static int kill_something_info(int sig
, struct siginfo
*info
, pid_t pid
)
1442 ret
= kill_pid_info(sig
, info
, find_vpid(pid
));
1447 read_lock(&tasklist_lock
);
1449 ret
= __kill_pgrp_info(sig
, info
,
1450 pid
? find_vpid(-pid
) : task_pgrp(current
));
1452 int retval
= 0, count
= 0;
1453 struct task_struct
* p
;
1455 for_each_process(p
) {
1456 if (task_pid_vnr(p
) > 1 &&
1457 !same_thread_group(p
, current
)) {
1458 int err
= group_send_sig_info(sig
, info
, p
);
1464 ret
= count
? retval
: -ESRCH
;
1466 read_unlock(&tasklist_lock
);
1472 * These are for backward compatibility with the rest of the kernel source.
1475 int send_sig_info(int sig
, struct siginfo
*info
, struct task_struct
*p
)
1478 * Make sure legacy kernel users don't send in bad values
1479 * (normal paths check this in check_kill_permission).
1481 if (!valid_signal(sig
))
1484 return do_send_sig_info(sig
, info
, p
, false);
1487 #define __si_special(priv) \
1488 ((priv) ? SEND_SIG_PRIV : SEND_SIG_NOINFO)
1491 send_sig(int sig
, struct task_struct
*p
, int priv
)
1493 return send_sig_info(sig
, __si_special(priv
), p
);
1497 force_sig(int sig
, struct task_struct
*p
)
1499 force_sig_info(sig
, SEND_SIG_PRIV
, p
);
1503 * When things go south during signal handling, we
1504 * will force a SIGSEGV. And if the signal that caused
1505 * the problem was already a SIGSEGV, we'll want to
1506 * make sure we don't even try to deliver the signal..
1509 force_sigsegv(int sig
, struct task_struct
*p
)
1511 if (sig
== SIGSEGV
) {
1512 unsigned long flags
;
1513 spin_lock_irqsave(&p
->sighand
->siglock
, flags
);
1514 p
->sighand
->action
[sig
- 1].sa
.sa_handler
= SIG_DFL
;
1515 spin_unlock_irqrestore(&p
->sighand
->siglock
, flags
);
1517 force_sig(SIGSEGV
, p
);
1521 int kill_pgrp(struct pid
*pid
, int sig
, int priv
)
1525 read_lock(&tasklist_lock
);
1526 ret
= __kill_pgrp_info(sig
, __si_special(priv
), pid
);
1527 read_unlock(&tasklist_lock
);
1531 EXPORT_SYMBOL(kill_pgrp
);
/*
 * Send @sig to the process @pid; @priv selects the special siginfo cookie.
 */
int kill_pid(struct pid *pid, int sig, int priv)
{
	struct siginfo *info = __si_special(priv);

	return kill_pid_info(sig, info, pid);
}
EXPORT_SYMBOL(kill_pid);
1540 * These functions support sending signals using preallocated sigqueue
1541 * structures. This is needed "because realtime applications cannot
1542 * afford to lose notifications of asynchronous events, like timer
1543 * expirations or I/O completions". In the case of POSIX Timers
1544 * we allocate the sigqueue structure from the timer_create. If this
1545 * allocation fails we are able to report the failure to the application
1546 * with an EAGAIN error.
1548 struct sigqueue
*sigqueue_alloc(void)
1550 struct sigqueue
*q
= __sigqueue_alloc(-1, current
, GFP_KERNEL
, 0);
1553 q
->flags
|= SIGQUEUE_PREALLOC
;
1558 void sigqueue_free(struct sigqueue
*q
)
1560 unsigned long flags
;
1561 spinlock_t
*lock
= ¤t
->sighand
->siglock
;
1563 BUG_ON(!(q
->flags
& SIGQUEUE_PREALLOC
));
1565 * We must hold ->siglock while testing q->list
1566 * to serialize with collect_signal() or with
1567 * __exit_signal()->flush_sigqueue().
1569 spin_lock_irqsave(lock
, flags
);
1570 q
->flags
&= ~SIGQUEUE_PREALLOC
;
1572 * If it is queued it will be freed when dequeued,
1573 * like the "regular" sigqueue.
1575 if (!list_empty(&q
->list
))
1577 spin_unlock_irqrestore(lock
, flags
);
1583 int send_sigqueue(struct sigqueue
*q
, struct task_struct
*t
, int group
)
1585 int sig
= q
->info
.si_signo
;
1586 struct sigpending
*pending
;
1587 unsigned long flags
;
1590 BUG_ON(!(q
->flags
& SIGQUEUE_PREALLOC
));
1593 if (!likely(lock_task_sighand(t
, &flags
)))
1596 ret
= 1; /* the signal is ignored */
1597 if (!prepare_signal(sig
, t
, 0))
1601 if (unlikely(!list_empty(&q
->list
))) {
1603 * If an SI_TIMER entry is already queue just increment
1604 * the overrun count.
1606 BUG_ON(q
->info
.si_code
!= SI_TIMER
);
1607 q
->info
.si_overrun
++;
1610 q
->info
.si_overrun
= 0;
1612 signalfd_notify(t
, sig
);
1613 pending
= group
? &t
->signal
->shared_pending
: &t
->pending
;
1614 list_add_tail(&q
->list
, &pending
->list
);
1615 sigaddset(&pending
->signal
, sig
);
1616 complete_signal(sig
, t
, group
);
1618 unlock_task_sighand(t
, &flags
);
1624 * Let a parent know about the death of a child.
1625 * For a stopped/continued status change, use do_notify_parent_cldstop instead.
1627 * Returns true if our parent ignored us and so we've switched to
1630 bool do_notify_parent(struct task_struct
*tsk
, int sig
)
1632 struct siginfo info
;
1633 unsigned long flags
;
1634 struct sighand_struct
*psig
;
1635 bool autoreap
= false;
1639 /* do_notify_parent_cldstop should have been called instead. */
1640 BUG_ON(task_is_stopped_or_traced(tsk
));
1642 BUG_ON(!tsk
->ptrace
&&
1643 (tsk
->group_leader
!= tsk
|| !thread_group_empty(tsk
)));
1645 if (sig
!= SIGCHLD
) {
1647 * This is only possible if parent == real_parent.
1648 * Check if it has changed security domain.
1650 if (tsk
->parent_exec_id
!= tsk
->parent
->self_exec_id
)
1654 info
.si_signo
= sig
;
1657 * we are under tasklist_lock here so our parent is tied to
1658 * us and cannot exit and release its namespace.
1660 * the only it can is to switch its nsproxy with sys_unshare,
1661 * bu uncharing pid namespaces is not allowed, so we'll always
1662 * see relevant namespace
1664 * write_lock() currently calls preempt_disable() which is the
1665 * same as rcu_read_lock(), but according to Oleg, this is not
1666 * correct to rely on this
1669 info
.si_pid
= task_pid_nr_ns(tsk
, tsk
->parent
->nsproxy
->pid_ns
);
1670 info
.si_uid
= map_cred_ns(__task_cred(tsk
),
1671 task_cred_xxx(tsk
->parent
, user_ns
));
1674 info
.si_utime
= cputime_to_clock_t(tsk
->utime
+ tsk
->signal
->utime
);
1675 info
.si_stime
= cputime_to_clock_t(tsk
->stime
+ tsk
->signal
->stime
);
1677 info
.si_status
= tsk
->exit_code
& 0x7f;
1678 if (tsk
->exit_code
& 0x80)
1679 info
.si_code
= CLD_DUMPED
;
1680 else if (tsk
->exit_code
& 0x7f)
1681 info
.si_code
= CLD_KILLED
;
1683 info
.si_code
= CLD_EXITED
;
1684 info
.si_status
= tsk
->exit_code
>> 8;
1687 psig
= tsk
->parent
->sighand
;
1688 spin_lock_irqsave(&psig
->siglock
, flags
);
1689 if (!tsk
->ptrace
&& sig
== SIGCHLD
&&
1690 (psig
->action
[SIGCHLD
-1].sa
.sa_handler
== SIG_IGN
||
1691 (psig
->action
[SIGCHLD
-1].sa
.sa_flags
& SA_NOCLDWAIT
))) {
1693 * We are exiting and our parent doesn't care. POSIX.1
1694 * defines special semantics for setting SIGCHLD to SIG_IGN
1695 * or setting the SA_NOCLDWAIT flag: we should be reaped
1696 * automatically and not left for our parent's wait4 call.
1697 * Rather than having the parent do it as a magic kind of
1698 * signal handler, we just set this to tell do_exit that we
1699 * can be cleaned up without becoming a zombie. Note that
1700 * we still call __wake_up_parent in this case, because a
1701 * blocked sys_wait4 might now return -ECHILD.
1703 * Whether we send SIGCHLD or not for SA_NOCLDWAIT
1704 * is implementation-defined: we do (if you don't want
1705 * it, just use SIG_IGN instead).
1708 if (psig
->action
[SIGCHLD
-1].sa
.sa_handler
== SIG_IGN
)
1711 if (valid_signal(sig
) && sig
)
1712 __group_send_sig_info(sig
, &info
, tsk
->parent
);
1713 __wake_up_parent(tsk
, tsk
->parent
);
1714 spin_unlock_irqrestore(&psig
->siglock
, flags
);
1720 * do_notify_parent_cldstop - notify parent of stopped/continued state change
1721 * @tsk: task reporting the state change
1722 * @for_ptracer: the notification is for ptracer
1723 * @why: CLD_{CONTINUED|STOPPED|TRAPPED} to report
1725 * Notify @tsk's parent that the stopped/continued state has changed. If
1726 * @for_ptracer is %false, @tsk's group leader notifies to its real parent.
1727 * If %true, @tsk reports to @tsk->parent which should be the ptracer.
1730 * Must be called with tasklist_lock at least read locked.
1732 static void do_notify_parent_cldstop(struct task_struct
*tsk
,
1733 bool for_ptracer
, int why
)
1735 struct siginfo info
;
1736 unsigned long flags
;
1737 struct task_struct
*parent
;
1738 struct sighand_struct
*sighand
;
1741 parent
= tsk
->parent
;
1743 tsk
= tsk
->group_leader
;
1744 parent
= tsk
->real_parent
;
1747 info
.si_signo
= SIGCHLD
;
1750 * see comment in do_notify_parent() about the following 4 lines
1753 info
.si_pid
= task_pid_nr_ns(tsk
, parent
->nsproxy
->pid_ns
);
1754 info
.si_uid
= map_cred_ns(__task_cred(tsk
),
1755 task_cred_xxx(parent
, user_ns
));
1758 info
.si_utime
= cputime_to_clock_t(tsk
->utime
);
1759 info
.si_stime
= cputime_to_clock_t(tsk
->stime
);
1764 info
.si_status
= SIGCONT
;
1767 info
.si_status
= tsk
->signal
->group_exit_code
& 0x7f;
1770 info
.si_status
= tsk
->exit_code
& 0x7f;
1776 sighand
= parent
->sighand
;
1777 spin_lock_irqsave(&sighand
->siglock
, flags
);
1778 if (sighand
->action
[SIGCHLD
-1].sa
.sa_handler
!= SIG_IGN
&&
1779 !(sighand
->action
[SIGCHLD
-1].sa
.sa_flags
& SA_NOCLDSTOP
))
1780 __group_send_sig_info(SIGCHLD
, &info
, parent
);
1782 * Even if SIGCHLD is not generated, we must wake up wait4 calls.
1784 __wake_up_parent(tsk
, parent
);
1785 spin_unlock_irqrestore(&sighand
->siglock
, flags
);
1788 static inline int may_ptrace_stop(void)
1790 if (!likely(current
->ptrace
))
1793 * Are we in the middle of do_coredump?
1794 * If so and our tracer is also part of the coredump stopping
1795 * is a deadlock situation, and pointless because our tracer
1796 * is dead so don't allow us to stop.
1797 * If SIGKILL was already sent before the caller unlocked
1798 * ->siglock we must see ->core_state != NULL. Otherwise it
1799 * is safe to enter schedule().
1801 if (unlikely(current
->mm
->core_state
) &&
1802 unlikely(current
->mm
== current
->parent
->mm
))
1809 * Return non-zero if there is a SIGKILL that should be waking us up.
1810 * Called with the siglock held.
1812 static int sigkill_pending(struct task_struct
*tsk
)
1814 return sigismember(&tsk
->pending
.signal
, SIGKILL
) ||
1815 sigismember(&tsk
->signal
->shared_pending
.signal
, SIGKILL
);
1819 * This must be called with current->sighand->siglock held.
1821 * This should be the path for all ptrace stops.
1822 * We always set current->last_siginfo while stopped here.
1823 * That makes it a way to test a stopped process for
1824 * being ptrace-stopped vs being job-control-stopped.
1826 * If we actually decide not to stop at all because the tracer
1827 * is gone, we keep current->exit_code unless clear_code.
1829 static void ptrace_stop(int exit_code
, int why
, int clear_code
, siginfo_t
*info
)
1830 __releases(¤t
->sighand
->siglock
)
1831 __acquires(¤t
->sighand
->siglock
)
1833 bool gstop_done
= false;
1835 if (arch_ptrace_stop_needed(exit_code
, info
)) {
1837 * The arch code has something special to do before a
1838 * ptrace stop. This is allowed to block, e.g. for faults
1839 * on user stack pages. We can't keep the siglock while
1840 * calling arch_ptrace_stop, so we must release it now.
1841 * To preserve proper semantics, we must do this before
1842 * any signal bookkeeping like checking group_stop_count.
1843 * Meanwhile, a SIGKILL could come in before we retake the
1844 * siglock. That must prevent us from sleeping in TASK_TRACED.
1845 * So after regaining the lock, we must check for SIGKILL.
1847 spin_unlock_irq(¤t
->sighand
->siglock
);
1848 arch_ptrace_stop(exit_code
, info
);
1849 spin_lock_irq(¤t
->sighand
->siglock
);
1850 if (sigkill_pending(current
))
1855 * We're committing to trapping. TRACED should be visible before
1856 * TRAPPING is cleared; otherwise, the tracer might fail do_wait().
1857 * Also, transition to TRACED and updates to ->jobctl should be
1858 * atomic with respect to siglock and should be done after the arch
1859 * hook as siglock is released and regrabbed across it.
1861 set_current_state(TASK_TRACED
);
1863 current
->last_siginfo
= info
;
1864 current
->exit_code
= exit_code
;
1867 * If @why is CLD_STOPPED, we're trapping to participate in a group
1868 * stop. Do the bookkeeping. Note that if SIGCONT was delievered
1869 * across siglock relocks since INTERRUPT was scheduled, PENDING
1870 * could be clear now. We act as if SIGCONT is received after
1871 * TASK_TRACED is entered - ignore it.
1873 if (why
== CLD_STOPPED
&& (current
->jobctl
& JOBCTL_STOP_PENDING
))
1874 gstop_done
= task_participate_group_stop(current
);
1876 /* any trap clears pending STOP trap, STOP trap clears NOTIFY */
1877 task_clear_jobctl_pending(current
, JOBCTL_TRAP_STOP
);
1878 if (info
&& info
->si_code
>> 8 == PTRACE_EVENT_STOP
)
1879 task_clear_jobctl_pending(current
, JOBCTL_TRAP_NOTIFY
);
1881 /* entering a trap, clear TRAPPING */
1882 task_clear_jobctl_trapping(current
);
1884 spin_unlock_irq(¤t
->sighand
->siglock
);
1885 read_lock(&tasklist_lock
);
1886 if (may_ptrace_stop()) {
1888 * Notify parents of the stop.
1890 * While ptraced, there are two parents - the ptracer and
1891 * the real_parent of the group_leader. The ptracer should
1892 * know about every stop while the real parent is only
1893 * interested in the completion of group stop. The states
1894 * for the two don't interact with each other. Notify
1895 * separately unless they're gonna be duplicates.
1897 do_notify_parent_cldstop(current
, true, why
);
1898 if (gstop_done
&& ptrace_reparented(current
))
1899 do_notify_parent_cldstop(current
, false, why
);
1902 * Don't want to allow preemption here, because
1903 * sys_ptrace() needs this task to be inactive.
1905 * XXX: implement read_unlock_no_resched().
1908 read_unlock(&tasklist_lock
);
1909 preempt_enable_no_resched();
1913 * By the time we got the lock, our tracer went away.
1914 * Don't drop the lock yet, another tracer may come.
1916 * If @gstop_done, the ptracer went away between group stop
1917 * completion and here. During detach, it would have set
1918 * JOBCTL_STOP_PENDING on us and we'll re-enter
1919 * TASK_STOPPED in do_signal_stop() on return, so notifying
1920 * the real parent of the group stop completion is enough.
1923 do_notify_parent_cldstop(current
, false, why
);
1925 __set_current_state(TASK_RUNNING
);
1927 current
->exit_code
= 0;
1928 read_unlock(&tasklist_lock
);
1932 * While in TASK_TRACED, we were considered "frozen enough".
1933 * Now that we woke up, it's crucial if we're supposed to be
1934 * frozen that we freeze now before running anything substantial.
1939 * We are back. Now reacquire the siglock before touching
1940 * last_siginfo, so that we are sure to have synchronized with
1941 * any signal-sending on another CPU that wants to examine it.
1943 spin_lock_irq(¤t
->sighand
->siglock
);
1944 current
->last_siginfo
= NULL
;
1946 /* LISTENING can be set only during STOP traps, clear it */
1947 current
->jobctl
&= ~JOBCTL_LISTENING
;
1950 * Queued signals ignored us while we were stopped for tracing.
1951 * So check for any that we should take before resuming user mode.
1952 * This sets TIF_SIGPENDING, but never clears it.
1954 recalc_sigpending_tsk(current
);
1957 static void ptrace_do_notify(int signr
, int exit_code
, int why
)
1961 memset(&info
, 0, sizeof info
);
1962 info
.si_signo
= signr
;
1963 info
.si_code
= exit_code
;
1964 info
.si_pid
= task_pid_vnr(current
);
1965 info
.si_uid
= current_uid();
1967 /* Let the debugger run. */
1968 ptrace_stop(exit_code
, why
, 1, &info
);
1971 void ptrace_notify(int exit_code
)
1973 BUG_ON((exit_code
& (0x7f | ~0xffff)) != SIGTRAP
);
1975 spin_lock_irq(¤t
->sighand
->siglock
);
1976 ptrace_do_notify(SIGTRAP
, exit_code
, CLD_TRAPPED
);
1977 spin_unlock_irq(¤t
->sighand
->siglock
);
1981 * do_signal_stop - handle group stop for SIGSTOP and other stop signals
1982 * @signr: signr causing group stop if initiating
1984 * If %JOBCTL_STOP_PENDING is not set yet, initiate group stop with @signr
1985 * and participate in it. If already set, participate in the existing
1986 * group stop. If participated in a group stop (and thus slept), %true is
1987 * returned with siglock released.
1989 * If ptraced, this function doesn't handle stop itself. Instead,
1990 * %JOBCTL_TRAP_STOP is scheduled and %false is returned with siglock
1991 * untouched. The caller must ensure that INTERRUPT trap handling takes
1992 * places afterwards.
1995 * Must be called with @current->sighand->siglock held, which is released
1999 * %false if group stop is already cancelled or ptrace trap is scheduled.
2000 * %true if participated in group stop.
2002 static bool do_signal_stop(int signr
)
2003 __releases(¤t
->sighand
->siglock
)
2005 struct signal_struct
*sig
= current
->signal
;
2007 if (!(current
->jobctl
& JOBCTL_STOP_PENDING
)) {
2008 unsigned int gstop
= JOBCTL_STOP_PENDING
| JOBCTL_STOP_CONSUME
;
2009 struct task_struct
*t
;
2011 /* signr will be recorded in task->jobctl for retries */
2012 WARN_ON_ONCE(signr
& ~JOBCTL_STOP_SIGMASK
);
2014 if (!likely(current
->jobctl
& JOBCTL_STOP_DEQUEUED
) ||
2015 unlikely(signal_group_exit(sig
)))
2018 * There is no group stop already in progress. We must
2021 * While ptraced, a task may be resumed while group stop is
2022 * still in effect and then receive a stop signal and
2023 * initiate another group stop. This deviates from the
2024 * usual behavior as two consecutive stop signals can't
2025 * cause two group stops when !ptraced. That is why we
2026 * also check !task_is_stopped(t) below.
2028 * The condition can be distinguished by testing whether
2029 * SIGNAL_STOP_STOPPED is already set. Don't generate
2030 * group_exit_code in such case.
2032 * This is not necessary for SIGNAL_STOP_CONTINUED because
2033 * an intervening stop signal is required to cause two
2034 * continued events regardless of ptrace.
2036 if (!(sig
->flags
& SIGNAL_STOP_STOPPED
))
2037 sig
->group_exit_code
= signr
;
2039 sig
->group_stop_count
= 0;
2041 if (task_set_jobctl_pending(current
, signr
| gstop
))
2042 sig
->group_stop_count
++;
2044 for (t
= next_thread(current
); t
!= current
;
2045 t
= next_thread(t
)) {
2047 * Setting state to TASK_STOPPED for a group
2048 * stop is always done with the siglock held,
2049 * so this check has no races.
2051 if (!task_is_stopped(t
) &&
2052 task_set_jobctl_pending(t
, signr
| gstop
)) {
2053 sig
->group_stop_count
++;
2054 if (likely(!(t
->ptrace
& PT_SEIZED
)))
2055 signal_wake_up(t
, 0);
2057 ptrace_trap_notify(t
);
2062 if (likely(!current
->ptrace
)) {
2066 * If there are no other threads in the group, or if there
2067 * is a group stop in progress and we are the last to stop,
2068 * report to the parent.
2070 if (task_participate_group_stop(current
))
2071 notify
= CLD_STOPPED
;
2073 __set_current_state(TASK_STOPPED
);
2074 spin_unlock_irq(¤t
->sighand
->siglock
);
2077 * Notify the parent of the group stop completion. Because
2078 * we're not holding either the siglock or tasklist_lock
2079 * here, ptracer may attach inbetween; however, this is for
2080 * group stop and should always be delivered to the real
2081 * parent of the group leader. The new ptracer will get
2082 * its notification when this task transitions into
2086 read_lock(&tasklist_lock
);
2087 do_notify_parent_cldstop(current
, false, notify
);
2088 read_unlock(&tasklist_lock
);
2091 /* Now we don't run again until woken by SIGCONT or SIGKILL */
2096 * While ptraced, group stop is handled by STOP trap.
2097 * Schedule it and let the caller deal with it.
2099 task_set_jobctl_pending(current
, JOBCTL_TRAP_STOP
);
2105 * do_jobctl_trap - take care of ptrace jobctl traps
2107 * When PT_SEIZED, it's used for both group stop and explicit
2108 * SEIZE/INTERRUPT traps. Both generate PTRACE_EVENT_STOP trap with
2109 * accompanying siginfo. If stopped, lower eight bits of exit_code contain
2110 * the stop signal; otherwise, %SIGTRAP.
2112 * When !PT_SEIZED, it's used only for group stop trap with stop signal
2113 * number as exit_code and no siginfo.
2116 * Must be called with @current->sighand->siglock held, which may be
2117 * released and re-acquired before returning with intervening sleep.
2119 static void do_jobctl_trap(void)
2121 struct signal_struct
*signal
= current
->signal
;
2122 int signr
= current
->jobctl
& JOBCTL_STOP_SIGMASK
;
2124 if (current
->ptrace
& PT_SEIZED
) {
2125 if (!signal
->group_stop_count
&&
2126 !(signal
->flags
& SIGNAL_STOP_STOPPED
))
2128 WARN_ON_ONCE(!signr
);
2129 ptrace_do_notify(signr
, signr
| (PTRACE_EVENT_STOP
<< 8),
2132 WARN_ON_ONCE(!signr
);
2133 ptrace_stop(signr
, CLD_STOPPED
, 0, NULL
);
2134 current
->exit_code
= 0;
2138 static int ptrace_signal(int signr
, siginfo_t
*info
,
2139 struct pt_regs
*regs
, void *cookie
)
2141 ptrace_signal_deliver(regs
, cookie
);
2143 * We do not check sig_kernel_stop(signr) but set this marker
2144 * unconditionally because we do not know whether debugger will
2145 * change signr. This flag has no meaning unless we are going
2146 * to stop after return from ptrace_stop(). In this case it will
2147 * be checked in do_signal_stop(), we should only stop if it was
2148 * not cleared by SIGCONT while we were sleeping. See also the
2149 * comment in dequeue_signal().
2151 current
->jobctl
|= JOBCTL_STOP_DEQUEUED
;
2152 ptrace_stop(signr
, CLD_TRAPPED
, 0, info
);
2154 /* We're back. Did the debugger cancel the sig? */
2155 signr
= current
->exit_code
;
2159 current
->exit_code
= 0;
2162 * Update the siginfo structure if the signal has
2163 * changed. If the debugger wanted something
2164 * specific in the siginfo structure then it should
2165 * have updated *info via PTRACE_SETSIGINFO.
2167 if (signr
!= info
->si_signo
) {
2168 info
->si_signo
= signr
;
2170 info
->si_code
= SI_USER
;
2172 info
->si_pid
= task_pid_vnr(current
->parent
);
2173 info
->si_uid
= map_cred_ns(__task_cred(current
->parent
),
2178 /* If the (new) signal is now blocked, requeue it. */
2179 if (sigismember(¤t
->blocked
, signr
)) {
2180 specific_send_sig_info(signr
, info
, current
);
2187 int get_signal_to_deliver(siginfo_t
*info
, struct k_sigaction
*return_ka
,
2188 struct pt_regs
*regs
, void *cookie
)
2190 struct sighand_struct
*sighand
= current
->sighand
;
2191 struct signal_struct
*signal
= current
->signal
;
2196 * We'll jump back here after any time we were stopped in TASK_STOPPED.
2197 * While in TASK_STOPPED, we were considered "frozen enough".
2198 * Now that we woke up, it's crucial if we're supposed to be
2199 * frozen that we freeze now before running anything substantial.
2203 spin_lock_irq(&sighand
->siglock
);
2205 * Every stopped thread goes here after wakeup. Check to see if
2206 * we should notify the parent, prepare_signal(SIGCONT) encodes
2207 * the CLD_ si_code into SIGNAL_CLD_MASK bits.
2209 if (unlikely(signal
->flags
& SIGNAL_CLD_MASK
)) {
2212 if (signal
->flags
& SIGNAL_CLD_CONTINUED
)
2213 why
= CLD_CONTINUED
;
2217 signal
->flags
&= ~SIGNAL_CLD_MASK
;
2219 spin_unlock_irq(&sighand
->siglock
);
2222 * Notify the parent that we're continuing. This event is
2223 * always per-process and doesn't make whole lot of sense
2224 * for ptracers, who shouldn't consume the state via
2225 * wait(2) either, but, for backward compatibility, notify
2226 * the ptracer of the group leader too unless it's gonna be
2229 read_lock(&tasklist_lock
);
2230 do_notify_parent_cldstop(current
, false, why
);
2232 if (ptrace_reparented(current
->group_leader
))
2233 do_notify_parent_cldstop(current
->group_leader
,
2235 read_unlock(&tasklist_lock
);
2241 struct k_sigaction
*ka
;
2243 if (unlikely(current
->jobctl
& JOBCTL_STOP_PENDING
) &&
2247 if (unlikely(current
->jobctl
& JOBCTL_TRAP_MASK
)) {
2249 spin_unlock_irq(&sighand
->siglock
);
2253 signr
= dequeue_signal(current
, ¤t
->blocked
, info
);
2256 break; /* will return 0 */
2258 if (unlikely(current
->ptrace
) && signr
!= SIGKILL
) {
2259 signr
= ptrace_signal(signr
, info
,
2265 ka
= &sighand
->action
[signr
-1];
2267 /* Trace actually delivered signals. */
2268 trace_signal_deliver(signr
, info
, ka
);
2270 if (ka
->sa
.sa_handler
== SIG_IGN
) /* Do nothing. */
2272 if (ka
->sa
.sa_handler
!= SIG_DFL
) {
2273 /* Run the handler. */
2276 if (ka
->sa
.sa_flags
& SA_ONESHOT
)
2277 ka
->sa
.sa_handler
= SIG_DFL
;
2279 break; /* will return non-zero "signr" value */
2283 * Now we are doing the default action for this signal.
2285 if (sig_kernel_ignore(signr
)) /* Default is nothing. */
2289 * Global init gets no signals it doesn't want.
2290 * Container-init gets no signals it doesn't want from same
2293 * Note that if global/container-init sees a sig_kernel_only()
2294 * signal here, the signal must have been generated internally
2295 * or must have come from an ancestor namespace. In either
2296 * case, the signal cannot be dropped.
2298 if (unlikely(signal
->flags
& SIGNAL_UNKILLABLE
) &&
2299 !sig_kernel_only(signr
))
2302 if (sig_kernel_stop(signr
)) {
2304 * The default action is to stop all threads in
2305 * the thread group. The job control signals
2306 * do nothing in an orphaned pgrp, but SIGSTOP
2307 * always works. Note that siglock needs to be
2308 * dropped during the call to is_orphaned_pgrp()
2309 * because of lock ordering with tasklist_lock.
2310 * This allows an intervening SIGCONT to be posted.
2311 * We need to check for that and bail out if necessary.
2313 if (signr
!= SIGSTOP
) {
2314 spin_unlock_irq(&sighand
->siglock
);
2316 /* signals can be posted during this window */
2318 if (is_current_pgrp_orphaned())
2321 spin_lock_irq(&sighand
->siglock
);
2324 if (likely(do_signal_stop(info
->si_signo
))) {
2325 /* It released the siglock. */
2330 * We didn't actually stop, due to a race
2331 * with SIGCONT or something like that.
2336 spin_unlock_irq(&sighand
->siglock
);
2339 * Anything else is fatal, maybe with a core dump.
2341 current
->flags
|= PF_SIGNALED
;
2343 if (sig_kernel_coredump(signr
)) {
2344 if (print_fatal_signals
)
2345 print_fatal_signal(regs
, info
->si_signo
);
2347 * If it was able to dump core, this kills all
2348 * other threads in the group and synchronizes with
2349 * their demise. If we lost the race with another
2350 * thread getting here, it set group_exit_code
2351 * first and our do_group_exit call below will use
2352 * that value and ignore the one we pass it.
2354 do_coredump(info
->si_signo
, info
->si_signo
, regs
);
2358 * Death signals, no core dump.
2360 do_group_exit(info
->si_signo
);
2363 spin_unlock_irq(&sighand
->siglock
);
2368 * block_sigmask - add @ka's signal mask to current->blocked
2369 * @ka: action for @signr
2370 * @signr: signal that has been successfully delivered
2372 * This function should be called when a signal has succesfully been
2373 * delivered. It adds the mask of signals for @ka to current->blocked
2374 * so that they are blocked during the execution of the signal
2375 * handler. In addition, @signr will be blocked unless %SA_NODEFER is
2376 * set in @ka->sa.sa_flags.
2378 void block_sigmask(struct k_sigaction
*ka
, int signr
)
2382 sigorsets(&blocked
, ¤t
->blocked
, &ka
->sa
.sa_mask
);
2383 if (!(ka
->sa
.sa_flags
& SA_NODEFER
))
2384 sigaddset(&blocked
, signr
);
2385 set_current_blocked(&blocked
);
2389 * It could be that complete_signal() picked us to notify about the
2390 * group-wide signal. Other threads should be notified now to take
2391 * the shared signals in @which since we will not.
2393 static void retarget_shared_pending(struct task_struct
*tsk
, sigset_t
*which
)
2396 struct task_struct
*t
;
2398 sigandsets(&retarget
, &tsk
->signal
->shared_pending
.signal
, which
);
2399 if (sigisemptyset(&retarget
))
2403 while_each_thread(tsk
, t
) {
2404 if (t
->flags
& PF_EXITING
)
2407 if (!has_pending_signals(&retarget
, &t
->blocked
))
2409 /* Remove the signals this thread can handle. */
2410 sigandsets(&retarget
, &retarget
, &t
->blocked
);
2412 if (!signal_pending(t
))
2413 signal_wake_up(t
, 0);
2415 if (sigisemptyset(&retarget
))
2420 void exit_signals(struct task_struct
*tsk
)
2426 * @tsk is about to have PF_EXITING set - lock out users which
2427 * expect stable threadgroup.
2429 threadgroup_change_begin(tsk
);
2431 if (thread_group_empty(tsk
) || signal_group_exit(tsk
->signal
)) {
2432 tsk
->flags
|= PF_EXITING
;
2433 threadgroup_change_end(tsk
);
2437 spin_lock_irq(&tsk
->sighand
->siglock
);
2439 * From now this task is not visible for group-wide signals,
2440 * see wants_signal(), do_signal_stop().
2442 tsk
->flags
|= PF_EXITING
;
2444 threadgroup_change_end(tsk
);
2446 if (!signal_pending(tsk
))
2449 unblocked
= tsk
->blocked
;
2450 signotset(&unblocked
);
2451 retarget_shared_pending(tsk
, &unblocked
);
2453 if (unlikely(tsk
->jobctl
& JOBCTL_STOP_PENDING
) &&
2454 task_participate_group_stop(tsk
))
2455 group_stop
= CLD_STOPPED
;
2457 spin_unlock_irq(&tsk
->sighand
->siglock
);
2460 * If group stop has completed, deliver the notification. This
2461 * should always go to the real parent of the group leader.
2463 if (unlikely(group_stop
)) {
2464 read_lock(&tasklist_lock
);
2465 do_notify_parent_cldstop(tsk
, false, group_stop
);
2466 read_unlock(&tasklist_lock
);
/* Signal helpers exported for use by modules. */
EXPORT_SYMBOL(recalc_sigpending);
EXPORT_SYMBOL_GPL(dequeue_signal);
EXPORT_SYMBOL(flush_signals);
EXPORT_SYMBOL(force_sig);
EXPORT_SYMBOL(send_sig);
EXPORT_SYMBOL(send_sig_info);
EXPORT_SYMBOL(sigprocmask);
EXPORT_SYMBOL(block_all_signals);
EXPORT_SYMBOL(unblock_all_signals);
2482 * System call entry points.
2486 * sys_restart_syscall - restart a system call
2488 SYSCALL_DEFINE0(restart_syscall
)
2490 struct restart_block
*restart
= ¤t_thread_info()->restart_block
;
2491 return restart
->fn(restart
);
2494 long do_no_restart_syscall(struct restart_block
*param
)
2499 static void __set_task_blocked(struct task_struct
*tsk
, const sigset_t
*newset
)
2501 if (signal_pending(tsk
) && !thread_group_empty(tsk
)) {
2502 sigset_t newblocked
;
2503 /* A set of now blocked but previously unblocked signals. */
2504 sigandnsets(&newblocked
, newset
, ¤t
->blocked
);
2505 retarget_shared_pending(tsk
, &newblocked
);
2507 tsk
->blocked
= *newset
;
2508 recalc_sigpending();
2512 * set_current_blocked - change current->blocked mask
2515 * It is wrong to change ->blocked directly, this helper should be used
2516 * to ensure the process can't miss a shared signal we are going to block.
2518 void set_current_blocked(const sigset_t
*newset
)
2520 struct task_struct
*tsk
= current
;
2522 spin_lock_irq(&tsk
->sighand
->siglock
);
2523 __set_task_blocked(tsk
, newset
);
2524 spin_unlock_irq(&tsk
->sighand
->siglock
);
2528 * This is also useful for kernel threads that want to temporarily
2529 * (or permanently) block certain signals.
2531 * NOTE! Unlike the user-mode sys_sigprocmask(), the kernel
2532 * interface happily blocks "unblockable" signals like SIGKILL
2535 int sigprocmask(int how
, sigset_t
*set
, sigset_t
*oldset
)
2537 struct task_struct
*tsk
= current
;
2540 /* Lockless, only current can change ->blocked, never from irq */
2542 *oldset
= tsk
->blocked
;
2546 sigorsets(&newset
, &tsk
->blocked
, set
);
2549 sigandnsets(&newset
, &tsk
->blocked
, set
);
2558 set_current_blocked(&newset
);
2563 * sys_rt_sigprocmask - change the list of currently blocked signals
2564 * @how: whether to add, remove, or set signals
2565 * @nset: stores pending signals
2566 * @oset: previous value of signal mask if non-null
2567 * @sigsetsize: size of sigset_t type
2569 SYSCALL_DEFINE4(rt_sigprocmask
, int, how
, sigset_t __user
*, nset
,
2570 sigset_t __user
*, oset
, size_t, sigsetsize
)
2572 sigset_t old_set
, new_set
;
2575 /* XXX: Don't preclude handling different sized sigset_t's. */
2576 if (sigsetsize
!= sizeof(sigset_t
))
2579 old_set
= current
->blocked
;
2582 if (copy_from_user(&new_set
, nset
, sizeof(sigset_t
)))
2584 sigdelsetmask(&new_set
, sigmask(SIGKILL
)|sigmask(SIGSTOP
));
2586 error
= sigprocmask(how
, &new_set
, NULL
);
2592 if (copy_to_user(oset
, &old_set
, sizeof(sigset_t
)))
2599 long do_sigpending(void __user
*set
, unsigned long sigsetsize
)
2601 long error
= -EINVAL
;
2604 if (sigsetsize
> sizeof(sigset_t
))
2607 spin_lock_irq(¤t
->sighand
->siglock
);
2608 sigorsets(&pending
, ¤t
->pending
.signal
,
2609 ¤t
->signal
->shared_pending
.signal
);
2610 spin_unlock_irq(¤t
->sighand
->siglock
);
2612 /* Outside the lock because only this thread touches it. */
2613 sigandsets(&pending
, ¤t
->blocked
, &pending
);
2616 if (!copy_to_user(set
, &pending
, sigsetsize
))
2624 * sys_rt_sigpending - examine a pending signal that has been raised
2626 * @set: stores pending signals
2627 * @sigsetsize: size of sigset_t type or larger
2629 SYSCALL_DEFINE2(rt_sigpending
, sigset_t __user
*, set
, size_t, sigsetsize
)
2631 return do_sigpending(set
, sigsetsize
);
2634 #ifndef HAVE_ARCH_COPY_SIGINFO_TO_USER
2636 int copy_siginfo_to_user(siginfo_t __user
*to
, siginfo_t
*from
)
2640 if (!access_ok (VERIFY_WRITE
, to
, sizeof(siginfo_t
)))
2642 if (from
->si_code
< 0)
2643 return __copy_to_user(to
, from
, sizeof(siginfo_t
))
2646 * If you change siginfo_t structure, please be sure
2647 * this code is fixed accordingly.
2648 * Please remember to update the signalfd_copyinfo() function
2649 * inside fs/signalfd.c too, in case siginfo_t changes.
2650 * It should never copy any pad contained in the structure
2651 * to avoid security leaks, but must copy the generic
2652 * 3 ints plus the relevant union member.
2654 err
= __put_user(from
->si_signo
, &to
->si_signo
);
2655 err
|= __put_user(from
->si_errno
, &to
->si_errno
);
2656 err
|= __put_user((short)from
->si_code
, &to
->si_code
);
2657 switch (from
->si_code
& __SI_MASK
) {
2659 err
|= __put_user(from
->si_pid
, &to
->si_pid
);
2660 err
|= __put_user(from
->si_uid
, &to
->si_uid
);
2663 err
|= __put_user(from
->si_tid
, &to
->si_tid
);
2664 err
|= __put_user(from
->si_overrun
, &to
->si_overrun
);
2665 err
|= __put_user(from
->si_ptr
, &to
->si_ptr
);
2668 err
|= __put_user(from
->si_band
, &to
->si_band
);
2669 err
|= __put_user(from
->si_fd
, &to
->si_fd
);
2672 err
|= __put_user(from
->si_addr
, &to
->si_addr
);
2673 #ifdef __ARCH_SI_TRAPNO
2674 err
|= __put_user(from
->si_trapno
, &to
->si_trapno
);
2676 #ifdef BUS_MCEERR_AO
2678 * Other callers might not initialize the si_lsb field,
2679 * so check explicitly for the right codes here.
2681 if (from
->si_code
== BUS_MCEERR_AR
|| from
->si_code
== BUS_MCEERR_AO
)
2682 err
|= __put_user(from
->si_addr_lsb
, &to
->si_addr_lsb
);
2686 err
|= __put_user(from
->si_pid
, &to
->si_pid
);
2687 err
|= __put_user(from
->si_uid
, &to
->si_uid
);
2688 err
|= __put_user(from
->si_status
, &to
->si_status
);
2689 err
|= __put_user(from
->si_utime
, &to
->si_utime
);
2690 err
|= __put_user(from
->si_stime
, &to
->si_stime
);
2692 case __SI_RT
: /* This is not generated by the kernel as of now. */
2693 case __SI_MESGQ
: /* But this is */
2694 err
|= __put_user(from
->si_pid
, &to
->si_pid
);
2695 err
|= __put_user(from
->si_uid
, &to
->si_uid
);
2696 err
|= __put_user(from
->si_ptr
, &to
->si_ptr
);
2698 default: /* this is just in case for now ... */
2699 err
|= __put_user(from
->si_pid
, &to
->si_pid
);
2700 err
|= __put_user(from
->si_uid
, &to
->si_uid
);
2709 * do_sigtimedwait - wait for queued signals specified in @which
2710 * @which: queued signals to wait for
2711 * @info: if non-null, the signal's siginfo is returned here
2712 * @ts: upper bound on process time suspension
2714 int do_sigtimedwait(const sigset_t
*which
, siginfo_t
*info
,
2715 const struct timespec
*ts
)
2717 struct task_struct
*tsk
= current
;
2718 long timeout
= MAX_SCHEDULE_TIMEOUT
;
2719 sigset_t mask
= *which
;
2723 if (!timespec_valid(ts
))
2725 timeout
= timespec_to_jiffies(ts
);
2727 * We can be close to the next tick, add another one
2728 * to ensure we will wait at least the time asked for.
2730 if (ts
->tv_sec
|| ts
->tv_nsec
)
2735 * Invert the set of allowed signals to get those we want to block.
2737 sigdelsetmask(&mask
, sigmask(SIGKILL
) | sigmask(SIGSTOP
));
2740 spin_lock_irq(&tsk
->sighand
->siglock
);
2741 sig
= dequeue_signal(tsk
, &mask
, info
);
2742 if (!sig
&& timeout
) {
2744 * None ready, temporarily unblock those we're interested
2745 * while we are sleeping in so that we'll be awakened when
2746 * they arrive. Unblocking is always fine, we can avoid
2747 * set_current_blocked().
2749 tsk
->real_blocked
= tsk
->blocked
;
2750 sigandsets(&tsk
->blocked
, &tsk
->blocked
, &mask
);
2751 recalc_sigpending();
2752 spin_unlock_irq(&tsk
->sighand
->siglock
);
2754 timeout
= schedule_timeout_interruptible(timeout
);
2756 spin_lock_irq(&tsk
->sighand
->siglock
);
2757 __set_task_blocked(tsk
, &tsk
->real_blocked
);
2758 siginitset(&tsk
->real_blocked
, 0);
2759 sig
= dequeue_signal(tsk
, &mask
, info
);
2761 spin_unlock_irq(&tsk
->sighand
->siglock
);
2765 return timeout
? -EINTR
: -EAGAIN
;
2769 * sys_rt_sigtimedwait - synchronously wait for queued signals specified
2771 * @uthese: queued signals to wait for
2772 * @uinfo: if non-null, the signal's siginfo is returned here
2773 * @uts: upper bound on process time suspension
2774 * @sigsetsize: size of sigset_t type
2776 SYSCALL_DEFINE4(rt_sigtimedwait
, const sigset_t __user
*, uthese
,
2777 siginfo_t __user
*, uinfo
, const struct timespec __user
*, uts
,
2785 /* XXX: Don't preclude handling different sized sigset_t's. */
2786 if (sigsetsize
!= sizeof(sigset_t
))
2789 if (copy_from_user(&these
, uthese
, sizeof(these
)))
2793 if (copy_from_user(&ts
, uts
, sizeof(ts
)))
2797 ret
= do_sigtimedwait(&these
, &info
, uts
? &ts
: NULL
);
2799 if (ret
> 0 && uinfo
) {
2800 if (copy_siginfo_to_user(uinfo
, &info
))
2808 * sys_kill - send a signal to a process
2809 * @pid: the PID of the process
2810 * @sig: signal to be sent
2812 SYSCALL_DEFINE2(kill
, pid_t
, pid
, int, sig
)
2814 struct siginfo info
;
2816 info
.si_signo
= sig
;
2818 info
.si_code
= SI_USER
;
2819 info
.si_pid
= task_tgid_vnr(current
);
2820 info
.si_uid
= current_uid();
2822 return kill_something_info(sig
, &info
, pid
);
2826 do_send_specific(pid_t tgid
, pid_t pid
, int sig
, struct siginfo
*info
)
2828 struct task_struct
*p
;
2832 p
= find_task_by_vpid(pid
);
2833 if (p
&& (tgid
<= 0 || task_tgid_vnr(p
) == tgid
)) {
2834 error
= check_kill_permission(sig
, info
, p
);
2836 * The null signal is a permissions and process existence
2837 * probe. No signal is actually delivered.
2839 if (!error
&& sig
) {
2840 error
= do_send_sig_info(sig
, info
, p
, false);
2842 * If lock_task_sighand() failed we pretend the task
2843 * dies after receiving the signal. The window is tiny,
2844 * and the signal is private anyway.
2846 if (unlikely(error
== -ESRCH
))
2855 static int do_tkill(pid_t tgid
, pid_t pid
, int sig
)
2857 struct siginfo info
;
2859 info
.si_signo
= sig
;
2861 info
.si_code
= SI_TKILL
;
2862 info
.si_pid
= task_tgid_vnr(current
);
2863 info
.si_uid
= current_uid();
2865 return do_send_specific(tgid
, pid
, sig
, &info
);
2869 * sys_tgkill - send signal to one specific thread
2870 * @tgid: the thread group ID of the thread
2871 * @pid: the PID of the thread
2872 * @sig: signal to be sent
2874 * This syscall also checks the @tgid and returns -ESRCH even if the PID
2875 * exists but it's not belonging to the target process anymore. This
2876 * method solves the problem of threads exiting and PIDs getting reused.
2878 SYSCALL_DEFINE3(tgkill
, pid_t
, tgid
, pid_t
, pid
, int, sig
)
2880 /* This is only valid for single tasks */
2881 if (pid
<= 0 || tgid
<= 0)
2884 return do_tkill(tgid
, pid
, sig
);
2888 * sys_tkill - send signal to one specific task
2889 * @pid: the PID of the task
2890 * @sig: signal to be sent
2892 * Send a signal to only one task, even if it's a CLONE_THREAD task.
2894 SYSCALL_DEFINE2(tkill
, pid_t
, pid
, int, sig
)
2896 /* This is only valid for single tasks */
2900 return do_tkill(0, pid
, sig
);
2904 * sys_rt_sigqueueinfo - send signal information to a signal
2905 * @pid: the PID of the thread
2906 * @sig: signal to be sent
2907 * @uinfo: signal info to be sent
2909 SYSCALL_DEFINE3(rt_sigqueueinfo
, pid_t
, pid
, int, sig
,
2910 siginfo_t __user
*, uinfo
)
2914 if (copy_from_user(&info
, uinfo
, sizeof(siginfo_t
)))
2917 /* Not even root can pretend to send signals from the kernel.
2918 * Nor can they impersonate a kill()/tgkill(), which adds source info.
2920 if (info
.si_code
>= 0 || info
.si_code
== SI_TKILL
) {
2921 /* We used to allow any < 0 si_code */
2922 WARN_ON_ONCE(info
.si_code
< 0);
2925 info
.si_signo
= sig
;
2927 /* POSIX.1b doesn't mention process groups. */
2928 return kill_proc_info(sig
, &info
, pid
);
2931 long do_rt_tgsigqueueinfo(pid_t tgid
, pid_t pid
, int sig
, siginfo_t
*info
)
2933 /* This is only valid for single tasks */
2934 if (pid
<= 0 || tgid
<= 0)
2937 /* Not even root can pretend to send signals from the kernel.
2938 * Nor can they impersonate a kill()/tgkill(), which adds source info.
2940 if (info
->si_code
>= 0 || info
->si_code
== SI_TKILL
) {
2941 /* We used to allow any < 0 si_code */
2942 WARN_ON_ONCE(info
->si_code
< 0);
2945 info
->si_signo
= sig
;
2947 return do_send_specific(tgid
, pid
, sig
, info
);
2950 SYSCALL_DEFINE4(rt_tgsigqueueinfo
, pid_t
, tgid
, pid_t
, pid
, int, sig
,
2951 siginfo_t __user
*, uinfo
)
2955 if (copy_from_user(&info
, uinfo
, sizeof(siginfo_t
)))
2958 return do_rt_tgsigqueueinfo(tgid
, pid
, sig
, &info
);
2961 int do_sigaction(int sig
, struct k_sigaction
*act
, struct k_sigaction
*oact
)
2963 struct task_struct
*t
= current
;
2964 struct k_sigaction
*k
;
2967 if (!valid_signal(sig
) || sig
< 1 || (act
&& sig_kernel_only(sig
)))
2970 k
= &t
->sighand
->action
[sig
-1];
2972 spin_lock_irq(¤t
->sighand
->siglock
);
2977 sigdelsetmask(&act
->sa
.sa_mask
,
2978 sigmask(SIGKILL
) | sigmask(SIGSTOP
));
2982 * "Setting a signal action to SIG_IGN for a signal that is
2983 * pending shall cause the pending signal to be discarded,
2984 * whether or not it is blocked."
2986 * "Setting a signal action to SIG_DFL for a signal that is
2987 * pending and whose default action is to ignore the signal
2988 * (for example, SIGCHLD), shall cause the pending signal to
2989 * be discarded, whether or not it is blocked"
2991 if (sig_handler_ignored(sig_handler(t
, sig
), sig
)) {
2993 sigaddset(&mask
, sig
);
2994 rm_from_queue_full(&mask
, &t
->signal
->shared_pending
);
2996 rm_from_queue_full(&mask
, &t
->pending
);
2998 } while (t
!= current
);
3002 spin_unlock_irq(¤t
->sighand
->siglock
);
3007 do_sigaltstack (const stack_t __user
*uss
, stack_t __user
*uoss
, unsigned long sp
)
3012 oss
.ss_sp
= (void __user
*) current
->sas_ss_sp
;
3013 oss
.ss_size
= current
->sas_ss_size
;
3014 oss
.ss_flags
= sas_ss_flags(sp
);
3022 if (!access_ok(VERIFY_READ
, uss
, sizeof(*uss
)))
3024 error
= __get_user(ss_sp
, &uss
->ss_sp
) |
3025 __get_user(ss_flags
, &uss
->ss_flags
) |
3026 __get_user(ss_size
, &uss
->ss_size
);
3031 if (on_sig_stack(sp
))
3036 * Note - this code used to test ss_flags incorrectly:
3037 * old code may have been written using ss_flags==0
3038 * to mean ss_flags==SS_ONSTACK (as this was the only
3039 * way that worked) - this fix preserves that older
3042 if (ss_flags
!= SS_DISABLE
&& ss_flags
!= SS_ONSTACK
&& ss_flags
!= 0)
3045 if (ss_flags
== SS_DISABLE
) {
3050 if (ss_size
< MINSIGSTKSZ
)
3054 current
->sas_ss_sp
= (unsigned long) ss_sp
;
3055 current
->sas_ss_size
= ss_size
;
3061 if (!access_ok(VERIFY_WRITE
, uoss
, sizeof(*uoss
)))
3063 error
= __put_user(oss
.ss_sp
, &uoss
->ss_sp
) |
3064 __put_user(oss
.ss_size
, &uoss
->ss_size
) |
3065 __put_user(oss
.ss_flags
, &uoss
->ss_flags
);
#ifdef __ARCH_WANT_SYS_SIGPENDING

/**
 *  sys_sigpending - examine pending signals
 *  @set: where mask of pending signal is returned
 *
 *  Legacy variant: only sizeof(old_sigset_t) bytes of the pending set are
 *  copied out by do_sigpending().
 */
SYSCALL_DEFINE1(sigpending, old_sigset_t __user *, set)
{
	return do_sigpending(set, sizeof(*set));
}

#endif
3085 #ifdef __ARCH_WANT_SYS_SIGPROCMASK
3087 * sys_sigprocmask - examine and change blocked signals
3088 * @how: whether to add, remove, or set signals
3089 * @nset: signals to add or remove (if non-null)
3090 * @oset: previous value of signal mask if non-null
3092 * Some platforms have their own version with special arguments;
3093 * others support only sys_rt_sigprocmask.
3096 SYSCALL_DEFINE3(sigprocmask
, int, how
, old_sigset_t __user
*, nset
,
3097 old_sigset_t __user
*, oset
)
3099 old_sigset_t old_set
, new_set
;
3100 sigset_t new_blocked
;
3102 old_set
= current
->blocked
.sig
[0];
3105 if (copy_from_user(&new_set
, nset
, sizeof(*nset
)))
3107 new_set
&= ~(sigmask(SIGKILL
) | sigmask(SIGSTOP
));
3109 new_blocked
= current
->blocked
;
3113 sigaddsetmask(&new_blocked
, new_set
);
3116 sigdelsetmask(&new_blocked
, new_set
);
3119 new_blocked
.sig
[0] = new_set
;
3125 set_current_blocked(&new_blocked
);
3129 if (copy_to_user(oset
, &old_set
, sizeof(*oset
)))
3135 #endif /* __ARCH_WANT_SYS_SIGPROCMASK */
3137 #ifdef __ARCH_WANT_SYS_RT_SIGACTION
3139 * sys_rt_sigaction - alter an action taken by a process
3140 * @sig: signal to be sent
3141 * @act: new sigaction
3142 * @oact: used to save the previous sigaction
3143 * @sigsetsize: size of sigset_t type
3145 SYSCALL_DEFINE4(rt_sigaction
, int, sig
,
3146 const struct sigaction __user
*, act
,
3147 struct sigaction __user
*, oact
,
3150 struct k_sigaction new_sa
, old_sa
;
3153 /* XXX: Don't preclude handling different sized sigset_t's. */
3154 if (sigsetsize
!= sizeof(sigset_t
))
3158 if (copy_from_user(&new_sa
.sa
, act
, sizeof(new_sa
.sa
)))
3162 ret
= do_sigaction(sig
, act
? &new_sa
: NULL
, oact
? &old_sa
: NULL
);
3165 if (copy_to_user(oact
, &old_sa
.sa
, sizeof(old_sa
.sa
)))
3171 #endif /* __ARCH_WANT_SYS_RT_SIGACTION */
3173 #ifdef __ARCH_WANT_SYS_SGETMASK
3176 * For backwards compatibility. Functionality superseded by sigprocmask.
3178 SYSCALL_DEFINE0(sgetmask
)
3181 return current
->blocked
.sig
[0];
3184 SYSCALL_DEFINE1(ssetmask
, int, newmask
)
3186 int old
= current
->blocked
.sig
[0];
3189 siginitset(&newset
, newmask
& ~(sigmask(SIGKILL
) | sigmask(SIGSTOP
)));
3190 set_current_blocked(&newset
);
3194 #endif /* __ARCH_WANT_SGETMASK */
3196 #ifdef __ARCH_WANT_SYS_SIGNAL
3198 * For backwards compatibility. Functionality superseded by sigaction.
3200 SYSCALL_DEFINE2(signal
, int, sig
, __sighandler_t
, handler
)
3202 struct k_sigaction new_sa
, old_sa
;
3205 new_sa
.sa
.sa_handler
= handler
;
3206 new_sa
.sa
.sa_flags
= SA_ONESHOT
| SA_NOMASK
;
3207 sigemptyset(&new_sa
.sa
.sa_mask
);
3209 ret
= do_sigaction(sig
, &new_sa
, &old_sa
);
3211 return ret
? ret
: (unsigned long)old_sa
.sa
.sa_handler
;
3213 #endif /* __ARCH_WANT_SYS_SIGNAL */
#ifdef __ARCH_WANT_SYS_PAUSE

/*
 * sys_pause - sleep until a signal is pending for the caller
 *
 * Sleeps interruptibly, re-checking after every wakeup, and always
 * returns -ERESTARTNOHAND.
 */
SYSCALL_DEFINE0(pause)
{
	while (!signal_pending(current)) {
		current->state = TASK_INTERRUPTIBLE;
		schedule();
	}
	return -ERESTARTNOHAND;
}

#endif
3228 #ifdef __ARCH_WANT_SYS_RT_SIGSUSPEND
3230 * sys_rt_sigsuspend - replace the signal mask for a value with the
3231 * @unewset value until a signal is received
3232 * @unewset: new signal mask value
3233 * @sigsetsize: size of sigset_t type
3235 SYSCALL_DEFINE2(rt_sigsuspend
, sigset_t __user
*, unewset
, size_t, sigsetsize
)
3239 /* XXX: Don't preclude handling different sized sigset_t's. */
3240 if (sigsetsize
!= sizeof(sigset_t
))
3243 if (copy_from_user(&newset
, unewset
, sizeof(newset
)))
3245 sigdelsetmask(&newset
, sigmask(SIGKILL
)|sigmask(SIGSTOP
));
3247 current
->saved_sigmask
= current
->blocked
;
3248 set_current_blocked(&newset
);
3250 current
->state
= TASK_INTERRUPTIBLE
;
3252 set_restore_sigmask();
3253 return -ERESTARTNOHAND
;
3255 #endif /* __ARCH_WANT_SYS_RT_SIGSUSPEND */
3257 __attribute__((weak
)) const char *arch_vma_name(struct vm_area_struct
*vma
)
3262 void __init
signals_init(void)
3264 sigqueue_cachep
= KMEM_CACHE(sigqueue
, SLAB_PANIC
);
3267 #ifdef CONFIG_KGDB_KDB
3268 #include <linux/kdb.h>
3270 * kdb_send_sig_info - Allows kdb to send signals without exposing
3271 * signal internals. This function checks if the required locks are
3272 * available before calling the main signal code, to avoid kdb
3276 kdb_send_sig_info(struct task_struct
*t
, struct siginfo
*info
)
3278 static struct task_struct
*kdb_prev_t
;
3280 if (!spin_trylock(&t
->sighand
->siglock
)) {
3281 kdb_printf("Can't do kill command now.\n"
3282 "The sigmask lock is held somewhere else in "
3283 "kernel, try again later\n");
3286 spin_unlock(&t
->sighand
->siglock
);
3287 new_t
= kdb_prev_t
!= t
;
3289 if (t
->state
!= TASK_RUNNING
&& new_t
) {
3290 kdb_printf("Process is not RUNNING, sending a signal from "
3291 "kdb risks deadlock\n"
3292 "on the run queue locks. "
3293 "The signal has _not_ been sent.\n"
3294 "Reissue the kill command if you want to risk "
3298 sig
= info
->si_signo
;
3299 if (send_sig_info(sig
, info
, t
))
3300 kdb_printf("Fail to deliver Signal %d to process %d.\n",
3303 kdb_printf("Signal %d is sent to process %d.\n", sig
, t
->pid
);
3305 #endif /* CONFIG_KGDB_KDB */