SAFE public projects git trees. - safe/jmp/linux-2.6/blob - kernel/signal.c

   1 /*
   2  *  linux/kernel/signal.c
   3  *
   4  *  Copyright (C) 1991, 1992  Linus Torvalds
   5  *
   6  *  1997-11-02  Modified for POSIX.1b signals by Richard Henderson
   7  *
   8  *  2003-06-02  Jim Houston - Concurrent Computer Corp.
   9  *              Changes to use preallocated sigqueue structures
  10  *              to allow signals to be sent reliably.
  11  */
  12
  13 #include <linux/slab.h>
  14 #include <linux/module.h>
  15 #include <linux/init.h>
  16 #include <linux/sched.h>
  17 #include <linux/fs.h>
  18 #include <linux/tty.h>
  19 #include <linux/binfmts.h>
  20 #include <linux/security.h>
  21 #include <linux/syscalls.h>
  22 #include <linux/ptrace.h>
  23 #include <linux/signal.h>
  24 #include <linux/signalfd.h>
  25 #include <linux/capability.h>
  26 #include <linux/freezer.h>
  27 #include <linux/pid_namespace.h>
  28 #include <linux/nsproxy.h>
  29
  30 #include <asm/param.h>
  31 #include <asm/uaccess.h>
  32 #include <asm/unistd.h>
  33 #include <asm/siginfo.h>
  34 #include "audit.h"      /* audit_signal_info() */
  35
  36 /*
  37  * SLAB caches for signal bits.
  38  */
  39
  40 static struct kmem_cache *sigqueue_cachep;
  41
  42 static int __sig_ignored(struct task_struct *t, int sig)
  43 {
  44         void __user *handler;
  45
  46         /* Is it explicitly or implicitly ignored? */
  47
  48         handler = t->sighand->action[sig - 1].sa.sa_handler;
  49         return handler == SIG_IGN ||
  50                 (handler == SIG_DFL && sig_kernel_ignore(sig));
  51 }
  52
  53 static int sig_ignored(struct task_struct *t, int sig)
  54 {
  55         /*
  56          * Tracers always want to know about signals..
  57          */
  58         if (t->ptrace & PT_PTRACED)
  59                 return 0;
  60
  61         /*
  62          * Blocked signals are never ignored, since the
  63          * signal handler may change by the time it is
  64          * unblocked.
  65          */
  66         if (sigismember(&t->blocked, sig) || sigismember(&t->real_blocked, sig))
  67                 return 0;
  68
  69         return __sig_ignored(t, sig);
  70 }
  71
  72 /*
  73  * Re-calculate pending state from the set of locally pending
  74  * signals, globally pending signals, and blocked signals.
  75  */
  76 static inline int has_pending_signals(sigset_t *signal, sigset_t *blocked)
  77 {
  78         unsigned long ready;
  79         long i;
  80
  81         switch (_NSIG_WORDS) {
  82         default:
  83                 for (i = _NSIG_WORDS, ready = 0; --i >= 0 ;)
  84                         ready |= signal->sig[i] &~ blocked->sig[i];
  85                 break;
  86
  87         case 4: ready  = signal->sig[3] &~ blocked->sig[3];
  88                 ready |= signal->sig[2] &~ blocked->sig[2];
  89                 ready |= signal->sig[1] &~ blocked->sig[1];
  90                 ready |= signal->sig[0] &~ blocked->sig[0];
  91                 break;
  92
  93         case 2: ready  = signal->sig[1] &~ blocked->sig[1];
  94                 ready |= signal->sig[0] &~ blocked->sig[0];
  95                 break;
  96
  97         case 1: ready  = signal->sig[0] &~ blocked->sig[0];
  98         }
  99         return ready != 0;
 100 }
 101
 102 #define PENDING(p,b) has_pending_signals(&(p)->signal, (b))
 103
 104 static int recalc_sigpending_tsk(struct task_struct *t)
 105 {
 106         if (t->signal->group_stop_count > 0 ||
 107             PENDING(&t->pending, &t->blocked) ||
 108             PENDING(&t->signal->shared_pending, &t->blocked)) {
 109                 set_tsk_thread_flag(t, TIF_SIGPENDING);
 110                 return 1;
 111         }
 112         /*
 113          * We must never clear the flag in another thread, or in current
 114          * when it's possible the current syscall is returning -ERESTART*.
 115          * So we don't clear it here, and only callers who know they should do.
 116          */
 117         return 0;
 118 }
 119
 120 /*
 121  * After recalculating TIF_SIGPENDING, we need to make sure the task wakes up.
 122  * This is superfluous when called on current, the wakeup is a harmless no-op.
 123  */
 124 void recalc_sigpending_and_wake(struct task_struct *t)
 125 {
 126         if (recalc_sigpending_tsk(t))
 127                 signal_wake_up(t, 0);
 128 }
 129
 130 void recalc_sigpending(void)
 131 {
 132         if (!recalc_sigpending_tsk(current) && !freezing(current))
 133                 clear_thread_flag(TIF_SIGPENDING);
 134
 135 }
 136
 137 /* Given the mask, find the first available signal that should be serviced. */
 138
 139 int next_signal(struct sigpending *pending, sigset_t *mask)
 140 {
 141         unsigned long i, *s, *m, x;
 142         int sig = 0;
 143
 144         s = pending->signal.sig;
 145         m = mask->sig;
 146         switch (_NSIG_WORDS) {
 147         default:
 148                 for (i = 0; i < _NSIG_WORDS; ++i, ++s, ++m)
 149                         if ((x = *s &~ *m) != 0) {
 150                                 sig = ffz(~x) + i*_NSIG_BPW + 1;
 151                                 break;
 152                         }
 153                 break;
 154
 155         case 2: if ((x = s[0] &~ m[0]) != 0)
 156                         sig = 1;
 157                 else if ((x = s[1] &~ m[1]) != 0)
 158                         sig = _NSIG_BPW + 1;
 159                 else
 160                         break;
 161                 sig += ffz(~x);
 162                 break;
 163
 164         case 1: if ((x = *s &~ *m) != 0)
 165                         sig = ffz(~x) + 1;
 166                 break;
 167         }
 168
 169         return sig;
 170 }
 171
 172 static struct sigqueue *__sigqueue_alloc(struct task_struct *t, gfp_t flags,
 173                                          int override_rlimit)
 174 {
 175         struct sigqueue *q = NULL;
 176         struct user_struct *user;
 177
 178         /*
 179          * In order to avoid problems with "switch_user()", we want to make
 180          * sure that the compiler doesn't re-load "t->user"
 181          */
 182         user = t->user;
 183         barrier();
 184         atomic_inc(&user->sigpending);
 185         if (override_rlimit ||
 186             atomic_read(&user->sigpending) <=
 187                         t->signal->rlim[RLIMIT_SIGPENDING].rlim_cur)
 188                 q = kmem_cache_alloc(sigqueue_cachep, flags);
 189         if (unlikely(q == NULL)) {
 190                 atomic_dec(&user->sigpending);
 191         } else {
 192                 INIT_LIST_HEAD(&q->list);
 193                 q->flags = 0;
 194                 q->user = get_uid(user);
 195         }
 196         return(q);
 197 }
 198
 199 static void __sigqueue_free(struct sigqueue *q)
 200 {
 201         if (q->flags & SIGQUEUE_PREALLOC)
 202                 return;
 203         atomic_dec(&q->user->sigpending);
 204         free_uid(q->user);
 205         kmem_cache_free(sigqueue_cachep, q);
 206 }
 207
 208 void flush_sigqueue(struct sigpending *queue)
 209 {
 210         struct sigqueue *q;
 211
 212         sigemptyset(&queue->signal);
 213         while (!list_empty(&queue->list)) {
 214                 q = list_entry(queue->list.next, struct sigqueue , list);
 215                 list_del_init(&q->list);
 216                 __sigqueue_free(q);
 217         }
 218 }
 219
 220 /*
 221  * Flush all pending signals for a task.
 222  */
 223 void flush_signals(struct task_struct *t)
 224 {
 225         unsigned long flags;
 226
 227         spin_lock_irqsave(&t->sighand->siglock, flags);
 228         clear_tsk_thread_flag(t, TIF_SIGPENDING);
 229         flush_sigqueue(&t->pending);
 230         flush_sigqueue(&t->signal->shared_pending);
 231         spin_unlock_irqrestore(&t->sighand->siglock, flags);
 232 }
 233
 234 void ignore_signals(struct task_struct *t)
 235 {
 236         int i;
 237
 238         for (i = 0; i < _NSIG; ++i)
 239                 t->sighand->action[i].sa.sa_handler = SIG_IGN;
 240
 241         flush_signals(t);
 242 }
 243
 244 /*
 245  * Flush all handlers for a task.
 246  */
 247
 248 void
 249 flush_signal_handlers(struct task_struct *t, int force_default)
 250 {
 251         int i;
 252         struct k_sigaction *ka = &t->sighand->action[0];
 253         for (i = _NSIG ; i != 0 ; i--) {
 254                 if (force_default || ka->sa.sa_handler != SIG_IGN)
 255                         ka->sa.sa_handler = SIG_DFL;
 256                 ka->sa.sa_flags = 0;
 257                 sigemptyset(&ka->sa.sa_mask);
 258                 ka++;
 259         }
 260 }
 261
 262 int unhandled_signal(struct task_struct *tsk, int sig)
 263 {
 264         if (is_global_init(tsk))
 265                 return 1;
 266         if (tsk->ptrace & PT_PTRACED)
 267                 return 0;
 268         return (tsk->sighand->action[sig-1].sa.sa_handler == SIG_IGN) ||
 269                 (tsk->sighand->action[sig-1].sa.sa_handler == SIG_DFL);
 270 }
 271
 272
 273 /* Notify the system that a driver wants to block all signals for this
 274  * process, and wants to be notified if any signals at all were to be
 275  * sent/acted upon.  If the notifier routine returns non-zero, then the
 276  * signal will be acted upon after all.  If the notifier routine returns 0,
 277  * then then signal will be blocked.  Only one block per process is
 278  * allowed.  priv is a pointer to private data that the notifier routine
 279  * can use to determine if the signal should be blocked or not.  */
 280
 281 void
 282 block_all_signals(int (*notifier)(void *priv), void *priv, sigset_t *mask)
 283 {
 284         unsigned long flags;
 285
 286         spin_lock_irqsave(&current->sighand->siglock, flags);
 287         current->notifier_mask = mask;
 288         current->notifier_data = priv;
 289         current->notifier = notifier;
 290         spin_unlock_irqrestore(&current->sighand->siglock, flags);
 291 }
 292
 293 /* Notify the system that blocking has ended. */
 294
 295 void
 296 unblock_all_signals(void)
 297 {
 298         unsigned long flags;
 299
 300         spin_lock_irqsave(&current->sighand->siglock, flags);
 301         current->notifier = NULL;
 302         current->notifier_data = NULL;
 303         recalc_sigpending();
 304         spin_unlock_irqrestore(&current->sighand->siglock, flags);
 305 }
 306
 307 static int collect_signal(int sig, struct sigpending *list, siginfo_t *info)
 308 {
 309         struct sigqueue *q, *first = NULL;
 310         int still_pending = 0;
 311
 312         if (unlikely(!sigismember(&list->signal, sig)))
 313                 return 0;
 314
 315         /*
 316          * Collect the siginfo appropriate to this signal.  Check if
 317          * there is another siginfo for the same signal.
 318         */
 319         list_for_each_entry(q, &list->list, list) {
 320                 if (q->info.si_signo == sig) {
 321                         if (first) {
 322                                 still_pending = 1;
 323                                 break;
 324                         }
 325                         first = q;
 326                 }
 327         }
 328         if (first) {
 329                 list_del_init(&first->list);
 330                 copy_siginfo(info, &first->info);
 331                 __sigqueue_free(first);
 332                 if (!still_pending)
 333                         sigdelset(&list->signal, sig);
 334         } else {
 335
 336                 /* Ok, it wasn't in the queue.  This must be
 337                    a fast-pathed signal or we must have been
 338                    out of queue space.  So zero out the info.
 339                  */
 340                 sigdelset(&list->signal, sig);
 341                 info->si_signo = sig;
 342                 info->si_errno = 0;
 343                 info->si_code = 0;
 344                 info->si_pid = 0;
 345                 info->si_uid = 0;
 346         }
 347         return 1;
 348 }
 349
 350 static int __dequeue_signal(struct sigpending *pending, sigset_t *mask,
 351                         siginfo_t *info)
 352 {
 353         int sig = next_signal(pending, mask);
 354
 355         if (sig) {
 356                 if (current->notifier) {
 357                         if (sigismember(current->notifier_mask, sig)) {
 358                                 if (!(current->notifier)(current->notifier_data)) {
 359                                         clear_thread_flag(TIF_SIGPENDING);
 360                                         return 0;
 361                                 }
 362                         }
 363                 }
 364
 365                 if (!collect_signal(sig, pending, info))
 366                         sig = 0;
 367         }
 368
 369         return sig;
 370 }
 371
 372 /*
 373  * Dequeue a signal and return the element to the caller, which is
 374  * expected to free it.
 375  *
 376  * All callers have to hold the siglock.
 377  */
 378 int dequeue_signal(struct task_struct *tsk, sigset_t *mask, siginfo_t *info)
 379 {
 380         int signr;
 381
 382         /* We only dequeue private signals from ourselves, we don't let
 383          * signalfd steal them
 384          */
 385         signr = __dequeue_signal(&tsk->pending, mask, info);
 386         if (!signr) {
 387                 signr = __dequeue_signal(&tsk->signal->shared_pending,
 388                                          mask, info);
 389                 /*
 390                  * itimer signal ?
 391                  *
 392                  * itimers are process shared and we restart periodic
 393                  * itimers in the signal delivery path to prevent DoS
 394                  * attacks in the high resolution timer case. This is
 395                  * compliant with the old way of self restarting
 396                  * itimers, as the SIGALRM is a legacy signal and only
 397                  * queued once. Changing the restart behaviour to
 398                  * restart the timer in the signal dequeue path is
 399                  * reducing the timer noise on heavy loaded !highres
 400                  * systems too.
 401                  */
 402                 if (unlikely(signr == SIGALRM)) {
 403                         struct hrtimer *tmr = &tsk->signal->real_timer;
 404
 405                         if (!hrtimer_is_queued(tmr) &&
 406                             tsk->signal->it_real_incr.tv64 != 0) {
 407                                 hrtimer_forward(tmr, tmr->base->get_time(),
 408                                                 tsk->signal->it_real_incr);
 409                                 hrtimer_restart(tmr);
 410                         }
 411                 }
 412         }
 413
 414         recalc_sigpending();
 415         if (!signr)
 416                 return 0;
 417
 418         if (unlikely(sig_kernel_stop(signr))) {
 419                 /*
 420                  * Set a marker that we have dequeued a stop signal.  Our
 421                  * caller might release the siglock and then the pending
 422                  * stop signal it is about to process is no longer in the
 423                  * pending bitmasks, but must still be cleared by a SIGCONT
 424                  * (and overruled by a SIGKILL).  So those cases clear this
 425                  * shared flag after we've set it.  Note that this flag may
 426                  * remain set after the signal we return is ignored or
 427                  * handled.  That doesn't matter because its only purpose
 428                  * is to alert stop-signal processing code when another
 429                  * processor has come along and cleared the flag.
 430                  */
 431                 if (!(tsk->signal->flags & SIGNAL_GROUP_EXIT))
 432                         tsk->signal->flags |= SIGNAL_STOP_DEQUEUED;
 433         }
 434         if ((info->si_code & __SI_MASK) == __SI_TIMER && info->si_sys_private) {
 435                 /*
 436                  * Release the siglock to ensure proper locking order
 437                  * of timer locks outside of siglocks.  Note, we leave
 438                  * irqs disabled here, since the posix-timers code is
 439                  * about to disable them again anyway.
 440                  */
 441                 spin_unlock(&tsk->sighand->siglock);
 442                 do_schedule_next_timer(info);
 443                 spin_lock(&tsk->sighand->siglock);
 444         }
 445         return signr;
 446 }
 447
 448 /*
 449  * Tell a process that it has a new active signal..
 450  *
 451  * NOTE! we rely on the previous spin_lock to
 452  * lock interrupts for us! We can only be called with
 453  * "siglock" held, and the local interrupt must
 454  * have been disabled when that got acquired!
 455  *
 456  * No need to set need_resched since signal event passing
 457  * goes through ->blocked
 458  */
 459 void signal_wake_up(struct task_struct *t, int resume)
 460 {
 461         unsigned int mask;
 462
 463         set_tsk_thread_flag(t, TIF_SIGPENDING);
 464
 465         /*
 466          * For SIGKILL, we want to wake it up in the stopped/traced/killable
 467          * case. We don't check t->state here because there is a race with it
 468          * executing another processor and just now entering stopped state.
 469          * By using wake_up_state, we ensure the process will wake up and
 470          * handle its death signal.
 471          */
 472         mask = TASK_INTERRUPTIBLE;
 473         if (resume)
 474                 mask |= TASK_WAKEKILL;
 475         if (!wake_up_state(t, mask))
 476                 kick_process(t);
 477 }
 478
 479 /*
 480  * Remove signals in mask from the pending set and queue.
 481  * Returns 1 if any signals were found.
 482  *
 483  * All callers must be holding the siglock.
 484  *
 485  * This version takes a sigset mask and looks at all signals,
 486  * not just those in the first mask word.
 487  */
 488 static int rm_from_queue_full(sigset_t *mask, struct sigpending *s)
 489 {
 490         struct sigqueue *q, *n;
 491         sigset_t m;
 492
 493         sigandsets(&m, mask, &s->signal);
 494         if (sigisemptyset(&m))
 495                 return 0;
 496
 497         signandsets(&s->signal, &s->signal, mask);
 498         list_for_each_entry_safe(q, n, &s->list, list) {
 499                 if (sigismember(mask, q->info.si_signo)) {
 500                         list_del_init(&q->list);
 501                         __sigqueue_free(q);
 502                 }
 503         }
 504         return 1;
 505 }
 506 /*
 507  * Remove signals in mask from the pending set and queue.
 508  * Returns 1 if any signals were found.
 509  *
 510  * All callers must be holding the siglock.
 511  */
 512 static int rm_from_queue(unsigned long mask, struct sigpending *s)
 513 {
 514         struct sigqueue *q, *n;
 515
 516         if (!sigtestsetmask(&s->signal, mask))
 517                 return 0;
 518
 519         sigdelsetmask(&s->signal, mask);
 520         list_for_each_entry_safe(q, n, &s->list, list) {
 521                 if (q->info.si_signo < SIGRTMIN &&
 522                     (mask & sigmask(q->info.si_signo))) {
 523                         list_del_init(&q->list);
 524                         __sigqueue_free(q);
 525                 }
 526         }
 527         return 1;
 528 }
 529
 530 /*
 531  * Bad permissions for sending the signal
 532  */
 533 static int check_kill_permission(int sig, struct siginfo *info,
 534                                  struct task_struct *t)
 535 {
 536         int error;
 537
 538         if (!valid_signal(sig))
 539                 return -EINVAL;
 540
 541         if (info != SEND_SIG_NOINFO && (is_si_special(info) || SI_FROMKERNEL(info)))
 542                 return 0;
 543
 544         error = audit_signal_info(sig, t); /* Let audit system see the signal */
 545         if (error)
 546                 return error;
 547
 548         if (((sig != SIGCONT) || (task_session_nr(current) != task_session_nr(t)))
 549             && (current->euid ^ t->suid) && (current->euid ^ t->uid)
 550             && (current->uid ^ t->suid) && (current->uid ^ t->uid)
 551             && !capable(CAP_KILL))
 552                 return -EPERM;
 553
 554         return security_task_kill(t, info, sig, 0);
 555 }
 556
 557 /* forward decl */
 558 static void do_notify_parent_cldstop(struct task_struct *tsk, int why);
 559
 560 /*
 561  * Handle magic process-wide effects of stop/continue signals.
 562  * Unlike the signal actions, these happen immediately at signal-generation
 563  * time regardless of blocking, ignoring, or handling.  This does the
 564  * actual continuing for SIGCONT, but not the actual stopping for stop
 565  * signals.  The process stop is done as a signal action for SIG_DFL.
 566  */
 567 static void handle_stop_signal(int sig, struct task_struct *p)
 568 {
 569         struct task_struct *t;
 570
 571         if (p->signal->flags & SIGNAL_GROUP_EXIT)
 572                 /*
 573                  * The process is in the middle of dying already.
 574                  */
 575                 return;
 576
 577         if (sig_kernel_stop(sig)) {
 578                 /*
 579                  * This is a stop signal.  Remove SIGCONT from all queues.
 580                  */
 581                 rm_from_queue(sigmask(SIGCONT), &p->signal->shared_pending);
 582                 t = p;
 583                 do {
 584                         rm_from_queue(sigmask(SIGCONT), &t->pending);
 585                         t = next_thread(t);
 586                 } while (t != p);
 587         } else if (sig == SIGCONT) {
 588                 /*
 589                  * Remove all stop signals from all queues,
 590                  * and wake all threads.
 591                  */
 592                 if (unlikely(p->signal->group_stop_count > 0)) {
 593                         /*
 594                          * There was a group stop in progress.  We'll
 595                          * pretend it finished before we got here.  We are
 596                          * obliged to report it to the parent: if the
 597                          * SIGSTOP happened "after" this SIGCONT, then it
 598                          * would have cleared this pending SIGCONT.  If it
 599                          * happened "before" this SIGCONT, then the parent
 600                          * got the SIGCHLD about the stop finishing before
 601                          * the continue happened.  We do the notification
 602                          * now, and it's as if the stop had finished and
 603                          * the SIGCHLD was pending on entry to this kill.
 604                          */
 605                         p->signal->group_stop_count = 0;
 606                         p->signal->flags = SIGNAL_STOP_CONTINUED |
 607                                                 SIGNAL_CLD_STOPPED;
 608                 }
 609                 rm_from_queue(SIG_KERNEL_STOP_MASK, &p->signal->shared_pending);
 610                 t = p;
 611                 do {
 612                         unsigned int state;
 613                         rm_from_queue(SIG_KERNEL_STOP_MASK, &t->pending);
 614
 615                         /*
 616                          * If there is a handler for SIGCONT, we must make
 617                          * sure that no thread returns to user mode before
 618                          * we post the signal, in case it was the only
 619                          * thread eligible to run the signal handler--then
 620                          * it must not do anything between resuming and
 621                          * running the handler.  With the TIF_SIGPENDING
 622                          * flag set, the thread will pause and acquire the
 623                          * siglock that we hold now and until we've queued
 624                          * the pending signal.
 625                          *
 626                          * Wake up the stopped thread _after_ setting
 627                          * TIF_SIGPENDING
 628                          */
 629                         state = __TASK_STOPPED;
 630                         if (sig_user_defined(t, SIGCONT) && !sigismember(&t->blocked, SIGCONT)) {
 631                                 set_tsk_thread_flag(t, TIF_SIGPENDING);
 632                                 state |= TASK_INTERRUPTIBLE;
 633                         }
 634                         wake_up_state(t, state);
 635
 636                         t = next_thread(t);
 637                 } while (t != p);
 638
 639                 if (p->signal->flags & SIGNAL_STOP_STOPPED) {
 640                         /*
 641                          * We were in fact stopped, and are now continued.
 642                          * Notify the parent with CLD_CONTINUED.
 643                          */
 644                         p->signal->flags = SIGNAL_STOP_CONTINUED |
 645                                                 SIGNAL_CLD_CONTINUED;
 646                         p->signal->group_exit_code = 0;
 647                 } else {
 648                         /*
 649                          * We are not stopped, but there could be a stop
 650                          * signal in the middle of being processed after
 651                          * being removed from the queue.  Clear that too.
 652                          */
 653                         p->signal->flags &= ~SIGNAL_STOP_DEQUEUED;
 654                 }
 655         } else if (sig == SIGKILL) {
 656                 /*
 657                  * Make sure that any pending stop signal already dequeued
 658                  * is undone by the wakeup for SIGKILL.
 659                  */
 660                 p->signal->flags &= ~SIGNAL_STOP_DEQUEUED;
 661         }
 662 }
 663
 664 static inline int legacy_queue(struct sigpending *signals, int sig)
 665 {
 666         return (sig < SIGRTMIN) && sigismember(&signals->signal, sig);
 667 }
 668
 669 static int send_signal(int sig, struct siginfo *info, struct task_struct *t,
 670                         struct sigpending *signals)
 671 {
 672         struct sigqueue * q = NULL;
 673
 674         /*
 675          * Short-circuit ignored signals and support queuing
 676          * exactly one non-rt signal, so that we can get more
 677          * detailed information about the cause of the signal.
 678          */
 679         if (sig_ignored(t, sig) || legacy_queue(signals, sig))
 680                 return 0;
 681
 682         /*
 683          * Deliver the signal to listening signalfds. This must be called
 684          * with the sighand lock held.
 685          */
 686         signalfd_notify(t, sig);
 687
 688         /*
 689          * fast-pathed signals for kernel-internal things like SIGSTOP
 690          * or SIGKILL.
 691          */
 692         if (info == SEND_SIG_FORCED)
 693                 goto out_set;
 694
 695         /* Real-time signals must be queued if sent by sigqueue, or
 696            some other real-time mechanism.  It is implementation
 697            defined whether kill() does so.  We attempt to do so, on
 698            the principle of least surprise, but since kill is not
 699            allowed to fail with EAGAIN when low on memory we just
 700            make sure at least one signal gets delivered and don't
 701            pass on the info struct.  */
 702
 703         q = __sigqueue_alloc(t, GFP_ATOMIC, (sig < SIGRTMIN &&
 704                                              (is_si_special(info) ||
 705                                               info->si_code >= 0)));
 706         if (q) {
 707                 list_add_tail(&q->list, &signals->list);
 708                 switch ((unsigned long) info) {
 709                 case (unsigned long) SEND_SIG_NOINFO:
 710                         q->info.si_signo = sig;
 711                         q->info.si_errno = 0;
 712                         q->info.si_code = SI_USER;
 713                         q->info.si_pid = task_pid_vnr(current);
 714                         q->info.si_uid = current->uid;
 715                         break;
 716                 case (unsigned long) SEND_SIG_PRIV:
 717                         q->info.si_signo = sig;
 718                         q->info.si_errno = 0;
 719                         q->info.si_code = SI_KERNEL;
 720                         q->info.si_pid = 0;
 721                         q->info.si_uid = 0;
 722                         break;
 723                 default:
 724                         copy_siginfo(&q->info, info);
 725                         break;
 726                 }
 727         } else if (!is_si_special(info)) {
 728                 if (sig >= SIGRTMIN && info->si_code != SI_USER)
 729                 /*
 730                  * Queue overflow, abort.  We may abort if the signal was rt
 731                  * and sent by user using something other than kill().
 732                  */
 733                         return -EAGAIN;
 734         }
 735
 736 out_set:
 737         sigaddset(&signals->signal, sig);
 738         return 1;
 739 }
 740
 741 int print_fatal_signals;
 742
 743 static void print_fatal_signal(struct pt_regs *regs, int signr)
 744 {
 745         printk("%s/%d: potentially unexpected fatal signal %d.\n",
 746                 current->comm, task_pid_nr(current), signr);
 747
 748 #if defined(__i386__) && !defined(__arch_um__)
 749         printk("code at %08lx: ", regs->ip);
 750         {
 751                 int i;
 752                 for (i = 0; i < 16; i++) {
 753                         unsigned char insn;
 754
 755                         __get_user(insn, (unsigned char *)(regs->ip + i));
 756                         printk("%02x ", insn);
 757                 }
 758         }
 759 #endif
 760         printk("\n");
 761         show_regs(regs);
 762 }
 763
 764 static int __init setup_print_fatal_signals(char *str)
 765 {
 766         get_option (&str, &print_fatal_signals);
 767
 768         return 1;
 769 }
 770
 771 __setup("print-fatal-signals=", setup_print_fatal_signals);
 772
 773 static int
 774 specific_send_sig_info(int sig, struct siginfo *info, struct task_struct *t)
 775 {
 776         int ret;
 777
 778         BUG_ON(!irqs_disabled());
 779         assert_spin_locked(&t->sighand->siglock);
 780
 781         ret = send_signal(sig, info, t, &t->pending);
 782         if (ret <= 0)
 783                 return ret;
 784
 785         if (!sigismember(&t->blocked, sig))
 786                 signal_wake_up(t, sig == SIGKILL);
 787         return 0;
 788 }
 789
 790 /*
 791  * Force a signal that the process can't ignore: if necessary
 792  * we unblock the signal and change any SIG_IGN to SIG_DFL.
 793  *
 794  * Note: If we unblock the signal, we always reset it to SIG_DFL,
 795  * since we do not want to have a signal handler that was blocked
 796  * be invoked when user space had explicitly blocked it.
 797  *
 798  * We don't want to have recursive SIGSEGV's etc, for example.
 799  */
 800 int
 801 force_sig_info(int sig, struct siginfo *info, struct task_struct *t)
 802 {
 803         unsigned long int flags;
 804         int ret, blocked, ignored;
 805         struct k_sigaction *action;
 806
 807         spin_lock_irqsave(&t->sighand->siglock, flags);
 808         action = &t->sighand->action[sig-1];
 809         ignored = action->sa.sa_handler == SIG_IGN;
 810         blocked = sigismember(&t->blocked, sig);
 811         if (blocked || ignored) {
 812                 action->sa.sa_handler = SIG_DFL;
 813                 if (blocked) {
 814                         sigdelset(&t->blocked, sig);
 815                         recalc_sigpending_and_wake(t);
 816                 }
 817         }
 818         ret = specific_send_sig_info(sig, info, t);
 819         spin_unlock_irqrestore(&t->sighand->siglock, flags);
 820
 821         return ret;
 822 }
 823
 824 void
 825 force_sig_specific(int sig, struct task_struct *t)
 826 {
 827         force_sig_info(sig, SEND_SIG_FORCED, t);
 828 }
 829
 830 /*
 831  * Test if P wants to take SIG.  After we've checked all threads with this,
 832  * it's equivalent to finding no threads not blocking SIG.  Any threads not
 833  * blocking SIG were ruled out because they are not running and already
 834  * have pending signals.  Such threads will dequeue from the shared queue
 835  * as soon as they're available, so putting the signal on the shared queue
 836  * will be equivalent to sending it to one such thread.
 837  */
 838 static inline int wants_signal(int sig, struct task_struct *p)
 839 {
 840         if (sigismember(&p->blocked, sig))
 841                 return 0;
 842         if (p->flags & PF_EXITING)
 843                 return 0;
 844         if (sig == SIGKILL)
 845                 return 1;
 846         if (task_is_stopped_or_traced(p))
 847                 return 0;
 848         return task_curr(p) || !signal_pending(p);
 849 }
 850
 851 static void
 852 __group_complete_signal(int sig, struct task_struct *p)
 853 {
 854         struct task_struct *t;
 855
 856         /*
 857          * Now find a thread we can wake up to take the signal off the queue.
 858          *
 859          * If the main thread wants the signal, it gets first crack.
 860          * Probably the least surprising to the average bear.
 861          */
 862         if (wants_signal(sig, p))
 863                 t = p;
 864         else if (thread_group_empty(p))
 865                 /*
 866                  * There is just one thread and it does not need to be woken.
 867                  * It will dequeue unblocked signals before it runs again.
 868                  */
 869                 return;
 870         else {
 871                 /*
 872                  * Otherwise try to find a suitable thread.
 873                  */
 874                 t = p->signal->curr_target;
 875                 if (t == NULL)
 876                         /* restart balancing at this thread */
 877                         t = p->signal->curr_target = p;
 878
 879                 while (!wants_signal(sig, t)) {
 880                         t = next_thread(t);
 881                         if (t == p->signal->curr_target)
 882                                 /*
 883                                  * No thread needs to be woken.
 884                                  * Any eligible threads will see
 885                                  * the signal in the queue soon.
 886                                  */
 887                                 return;
 888                 }
 889                 p->signal->curr_target = t;
 890         }
 891
 892         /*
 893          * Found a killable thread.  If the signal will be fatal,
 894          * then start taking the whole group down immediately.
 895          */
 896         if (sig_fatal(p, sig) && !(p->signal->flags & SIGNAL_GROUP_EXIT) &&
 897             !sigismember(&t->real_blocked, sig) &&
 898             (sig == SIGKILL || !(t->ptrace & PT_PTRACED))) {
 899                 /*
 900                  * This signal will be fatal to the whole group.
 901                  */
 902                 if (!sig_kernel_coredump(sig)) {
 903                         /*
 904                          * Start a group exit and wake everybody up.
 905                          * This way we don't have other threads
 906                          * running and doing things after a slower
 907                          * thread has the fatal signal pending.
 908                          */
 909                         p->signal->flags = SIGNAL_GROUP_EXIT;
 910                         p->signal->group_exit_code = sig;
 911                         p->signal->group_stop_count = 0;
 912                         t = p;
 913                         do {
 914                                 sigaddset(&t->pending.signal, SIGKILL);
 915                                 signal_wake_up(t, 1);
 916                         } while_each_thread(p, t);
 917                         return;
 918                 }
 919         }
 920
 921         /*
 922          * The signal is already in the shared-pending queue.
 923          * Tell the chosen thread to wake up and dequeue it.
 924          */
 925         signal_wake_up(t, sig == SIGKILL);
 926         return;
 927 }
 928
 929 int
 930 __group_send_sig_info(int sig, struct siginfo *info, struct task_struct *p)
 931 {
 932         int ret;
 933
 934         assert_spin_locked(&p->sighand->siglock);
 935         handle_stop_signal(sig, p);
 936
 937         /*
 938          * Put this signal on the shared-pending queue, or fail with EAGAIN.
 939          * We always use the shared queue for process-wide signals,
 940          * to avoid several races.
 941          */
 942         ret = send_signal(sig, info, p, &p->signal->shared_pending);
 943         if (ret <= 0)
 944                 return ret;
 945
 946         __group_complete_signal(sig, p);
 947         return 0;
 948 }
 949
 950 /*
 951  * Nuke all other threads in the group.
 952  */
 953 void zap_other_threads(struct task_struct *p)
 954 {
 955         struct task_struct *t;
 956
 957         p->signal->group_stop_count = 0;
 958
 959         for (t = next_thread(p); t != p; t = next_thread(t)) {
 960                 /*
 961                  * Don't bother with already dead threads
 962                  */
 963                 if (t->exit_state)
 964                         continue;
 965
 966                 /* SIGKILL will be handled before any pending SIGSTOP */
 967                 sigaddset(&t->pending.signal, SIGKILL);
 968                 signal_wake_up(t, 1);
 969         }
 970 }
 971
 972 int __fatal_signal_pending(struct task_struct *tsk)
 973 {
 974         return sigismember(&tsk->pending.signal, SIGKILL);
 975 }
 976 EXPORT_SYMBOL(__fatal_signal_pending);
 977
 978 struct sighand_struct *lock_task_sighand(struct task_struct *tsk, unsigned long *flags)
 979 {
 980         struct sighand_struct *sighand;
 981
 982         rcu_read_lock();
 983         for (;;) {
 984                 sighand = rcu_dereference(tsk->sighand);
 985                 if (unlikely(sighand == NULL))
 986                         break;
 987
 988                 spin_lock_irqsave(&sighand->siglock, *flags);
 989                 if (likely(sighand == tsk->sighand))
 990                         break;
 991                 spin_unlock_irqrestore(&sighand->siglock, *flags);
 992         }
 993         rcu_read_unlock();
 994
 995         return sighand;
 996 }
 997
 998 int group_send_sig_info(int sig, struct siginfo *info, struct task_struct *p)
 999 {
1000         unsigned long flags;
1001         int ret;
1002
1003         ret = check_kill_permission(sig, info, p);
1004
1005         if (!ret && sig) {
1006                 ret = -ESRCH;
1007                 if (lock_task_sighand(p, &flags)) {
1008                         ret = __group_send_sig_info(sig, info, p);
1009                         unlock_task_sighand(p, &flags);
1010                 }
1011         }
1012
1013         return ret;
1014 }
1015
1016 /*
1017  * __kill_pgrp_info() sends a signal to a process group: this is what the tty
1018  * control characters do (^C, ^Z etc)
1019  */
1020
1021 int __kill_pgrp_info(int sig, struct siginfo *info, struct pid *pgrp)
1022 {
1023         struct task_struct *p = NULL;
1024         int retval, success;
1025
1026         success = 0;
1027         retval = -ESRCH;
1028         do_each_pid_task(pgrp, PIDTYPE_PGID, p) {
1029                 int err = group_send_sig_info(sig, info, p);
1030                 success |= !err;
1031                 retval = err;
1032         } while_each_pid_task(pgrp, PIDTYPE_PGID, p);
1033         return success ? 0 : retval;
1034 }
1035
1036 int kill_pid_info(int sig, struct siginfo *info, struct pid *pid)
1037 {
1038         int error = -ESRCH;
1039         struct task_struct *p;
1040
1041         rcu_read_lock();
1042 retry:
1043         p = pid_task(pid, PIDTYPE_PID);
1044         if (p) {
1045                 error = group_send_sig_info(sig, info, p);
1046                 if (unlikely(error == -ESRCH))
1047                         /*
1048                          * The task was unhashed in between, try again.
1049                          * If it is dead, pid_task() will return NULL,
1050                          * if we race with de_thread() it will find the
1051                          * new leader.
1052                          */
1053                         goto retry;
1054         }
1055         rcu_read_unlock();
1056
1057         return error;
1058 }
1059
1060 int
1061 kill_proc_info(int sig, struct siginfo *info, pid_t pid)
1062 {
1063         int error;
1064         rcu_read_lock();
1065         error = kill_pid_info(sig, info, find_vpid(pid));
1066         rcu_read_unlock();
1067         return error;
1068 }
1069
1070 /* like kill_pid_info(), but doesn't use uid/euid of "current" */
1071 int kill_pid_info_as_uid(int sig, struct siginfo *info, struct pid *pid,
1072                       uid_t uid, uid_t euid, u32 secid)
1073 {
1074         int ret = -EINVAL;
1075         struct task_struct *p;
1076
1077         if (!valid_signal(sig))
1078                 return ret;
1079
1080         read_lock(&tasklist_lock);
1081         p = pid_task(pid, PIDTYPE_PID);
1082         if (!p) {
1083                 ret = -ESRCH;
1084                 goto out_unlock;
1085         }
1086         if ((info == SEND_SIG_NOINFO || (!is_si_special(info) && SI_FROMUSER(info)))
1087             && (euid != p->suid) && (euid != p->uid)
1088             && (uid != p->suid) && (uid != p->uid)) {
1089                 ret = -EPERM;
1090                 goto out_unlock;
1091         }
1092         ret = security_task_kill(p, info, sig, secid);
1093         if (ret)
1094                 goto out_unlock;
1095         if (sig && p->sighand) {
1096                 unsigned long flags;
1097                 spin_lock_irqsave(&p->sighand->siglock, flags);
1098                 ret = __group_send_sig_info(sig, info, p);
1099                 spin_unlock_irqrestore(&p->sighand->siglock, flags);
1100         }
1101 out_unlock:
1102         read_unlock(&tasklist_lock);
1103         return ret;
1104 }
1105 EXPORT_SYMBOL_GPL(kill_pid_info_as_uid);
1106
1107 /*
1108  * kill_something_info() interprets pid in interesting ways just like kill(2).
1109  *
1110  * POSIX specifies that kill(-1,sig) is unspecified, but what we have
1111  * is probably wrong.  Should make it like BSD or SYSV.
1112  */
1113
1114 static int kill_something_info(int sig, struct siginfo *info, int pid)
1115 {
1116         int ret;
1117
1118         if (pid > 0) {
1119                 rcu_read_lock();
1120                 ret = kill_pid_info(sig, info, find_vpid(pid));
1121                 rcu_read_unlock();
1122                 return ret;
1123         }
1124
1125         read_lock(&tasklist_lock);
1126         if (pid != -1) {
1127                 ret = __kill_pgrp_info(sig, info,
1128                                 pid ? find_vpid(-pid) : task_pgrp(current));
1129         } else {
1130                 int retval = 0, count = 0;
1131                 struct task_struct * p;
1132
1133                 for_each_process(p) {
1134                         if (p->pid > 1 && !same_thread_group(p, current)) {
1135                                 int err = group_send_sig_info(sig, info, p);
1136                                 ++count;
1137                                 if (err != -EPERM)
1138                                         retval = err;
1139                         }
1140                 }
1141                 ret = count ? retval : -ESRCH;
1142         }
1143         read_unlock(&tasklist_lock);
1144
1145         return ret;
1146 }
1147
1148 /*
1149  * These are for backward compatibility with the rest of the kernel source.
1150  */
1151
1152 /*
1153  * These two are the most common entry points.  They send a signal
1154  * just to the specific thread.
1155  */
1156 int
1157 send_sig_info(int sig, struct siginfo *info, struct task_struct *p)
1158 {
1159         int ret;
1160         unsigned long flags;
1161
1162         /*
1163          * Make sure legacy kernel users don't send in bad values
1164          * (normal paths check this in check_kill_permission).
1165          */
1166         if (!valid_signal(sig))
1167                 return -EINVAL;
1168
1169         /*
1170          * We need the tasklist lock even for the specific
1171          * thread case (when we don't need to follow the group
1172          * lists) in order to avoid races with "p->sighand"
1173          * going away or changing from under us.
1174          */
1175         read_lock(&tasklist_lock);
1176         spin_lock_irqsave(&p->sighand->siglock, flags);
1177         ret = specific_send_sig_info(sig, info, p);
1178         spin_unlock_irqrestore(&p->sighand->siglock, flags);
1179         read_unlock(&tasklist_lock);
1180         return ret;
1181 }
1182
1183 #define __si_special(priv) \
1184         ((priv) ? SEND_SIG_PRIV : SEND_SIG_NOINFO)
1185
1186 int
1187 send_sig(int sig, struct task_struct *p, int priv)
1188 {
1189         return send_sig_info(sig, __si_special(priv), p);
1190 }
1191
1192 void
1193 force_sig(int sig, struct task_struct *p)
1194 {
1195         force_sig_info(sig, SEND_SIG_PRIV, p);
1196 }
1197
1198 /*
1199  * When things go south during signal handling, we
1200  * will force a SIGSEGV. And if the signal that caused
1201  * the problem was already a SIGSEGV, we'll want to
1202  * make sure we don't even try to deliver the signal..
1203  */
1204 int
1205 force_sigsegv(int sig, struct task_struct *p)
1206 {
1207         if (sig == SIGSEGV) {
1208                 unsigned long flags;
1209                 spin_lock_irqsave(&p->sighand->siglock, flags);
1210                 p->sighand->action[sig - 1].sa.sa_handler = SIG_DFL;
1211                 spin_unlock_irqrestore(&p->sighand->siglock, flags);
1212         }
1213         force_sig(SIGSEGV, p);
1214         return 0;
1215 }
1216
1217 int kill_pgrp(struct pid *pid, int sig, int priv)
1218 {
1219         int ret;
1220
1221         read_lock(&tasklist_lock);
1222         ret = __kill_pgrp_info(sig, __si_special(priv), pid);
1223         read_unlock(&tasklist_lock);
1224
1225         return ret;
1226 }
1227 EXPORT_SYMBOL(kill_pgrp);
1228
1229 int kill_pid(struct pid *pid, int sig, int priv)
1230 {
1231         return kill_pid_info(sig, __si_special(priv), pid);
1232 }
1233 EXPORT_SYMBOL(kill_pid);
1234
1235 int
1236 kill_proc(pid_t pid, int sig, int priv)
1237 {
1238         int ret;
1239
1240         rcu_read_lock();
1241         ret = kill_pid_info(sig, __si_special(priv), find_pid(pid));
1242         rcu_read_unlock();
1243         return ret;
1244 }
1245
1246 /*
1247  * These functions support sending signals using preallocated sigqueue
1248  * structures.  This is needed "because realtime applications cannot
1249  * afford to lose notifications of asynchronous events, like timer
1250  * expirations or I/O completions".  In the case of Posix Timers
1251  * we allocate the sigqueue structure from the timer_create.  If this
1252  * allocation fails we are able to report the failure to the application
1253  * with an EAGAIN error.
1254  */
1255
1256 struct sigqueue *sigqueue_alloc(void)
1257 {
1258         struct sigqueue *q;
1259
1260         if ((q = __sigqueue_alloc(current, GFP_KERNEL, 0)))
1261                 q->flags |= SIGQUEUE_PREALLOC;
1262         return(q);
1263 }
1264
1265 void sigqueue_free(struct sigqueue *q)
1266 {
1267         unsigned long flags;
1268         spinlock_t *lock = &current->sighand->siglock;
1269
1270         BUG_ON(!(q->flags & SIGQUEUE_PREALLOC));
1271         /*
1272          * If the signal is still pending remove it from the
1273          * pending queue. We must hold ->siglock while testing
1274          * q->list to serialize with collect_signal().
1275          */
1276         spin_lock_irqsave(lock, flags);
1277         if (!list_empty(&q->list))
1278                 list_del_init(&q->list);
1279         spin_unlock_irqrestore(lock, flags);
1280
1281         q->flags &= ~SIGQUEUE_PREALLOC;
1282         __sigqueue_free(q);
1283 }
1284
1285 static int do_send_sigqueue(int sig, struct sigqueue *q, struct task_struct *t,
1286                 struct sigpending *pending)
1287 {
1288         if (unlikely(!list_empty(&q->list))) {
1289                 /*
1290                  * If an SI_TIMER entry is already queue just increment
1291                  * the overrun count.
1292                  */
1293
1294                 BUG_ON(q->info.si_code != SI_TIMER);
1295                 q->info.si_overrun++;
1296                 return 0;
1297         }
1298
1299         if (sig_ignored(t, sig))
1300                 return 1;
1301
1302         signalfd_notify(t, sig);
1303         list_add_tail(&q->list, &pending->list);
1304         sigaddset(&pending->signal, sig);
1305         return 0;
1306 }
1307
1308 int send_sigqueue(int sig, struct sigqueue *q, struct task_struct *p)
1309 {
1310         unsigned long flags;
1311         int ret = -1;
1312
1313         BUG_ON(!(q->flags & SIGQUEUE_PREALLOC));
1314
1315         /*
1316          * The rcu based delayed sighand destroy makes it possible to
1317          * run this without tasklist lock held. The task struct itself
1318          * cannot go away as create_timer did get_task_struct().
1319          *
1320          * We return -1, when the task is marked exiting, so
1321          * posix_timer_event can redirect it to the group leader
1322          */
1323         rcu_read_lock();
1324
1325         if (!likely(lock_task_sighand(p, &flags)))
1326                 goto out_err;
1327
1328         ret = do_send_sigqueue(sig, q, p, &p->pending);
1329
1330         if (!sigismember(&p->blocked, sig))
1331                 signal_wake_up(p, sig == SIGKILL);
1332
1333         unlock_task_sighand(p, &flags);
1334 out_err:
1335         rcu_read_unlock();
1336
1337         return ret;
1338 }
1339
1340 int
1341 send_group_sigqueue(int sig, struct sigqueue *q, struct task_struct *p)
1342 {
1343         unsigned long flags;
1344         int ret;
1345
1346         BUG_ON(!(q->flags & SIGQUEUE_PREALLOC));
1347
1348         read_lock(&tasklist_lock);
1349         /* Since it_lock is held, p->sighand cannot be NULL. */
1350         spin_lock_irqsave(&p->sighand->siglock, flags);
1351         handle_stop_signal(sig, p);
1352
1353         ret = do_send_sigqueue(sig, q, p, &p->signal->shared_pending);
1354
1355         __group_complete_signal(sig, p);
1356
1357         spin_unlock_irqrestore(&p->sighand->siglock, flags);
1358         read_unlock(&tasklist_lock);
1359         return ret;
1360 }
1361
1362 /*
1363  * Wake up any threads in the parent blocked in wait* syscalls.
1364  */
1365 static inline void __wake_up_parent(struct task_struct *p,
1366                                     struct task_struct *parent)
1367 {
1368         wake_up_interruptible_sync(&parent->signal->wait_chldexit);
1369 }
1370
1371 /*
1372  * Let a parent know about the death of a child.
1373  * For a stopped/continued status change, use do_notify_parent_cldstop instead.
1374  */
1375
1376 void do_notify_parent(struct task_struct *tsk, int sig)
1377 {
1378         struct siginfo info;
1379         unsigned long flags;
1380         struct sighand_struct *psig;
1381
1382         BUG_ON(sig == -1);
1383
1384         /* do_notify_parent_cldstop should have been called instead.  */
1385         BUG_ON(task_is_stopped_or_traced(tsk));
1386
1387         BUG_ON(!tsk->ptrace &&
1388                (tsk->group_leader != tsk || !thread_group_empty(tsk)));
1389
1390         info.si_signo = sig;
1391         info.si_errno = 0;
1392         /*
1393          * we are under tasklist_lock here so our parent is tied to
1394          * us and cannot exit and release its namespace.
1395          *
1396          * the only it can is to switch its nsproxy with sys_unshare,
1397          * bu uncharing pid namespaces is not allowed, so we'll always
1398          * see relevant namespace
1399          *
1400          * write_lock() currently calls preempt_disable() which is the
1401          * same as rcu_read_lock(), but according to Oleg, this is not
1402          * correct to rely on this
1403          */
1404         rcu_read_lock();
1405         info.si_pid = task_pid_nr_ns(tsk, tsk->parent->nsproxy->pid_ns);
1406         rcu_read_unlock();
1407
1408         info.si_uid = tsk->uid;
1409
1410         /* FIXME: find out whether or not this is supposed to be c*time. */
1411         info.si_utime = cputime_to_jiffies(cputime_add(tsk->utime,
1412                                                        tsk->signal->utime));
1413         info.si_stime = cputime_to_jiffies(cputime_add(tsk->stime,
1414                                                        tsk->signal->stime));
1415
1416         info.si_status = tsk->exit_code & 0x7f;
1417         if (tsk->exit_code & 0x80)
1418                 info.si_code = CLD_DUMPED;
1419         else if (tsk->exit_code & 0x7f)
1420                 info.si_code = CLD_KILLED;
1421         else {
1422                 info.si_code = CLD_EXITED;
1423                 info.si_status = tsk->exit_code >> 8;
1424         }
1425
1426         psig = tsk->parent->sighand;
1427         spin_lock_irqsave(&psig->siglock, flags);
1428         if (!tsk->ptrace && sig == SIGCHLD &&
1429             (psig->action[SIGCHLD-1].sa.sa_handler == SIG_IGN ||
1430              (psig->action[SIGCHLD-1].sa.sa_flags & SA_NOCLDWAIT))) {
1431                 /*
1432                  * We are exiting and our parent doesn't care.  POSIX.1
1433                  * defines special semantics for setting SIGCHLD to SIG_IGN
1434                  * or setting the SA_NOCLDWAIT flag: we should be reaped
1435                  * automatically and not left for our parent's wait4 call.
1436                  * Rather than having the parent do it as a magic kind of
1437                  * signal handler, we just set this to tell do_exit that we
1438                  * can be cleaned up without becoming a zombie.  Note that
1439                  * we still call __wake_up_parent in this case, because a
1440                  * blocked sys_wait4 might now return -ECHILD.
1441                  *
1442                  * Whether we send SIGCHLD or not for SA_NOCLDWAIT
1443                  * is implementation-defined: we do (if you don't want
1444                  * it, just use SIG_IGN instead).
1445                  */
1446                 tsk->exit_signal = -1;
1447                 if (psig->action[SIGCHLD-1].sa.sa_handler == SIG_IGN)
1448                         sig = 0;
1449         }
1450         if (valid_signal(sig) && sig > 0)
1451                 __group_send_sig_info(sig, &info, tsk->parent);
1452         __wake_up_parent(tsk, tsk->parent);
1453         spin_unlock_irqrestore(&psig->siglock, flags);
1454 }
1455
1456 static void do_notify_parent_cldstop(struct task_struct *tsk, int why)
1457 {
1458         struct siginfo info;
1459         unsigned long flags;
1460         struct task_struct *parent;
1461         struct sighand_struct *sighand;
1462
1463         if (tsk->ptrace & PT_PTRACED)
1464                 parent = tsk->parent;
1465         else {
1466                 tsk = tsk->group_leader;
1467                 parent = tsk->real_parent;
1468         }
1469
1470         info.si_signo = SIGCHLD;
1471         info.si_errno = 0;
1472         /*
1473          * see comment in do_notify_parent() abot the following 3 lines
1474          */
1475         rcu_read_lock();
1476         info.si_pid = task_pid_nr_ns(tsk, tsk->parent->nsproxy->pid_ns);
1477         rcu_read_unlock();
1478
1479         info.si_uid = tsk->uid;
1480
1481         /* FIXME: find out whether or not this is supposed to be c*time. */
1482         info.si_utime = cputime_to_jiffies(tsk->utime);
1483         info.si_stime = cputime_to_jiffies(tsk->stime);
1484
1485         info.si_code = why;
1486         switch (why) {
1487         case CLD_CONTINUED:
1488                 info.si_status = SIGCONT;
1489                 break;
1490         case CLD_STOPPED:
1491                 info.si_status = tsk->signal->group_exit_code & 0x7f;
1492                 break;
1493         case CLD_TRAPPED:
1494                 info.si_status = tsk->exit_code & 0x7f;
1495                 break;
1496         default:
1497                 BUG();
1498         }
1499
1500         sighand = parent->sighand;
1501         spin_lock_irqsave(&sighand->siglock, flags);
1502         if (sighand->action[SIGCHLD-1].sa.sa_handler != SIG_IGN &&
1503             !(sighand->action[SIGCHLD-1].sa.sa_flags & SA_NOCLDSTOP))
1504                 __group_send_sig_info(SIGCHLD, &info, parent);
1505         /*
1506          * Even if SIGCHLD is not generated, we must wake up wait4 calls.
1507          */
1508         __wake_up_parent(tsk, parent);
1509         spin_unlock_irqrestore(&sighand->siglock, flags);
1510 }
1511
1512 static inline int may_ptrace_stop(void)
1513 {
1514         if (!likely(current->ptrace & PT_PTRACED))
1515                 return 0;
1516         /*
1517          * Are we in the middle of do_coredump?
1518          * If so and our tracer is also part of the coredump stopping
1519          * is a deadlock situation, and pointless because our tracer
1520          * is dead so don't allow us to stop.
1521          * If SIGKILL was already sent before the caller unlocked
1522          * ->siglock we must see ->core_waiters != 0. Otherwise it
1523          * is safe to enter schedule().
1524          */
1525         if (unlikely(current->mm->core_waiters) &&
1526             unlikely(current->mm == current->parent->mm))
1527                 return 0;
1528
1529         return 1;
1530 }
1531
1532 /*
1533  * Return nonzero if there is a SIGKILL that should be waking us up.
1534  * Called with the siglock held.
1535  */
1536 static int sigkill_pending(struct task_struct *tsk)
1537 {
1538         return ((sigismember(&tsk->pending.signal, SIGKILL) ||
1539                  sigismember(&tsk->signal->shared_pending.signal, SIGKILL)) &&
1540                 !unlikely(sigismember(&tsk->blocked, SIGKILL)));
1541 }
1542
1543 /*
1544  * This must be called with current->sighand->siglock held.
1545  *
1546  * This should be the path for all ptrace stops.
1547  * We always set current->last_siginfo while stopped here.
1548  * That makes it a way to test a stopped process for
1549  * being ptrace-stopped vs being job-control-stopped.
1550  *
1551  * If we actually decide not to stop at all because the tracer
1552  * is gone, we keep current->exit_code unless clear_code.
1553  */
1554 static void ptrace_stop(int exit_code, int clear_code, siginfo_t *info)
1555 {
1556         int killed = 0;
1557
1558         if (arch_ptrace_stop_needed(exit_code, info)) {
1559                 /*
1560                  * The arch code has something special to do before a
1561                  * ptrace stop.  This is allowed to block, e.g. for faults
1562                  * on user stack pages.  We can't keep the siglock while
1563                  * calling arch_ptrace_stop, so we must release it now.
1564                  * To preserve proper semantics, we must do this before
1565                  * any signal bookkeeping like checking group_stop_count.
1566                  * Meanwhile, a SIGKILL could come in before we retake the
1567                  * siglock.  That must prevent us from sleeping in TASK_TRACED.
1568                  * So after regaining the lock, we must check for SIGKILL.
1569                  */
1570                 spin_unlock_irq(&current->sighand->siglock);
1571                 arch_ptrace_stop(exit_code, info);
1572                 spin_lock_irq(&current->sighand->siglock);
1573                 killed = sigkill_pending(current);
1574         }
1575
1576         /*
1577          * If there is a group stop in progress,
1578          * we must participate in the bookkeeping.
1579          */
1580         if (current->signal->group_stop_count > 0)
1581                 --current->signal->group_stop_count;
1582
1583         current->last_siginfo = info;
1584         current->exit_code = exit_code;
1585
1586         /* Let the debugger run.  */
1587         __set_current_state(TASK_TRACED);
1588         spin_unlock_irq(&current->sighand->siglock);
1589         read_lock(&tasklist_lock);
1590         if (!unlikely(killed) && may_ptrace_stop()) {
1591                 do_notify_parent_cldstop(current, CLD_TRAPPED);
1592                 read_unlock(&tasklist_lock);
1593                 schedule();
1594         } else {
1595                 /*
1596                  * By the time we got the lock, our tracer went away.
1597                  * Don't drop the lock yet, another tracer may come.
1598                  */
1599                 __set_current_state(TASK_RUNNING);
1600                 if (clear_code)
1601                         current->exit_code = 0;
1602                 read_unlock(&tasklist_lock);
1603         }
1604
1605         /*
1606          * While in TASK_TRACED, we were considered "frozen enough".
1607          * Now that we woke up, it's crucial if we're supposed to be
1608          * frozen that we freeze now before running anything substantial.
1609          */
1610         try_to_freeze();
1611
1612         /*
1613          * We are back.  Now reacquire the siglock before touching
1614          * last_siginfo, so that we are sure to have synchronized with
1615          * any signal-sending on another CPU that wants to examine it.
1616          */
1617         spin_lock_irq(&current->sighand->siglock);
1618         current->last_siginfo = NULL;
1619
1620         /*
1621          * Queued signals ignored us while we were stopped for tracing.
1622          * So check for any that we should take before resuming user mode.
1623          * This sets TIF_SIGPENDING, but never clears it.
1624          */
1625         recalc_sigpending_tsk(current);
1626 }
1627
1628 void ptrace_notify(int exit_code)
1629 {
1630         siginfo_t info;
1631
1632         BUG_ON((exit_code & (0x7f | ~0xffff)) != SIGTRAP);
1633
1634         memset(&info, 0, sizeof info);
1635         info.si_signo = SIGTRAP;
1636         info.si_code = exit_code;
1637         info.si_pid = task_pid_vnr(current);
1638         info.si_uid = current->uid;
1639
1640         /* Let the debugger run.  */
1641         spin_lock_irq(&current->sighand->siglock);
1642         ptrace_stop(exit_code, 1, &info);
1643         spin_unlock_irq(&current->sighand->siglock);
1644 }
1645
1646 static void
1647 finish_stop(int stop_count)
1648 {
1649         /*
1650          * If there are no other threads in the group, or if there is
1651          * a group stop in progress and we are the last to stop,
1652          * report to the parent.  When ptraced, every thread reports itself.
1653          */
1654         if (stop_count == 0 || (current->ptrace & PT_PTRACED)) {
1655                 read_lock(&tasklist_lock);
1656                 do_notify_parent_cldstop(current, CLD_STOPPED);
1657                 read_unlock(&tasklist_lock);
1658         }
1659
1660         do {
1661                 schedule();
1662         } while (try_to_freeze());
1663         /*
1664          * Now we don't run again until continued.
1665          */
1666         current->exit_code = 0;
1667 }
1668
1669 /*
1670  * This performs the stopping for SIGSTOP and other stop signals.
1671  * We have to stop all threads in the thread group.
1672  * Returns nonzero if we've actually stopped and released the siglock.
1673  * Returns zero if we didn't stop and still hold the siglock.
1674  */
1675 static int do_signal_stop(int signr)
1676 {
1677         struct signal_struct *sig = current->signal;
1678         int stop_count;
1679
1680         if (sig->group_stop_count > 0) {
1681                 /*
1682                  * There is a group stop in progress.  We don't need to
1683                  * start another one.
1684                  */
1685                 stop_count = --sig->group_stop_count;
1686         } else {
1687                 struct task_struct *t;
1688
1689                 if (!likely(sig->flags & SIGNAL_STOP_DEQUEUED) ||
1690                     unlikely(signal_group_exit(sig)))
1691                         return 0;
1692                 /*
1693                  * There is no group stop already in progress.
1694                  * We must initiate one now.
1695                  */
1696                 sig->group_exit_code = signr;
1697
1698                 stop_count = 0;
1699                 for (t = next_thread(current); t != current; t = next_thread(t))
1700                         /*
1701                          * Setting state to TASK_STOPPED for a group
1702                          * stop is always done with the siglock held,
1703                          * so this check has no races.
1704                          */
1705                         if (!(t->flags & PF_EXITING) &&
1706                             !task_is_stopped_or_traced(t)) {
1707                                 stop_count++;
1708                                 signal_wake_up(t, 0);
1709                         }
1710                 sig->group_stop_count = stop_count;
1711         }
1712
1713         if (stop_count == 0)
1714                 sig->flags = SIGNAL_STOP_STOPPED;
1715         current->exit_code = sig->group_exit_code;
1716         __set_current_state(TASK_STOPPED);
1717
1718         spin_unlock_irq(&current->sighand->siglock);
1719         finish_stop(stop_count);
1720         return 1;
1721 }
1722
1723 static int ptrace_signal(int signr, siginfo_t *info,
1724                          struct pt_regs *regs, void *cookie)
1725 {
1726         if (!(current->ptrace & PT_PTRACED))
1727                 return signr;
1728
1729         ptrace_signal_deliver(regs, cookie);
1730
1731         /* Let the debugger run.  */
1732         ptrace_stop(signr, 0, info);
1733
1734         /* We're back.  Did the debugger cancel the sig?  */
1735         signr = current->exit_code;
1736         if (signr == 0)
1737                 return signr;
1738
1739         current->exit_code = 0;
1740
1741         /* Update the siginfo structure if the signal has
1742            changed.  If the debugger wanted something
1743            specific in the siginfo structure then it should
1744            have updated *info via PTRACE_SETSIGINFO.  */
1745         if (signr != info->si_signo) {
1746                 info->si_signo = signr;
1747                 info->si_errno = 0;
1748                 info->si_code = SI_USER;
1749                 info->si_pid = task_pid_vnr(current->parent);
1750                 info->si_uid = current->parent->uid;
1751         }
1752
1753         /* If the (new) signal is now blocked, requeue it.  */
1754         if (sigismember(&current->blocked, signr)) {
1755                 specific_send_sig_info(signr, info, current);
1756                 signr = 0;
1757         }
1758
1759         return signr;
1760 }
1761
1762 int get_signal_to_deliver(siginfo_t *info, struct k_sigaction *return_ka,
1763                           struct pt_regs *regs, void *cookie)
1764 {
1765         sigset_t *mask = &current->blocked;
1766         int signr = 0;
1767
1768 relock:
1769         /*
1770          * We'll jump back here after any time we were stopped in TASK_STOPPED.
1771          * While in TASK_STOPPED, we were considered "frozen enough".
1772          * Now that we woke up, it's crucial if we're supposed to be
1773          * frozen that we freeze now before running anything substantial.
1774          */
1775         try_to_freeze();
1776
1777         spin_lock_irq(&current->sighand->siglock);
1778
1779         if (unlikely(current->signal->flags & SIGNAL_CLD_MASK)) {
1780                 int why = (current->signal->flags & SIGNAL_STOP_CONTINUED)
1781                                 ? CLD_CONTINUED : CLD_STOPPED;
1782                 current->signal->flags &= ~SIGNAL_CLD_MASK;
1783                 spin_unlock_irq(&current->sighand->siglock);
1784
1785                 read_lock(&tasklist_lock);
1786                 do_notify_parent_cldstop(current->group_leader, why);
1787                 read_unlock(&tasklist_lock);
1788                 goto relock;
1789         }
1790
1791         for (;;) {
1792                 struct k_sigaction *ka;
1793
1794                 if (unlikely(current->signal->group_stop_count > 0) &&
1795                     do_signal_stop(0))
1796                         goto relock;
1797
1798                 signr = dequeue_signal(current, mask, info);
1799
1800                 if (!signr)
1801                         break; /* will return 0 */
1802
1803                 if (signr != SIGKILL) {
1804                         signr = ptrace_signal(signr, info, regs, cookie);
1805                         if (!signr)
1806                                 continue;
1807                 }
1808
1809                 ka = &current->sighand->action[signr-1];
1810                 if (ka->sa.sa_handler == SIG_IGN) /* Do nothing.  */
1811                         continue;
1812                 if (ka->sa.sa_handler != SIG_DFL) {
1813                         /* Run the handler.  */
1814                         *return_ka = *ka;
1815
1816                         if (ka->sa.sa_flags & SA_ONESHOT)
1817                                 ka->sa.sa_handler = SIG_DFL;
1818
1819                         break; /* will return non-zero "signr" value */
1820                 }
1821
1822                 /*
1823                  * Now we are doing the default action for this signal.
1824                  */
1825                 if (sig_kernel_ignore(signr)) /* Default is nothing. */
1826                         continue;
1827
1828                 /*
1829                  * Global init gets no signals it doesn't want.
1830                  */
1831                 if (is_global_init(current))
1832                         continue;
1833
1834                 if (sig_kernel_stop(signr)) {
1835                         /*
1836                          * The default action is to stop all threads in
1837                          * the thread group.  The job control signals
1838                          * do nothing in an orphaned pgrp, but SIGSTOP
1839                          * always works.  Note that siglock needs to be
1840                          * dropped during the call to is_orphaned_pgrp()
1841                          * because of lock ordering with tasklist_lock.
1842                          * This allows an intervening SIGCONT to be posted.
1843                          * We need to check for that and bail out if necessary.
1844                          */
1845                         if (signr != SIGSTOP) {
1846                                 spin_unlock_irq(&current->sighand->siglock);
1847
1848                                 /* signals can be posted during this window */
1849
1850                                 if (is_current_pgrp_orphaned())
1851                                         goto relock;
1852
1853                                 spin_lock_irq(&current->sighand->siglock);
1854                         }
1855
1856                         if (likely(do_signal_stop(signr))) {
1857                                 /* It released the siglock.  */
1858                                 goto relock;
1859                         }
1860
1861                         /*
1862                          * We didn't actually stop, due to a race
1863                          * with SIGCONT or something like that.
1864                          */
1865                         continue;
1866                 }
1867
1868                 spin_unlock_irq(&current->sighand->siglock);
1869
1870                 /*
1871                  * Anything else is fatal, maybe with a core dump.
1872                  */
1873                 current->flags |= PF_SIGNALED;
1874                 if ((signr != SIGKILL) && print_fatal_signals)
1875                         print_fatal_signal(regs, signr);
1876                 if (sig_kernel_coredump(signr)) {
1877                         /*
1878                          * If it was able to dump core, this kills all
1879                          * other threads in the group and synchronizes with
1880                          * their demise.  If we lost the race with another
1881                          * thread getting here, it set group_exit_code
1882                          * first and our do_group_exit call below will use
1883                          * that value and ignore the one we pass it.
1884                          */
1885                         do_coredump((long)signr, signr, regs);
1886                 }
1887
1888                 /*
1889                  * Death signals, no core dump.
1890                  */
1891                 do_group_exit(signr);
1892                 /* NOTREACHED */
1893         }
1894         spin_unlock_irq(&current->sighand->siglock);
1895         return signr;
1896 }
1897
1898 void exit_signals(struct task_struct *tsk)
1899 {
1900         int group_stop = 0;
1901         struct task_struct *t;
1902
1903         if (thread_group_empty(tsk) || signal_group_exit(tsk->signal)) {
1904                 tsk->flags |= PF_EXITING;
1905                 return;
1906         }
1907
1908         spin_lock_irq(&tsk->sighand->siglock);
1909         /*
1910          * From now this task is not visible for group-wide signals,
1911          * see wants_signal(), do_signal_stop().
1912          */
1913         tsk->flags |= PF_EXITING;
1914         if (!signal_pending(tsk))
1915                 goto out;
1916
1917         /* It could be that __group_complete_signal() choose us to
1918          * notify about group-wide signal. Another thread should be
1919          * woken now to take the signal since we will not.
1920          */
1921         for (t = tsk; (t = next_thread(t)) != tsk; )
1922                 if (!signal_pending(t) && !(t->flags & PF_EXITING))
1923                         recalc_sigpending_and_wake(t);
1924
1925         if (unlikely(tsk->signal->group_stop_count) &&
1926                         !--tsk->signal->group_stop_count) {
1927                 tsk->signal->flags = SIGNAL_STOP_STOPPED;
1928                 group_stop = 1;
1929         }
1930 out:
1931         spin_unlock_irq(&tsk->sighand->siglock);
1932
1933         if (unlikely(group_stop)) {
1934                 read_lock(&tasklist_lock);
1935                 do_notify_parent_cldstop(tsk, CLD_STOPPED);
1936                 read_unlock(&tasklist_lock);
1937         }
1938 }
1939
1940 EXPORT_SYMBOL(recalc_sigpending);
1941 EXPORT_SYMBOL_GPL(dequeue_signal);
1942 EXPORT_SYMBOL(flush_signals);
1943 EXPORT_SYMBOL(force_sig);
1944 EXPORT_SYMBOL(kill_proc);
1945 EXPORT_SYMBOL(ptrace_notify);
1946 EXPORT_SYMBOL(send_sig);
1947 EXPORT_SYMBOL(send_sig_info);
1948 EXPORT_SYMBOL(sigprocmask);
1949 EXPORT_SYMBOL(block_all_signals);
1950 EXPORT_SYMBOL(unblock_all_signals);
1951
1952
1953 /*
1954  * System call entry points.
1955  */
1956
1957 asmlinkage long sys_restart_syscall(void)
1958 {
1959         struct restart_block *restart = &current_thread_info()->restart_block;
1960         return restart->fn(restart);
1961 }
1962
1963 long do_no_restart_syscall(struct restart_block *param)
1964 {
1965         return -EINTR;
1966 }
1967
1968 /*
1969  * We don't need to get the kernel lock - this is all local to this
1970  * particular thread.. (and that's good, because this is _heavily_
1971  * used by various programs)
1972  */
1973
1974 /*
1975  * This is also useful for kernel threads that want to temporarily
1976  * (or permanently) block certain signals.
1977  *
1978  * NOTE! Unlike the user-mode sys_sigprocmask(), the kernel
1979  * interface happily blocks "unblockable" signals like SIGKILL
1980  * and friends.
1981  */
1982 int sigprocmask(int how, sigset_t *set, sigset_t *oldset)
1983 {
1984         int error;
1985
1986         spin_lock_irq(&current->sighand->siglock);
1987         if (oldset)
1988                 *oldset = current->blocked;
1989
1990         error = 0;
1991         switch (how) {
1992         case SIG_BLOCK:
1993                 sigorsets(&current->blocked, &current->blocked, set);
1994                 break;
1995         case SIG_UNBLOCK:
1996                 signandsets(&current->blocked, &current->blocked, set);
1997                 break;
1998         case SIG_SETMASK:
1999                 current->blocked = *set;
2000                 break;
2001         default:
2002                 error = -EINVAL;
2003         }
2004         recalc_sigpending();
2005         spin_unlock_irq(&current->sighand->siglock);
2006
2007         return error;
2008 }
2009
2010 asmlinkage long
2011 sys_rt_sigprocmask(int how, sigset_t __user *set, sigset_t __user *oset, size_t sigsetsize)
2012 {
2013         int error = -EINVAL;
2014         sigset_t old_set, new_set;
2015
2016         /* XXX: Don't preclude handling different sized sigset_t's.  */
2017         if (sigsetsize != sizeof(sigset_t))
2018                 goto out;
2019
2020         if (set) {
2021                 error = -EFAULT;
2022                 if (copy_from_user(&new_set, set, sizeof(*set)))
2023                         goto out;
2024                 sigdelsetmask(&new_set, sigmask(SIGKILL)|sigmask(SIGSTOP));
2025
2026                 error = sigprocmask(how, &new_set, &old_set);
2027                 if (error)
2028                         goto out;
2029                 if (oset)
2030                         goto set_old;
2031         } else if (oset) {
2032                 spin_lock_irq(&current->sighand->siglock);
2033                 old_set = current->blocked;
2034                 spin_unlock_irq(&current->sighand->siglock);
2035
2036         set_old:
2037                 error = -EFAULT;
2038                 if (copy_to_user(oset, &old_set, sizeof(*oset)))
2039                         goto out;
2040         }
2041         error = 0;
2042 out:
2043         return error;
2044 }
2045
2046 long do_sigpending(void __user *set, unsigned long sigsetsize)
2047 {
2048         long error = -EINVAL;
2049         sigset_t pending;
2050
2051         if (sigsetsize > sizeof(sigset_t))
2052                 goto out;
2053
2054         spin_lock_irq(&current->sighand->siglock);
2055         sigorsets(&pending, &current->pending.signal,
2056                   &current->signal->shared_pending.signal);
2057         spin_unlock_irq(&current->sighand->siglock);
2058
2059         /* Outside the lock because only this thread touches it.  */
2060         sigandsets(&pending, &current->blocked, &pending);
2061
2062         error = -EFAULT;
2063         if (!copy_to_user(set, &pending, sigsetsize))
2064                 error = 0;
2065
2066 out:
2067         return error;
2068 }
2069
2070 asmlinkage long
2071 sys_rt_sigpending(sigset_t __user *set, size_t sigsetsize)
2072 {
2073         return do_sigpending(set, sigsetsize);
2074 }
2075
2076 #ifndef HAVE_ARCH_COPY_SIGINFO_TO_USER
2077
2078 int copy_siginfo_to_user(siginfo_t __user *to, siginfo_t *from)
2079 {
2080         int err;
2081
2082         if (!access_ok (VERIFY_WRITE, to, sizeof(siginfo_t)))
2083                 return -EFAULT;
2084         if (from->si_code < 0)
2085                 return __copy_to_user(to, from, sizeof(siginfo_t))
2086                         ? -EFAULT : 0;
2087         /*
2088          * If you change siginfo_t structure, please be sure
2089          * this code is fixed accordingly.
2090          * Please remember to update the signalfd_copyinfo() function
2091          * inside fs/signalfd.c too, in case siginfo_t changes.
2092          * It should never copy any pad contained in the structure
2093          * to avoid security leaks, but must copy the generic
2094          * 3 ints plus the relevant union member.
2095          */
2096         err = __put_user(from->si_signo, &to->si_signo);
2097         err |= __put_user(from->si_errno, &to->si_errno);
2098         err |= __put_user((short)from->si_code, &to->si_code);
2099         switch (from->si_code & __SI_MASK) {
2100         case __SI_KILL:
2101                 err |= __put_user(from->si_pid, &to->si_pid);
2102                 err |= __put_user(from->si_uid, &to->si_uid);
2103                 break;
2104         case __SI_TIMER:
2105                  err |= __put_user(from->si_tid, &to->si_tid);
2106                  err |= __put_user(from->si_overrun, &to->si_overrun);
2107                  err |= __put_user(from->si_ptr, &to->si_ptr);
2108                 break;
2109         case __SI_POLL:
2110                 err |= __put_user(from->si_band, &to->si_band);
2111                 err |= __put_user(from->si_fd, &to->si_fd);
2112                 break;
2113         case __SI_FAULT:
2114                 err |= __put_user(from->si_addr, &to->si_addr);
2115 #ifdef __ARCH_SI_TRAPNO
2116                 err |= __put_user(from->si_trapno, &to->si_trapno);
2117 #endif
2118                 break;
2119         case __SI_CHLD:
2120                 err |= __put_user(from->si_pid, &to->si_pid);
2121                 err |= __put_user(from->si_uid, &to->si_uid);
2122                 err |= __put_user(from->si_status, &to->si_status);
2123                 err |= __put_user(from->si_utime, &to->si_utime);
2124                 err |= __put_user(from->si_stime, &to->si_stime);
2125                 break;
2126         case __SI_RT: /* This is not generated by the kernel as of now. */
2127         case __SI_MESGQ: /* But this is */
2128                 err |= __put_user(from->si_pid, &to->si_pid);
2129                 err |= __put_user(from->si_uid, &to->si_uid);
2130                 err |= __put_user(from->si_ptr, &to->si_ptr);
2131                 break;
2132         default: /* this is just in case for now ... */
2133                 err |= __put_user(from->si_pid, &to->si_pid);
2134                 err |= __put_user(from->si_uid, &to->si_uid);
2135                 break;
2136         }
2137         return err;
2138 }
2139
2140 #endif
2141
2142 asmlinkage long
2143 sys_rt_sigtimedwait(const sigset_t __user *uthese,
2144                     siginfo_t __user *uinfo,
2145                     const struct timespec __user *uts,
2146                     size_t sigsetsize)
2147 {
2148         int ret, sig;
2149         sigset_t these;
2150         struct timespec ts;
2151         siginfo_t info;
2152         long timeout = 0;
2153
2154         /* XXX: Don't preclude handling different sized sigset_t's.  */
2155         if (sigsetsize != sizeof(sigset_t))
2156                 return -EINVAL;
2157
2158         if (copy_from_user(&these, uthese, sizeof(these)))
2159                 return -EFAULT;
2160
2161         /*
2162          * Invert the set of allowed signals to get those we
2163          * want to block.
2164          */
2165         sigdelsetmask(&these, sigmask(SIGKILL)|sigmask(SIGSTOP));
2166         signotset(&these);
2167
2168         if (uts) {
2169                 if (copy_from_user(&ts, uts, sizeof(ts)))
2170                         return -EFAULT;
2171                 if (ts.tv_nsec >= 1000000000L || ts.tv_nsec < 0
2172                     || ts.tv_sec < 0)
2173                         return -EINVAL;
2174         }
2175
2176         spin_lock_irq(&current->sighand->siglock);
2177         sig = dequeue_signal(current, &these, &info);
2178         if (!sig) {
2179                 timeout = MAX_SCHEDULE_TIMEOUT;
2180                 if (uts)
2181                         timeout = (timespec_to_jiffies(&ts)
2182                                    + (ts.tv_sec || ts.tv_nsec));
2183
2184                 if (timeout) {
2185                         /* None ready -- temporarily unblock those we're
2186                          * interested while we are sleeping in so that we'll
2187                          * be awakened when they arrive.  */
2188                         current->real_blocked = current->blocked;
2189                         sigandsets(&current->blocked, &current->blocked, &these);
2190                         recalc_sigpending();
2191                         spin_unlock_irq(&current->sighand->siglock);
2192
2193                         timeout = schedule_timeout_interruptible(timeout);
2194
2195                         spin_lock_irq(&current->sighand->siglock);
2196                         sig = dequeue_signal(current, &these, &info);
2197                         current->blocked = current->real_blocked;
2198                         siginitset(&current->real_blocked, 0);
2199                         recalc_sigpending();
2200                 }
2201         }
2202         spin_unlock_irq(&current->sighand->siglock);
2203
2204         if (sig) {
2205                 ret = sig;
2206                 if (uinfo) {
2207                         if (copy_siginfo_to_user(uinfo, &info))
2208                                 ret = -EFAULT;
2209                 }
2210         } else {
2211                 ret = -EAGAIN;
2212                 if (timeout)
2213                         ret = -EINTR;
2214         }
2215
2216         return ret;
2217 }
2218
2219 asmlinkage long
2220 sys_kill(int pid, int sig)
2221 {
2222         struct siginfo info;
2223
2224         info.si_signo = sig;
2225         info.si_errno = 0;
2226         info.si_code = SI_USER;
2227         info.si_pid = task_tgid_vnr(current);
2228         info.si_uid = current->uid;
2229
2230         return kill_something_info(sig, &info, pid);
2231 }
2232
2233 static int do_tkill(int tgid, int pid, int sig)
2234 {
2235         int error;
2236         struct siginfo info;
2237         struct task_struct *p;
2238
2239         error = -ESRCH;
2240         info.si_signo = sig;
2241         info.si_errno = 0;
2242         info.si_code = SI_TKILL;
2243         info.si_pid = task_tgid_vnr(current);
2244         info.si_uid = current->uid;
2245
2246         read_lock(&tasklist_lock);
2247         p = find_task_by_vpid(pid);
2248         if (p && (tgid <= 0 || task_tgid_vnr(p) == tgid)) {
2249                 error = check_kill_permission(sig, &info, p);
2250                 /*
2251                  * The null signal is a permissions and process existence
2252                  * probe.  No signal is actually delivered.
2253                  */
2254                 if (!error && sig && p->sighand) {
2255                         spin_lock_irq(&p->sighand->siglock);
2256                         handle_stop_signal(sig, p);
2257                         error = specific_send_sig_info(sig, &info, p);
2258                         spin_unlock_irq(&p->sighand->siglock);
2259                 }
2260         }
2261         read_unlock(&tasklist_lock);
2262
2263         return error;
2264 }
2265
2266 /**
2267  *  sys_tgkill - send signal to one specific thread
2268  *  @tgid: the thread group ID of the thread
2269  *  @pid: the PID of the thread
2270  *  @sig: signal to be sent
2271  *
2272  *  This syscall also checks the @tgid and returns -ESRCH even if the PID
2273  *  exists but it's not belonging to the target process anymore. This
2274  *  method solves the problem of threads exiting and PIDs getting reused.
2275  */
2276 asmlinkage long sys_tgkill(int tgid, int pid, int sig)
2277 {
2278         /* This is only valid for single tasks */
2279         if (pid <= 0 || tgid <= 0)
2280                 return -EINVAL;
2281
2282         return do_tkill(tgid, pid, sig);
2283 }
2284
2285 /*
2286  *  Send a signal to only one task, even if it's a CLONE_THREAD task.
2287  */
2288 asmlinkage long
2289 sys_tkill(int pid, int sig)
2290 {
2291         /* This is only valid for single tasks */
2292         if (pid <= 0)
2293                 return -EINVAL;
2294
2295         return do_tkill(0, pid, sig);
2296 }
2297
2298 asmlinkage long
2299 sys_rt_sigqueueinfo(int pid, int sig, siginfo_t __user *uinfo)
2300 {
2301         siginfo_t info;
2302
2303         if (copy_from_user(&info, uinfo, sizeof(siginfo_t)))
2304                 return -EFAULT;
2305
2306         /* Not even root can pretend to send signals from the kernel.
2307            Nor can they impersonate a kill(), which adds source info.  */
2308         if (info.si_code >= 0)
2309                 return -EPERM;
2310         info.si_signo = sig;
2311
2312         /* POSIX.1b doesn't mention process groups.  */
2313         return kill_proc_info(sig, &info, pid);
2314 }
2315
2316 int do_sigaction(int sig, struct k_sigaction *act, struct k_sigaction *oact)
2317 {
2318         struct task_struct *t = current;
2319         struct k_sigaction *k;
2320         sigset_t mask;
2321
2322         if (!valid_signal(sig) || sig < 1 || (act && sig_kernel_only(sig)))
2323                 return -EINVAL;
2324
2325         k = &t->sighand->action[sig-1];
2326
2327         spin_lock_irq(&current->sighand->siglock);
2328         if (oact)
2329                 *oact = *k;
2330
2331         if (act) {
2332                 sigdelsetmask(&act->sa.sa_mask,
2333                               sigmask(SIGKILL) | sigmask(SIGSTOP));
2334                 *k = *act;
2335                 /*
2336                  * POSIX 3.3.1.3:
2337                  *  "Setting a signal action to SIG_IGN for a signal that is
2338                  *   pending shall cause the pending signal to be discarded,
2339                  *   whether or not it is blocked."
2340                  *
2341                  *  "Setting a signal action to SIG_DFL for a signal that is
2342                  *   pending and whose default action is to ignore the signal
2343                  *   (for example, SIGCHLD), shall cause the pending signal to
2344                  *   be discarded, whether or not it is blocked"
2345                  */
2346                 if (__sig_ignored(t, sig)) {
2347                         sigemptyset(&mask);
2348                         sigaddset(&mask, sig);
2349                         rm_from_queue_full(&mask, &t->signal->shared_pending);
2350                         do {
2351                                 rm_from_queue_full(&mask, &t->pending);
2352                                 t = next_thread(t);
2353                         } while (t != current);
2354                 }
2355         }
2356
2357         spin_unlock_irq(&current->sighand->siglock);
2358         return 0;
2359 }
2360
2361 int
2362 do_sigaltstack (const stack_t __user *uss, stack_t __user *uoss, unsigned long sp)
2363 {
2364         stack_t oss;
2365         int error;
2366
2367         if (uoss) {
2368                 oss.ss_sp = (void __user *) current->sas_ss_sp;
2369                 oss.ss_size = current->sas_ss_size;
2370                 oss.ss_flags = sas_ss_flags(sp);
2371         }
2372
2373         if (uss) {
2374                 void __user *ss_sp;
2375                 size_t ss_size;
2376                 int ss_flags;
2377
2378                 error = -EFAULT;
2379                 if (!access_ok(VERIFY_READ, uss, sizeof(*uss))
2380                     || __get_user(ss_sp, &uss->ss_sp)
2381                     || __get_user(ss_flags, &uss->ss_flags)
2382                     || __get_user(ss_size, &uss->ss_size))
2383                         goto out;
2384
2385                 error = -EPERM;
2386                 if (on_sig_stack(sp))
2387                         goto out;
2388
2389                 error = -EINVAL;
2390                 /*
2391                  *
2392                  * Note - this code used to test ss_flags incorrectly
2393                  *        old code may have been written using ss_flags==0
2394                  *        to mean ss_flags==SS_ONSTACK (as this was the only
2395                  *        way that worked) - this fix preserves that older
2396                  *        mechanism
2397                  */
2398                 if (ss_flags != SS_DISABLE && ss_flags != SS_ONSTACK && ss_flags != 0)
2399                         goto out;
2400
2401                 if (ss_flags == SS_DISABLE) {
2402                         ss_size = 0;
2403                         ss_sp = NULL;
2404                 } else {
2405                         error = -ENOMEM;
2406                         if (ss_size < MINSIGSTKSZ)
2407                                 goto out;
2408                 }
2409
2410                 current->sas_ss_sp = (unsigned long) ss_sp;
2411                 current->sas_ss_size = ss_size;
2412         }
2413
2414         if (uoss) {
2415                 error = -EFAULT;
2416                 if (copy_to_user(uoss, &oss, sizeof(oss)))
2417                         goto out;
2418         }
2419
2420         error = 0;
2421 out:
2422         return error;
2423 }
2424
2425 #ifdef __ARCH_WANT_SYS_SIGPENDING
2426
2427 asmlinkage long
2428 sys_sigpending(old_sigset_t __user *set)
2429 {
2430         return do_sigpending(set, sizeof(*set));
2431 }
2432
2433 #endif
2434
2435 #ifdef __ARCH_WANT_SYS_SIGPROCMASK
2436 /* Some platforms have their own version with special arguments others
2437    support only sys_rt_sigprocmask.  */
2438
2439 asmlinkage long
2440 sys_sigprocmask(int how, old_sigset_t __user *set, old_sigset_t __user *oset)
2441 {
2442         int error;
2443         old_sigset_t old_set, new_set;
2444
2445         if (set) {
2446                 error = -EFAULT;
2447                 if (copy_from_user(&new_set, set, sizeof(*set)))
2448                         goto out;
2449                 new_set &= ~(sigmask(SIGKILL) | sigmask(SIGSTOP));
2450
2451                 spin_lock_irq(&current->sighand->siglock);
2452                 old_set = current->blocked.sig[0];
2453
2454                 error = 0;
2455                 switch (how) {
2456                 default:
2457                         error = -EINVAL;
2458                         break;
2459                 case SIG_BLOCK:
2460                         sigaddsetmask(&current->blocked, new_set);
2461                         break;
2462                 case SIG_UNBLOCK:
2463                         sigdelsetmask(&current->blocked, new_set);
2464                         break;
2465                 case SIG_SETMASK:
2466                         current->blocked.sig[0] = new_set;
2467                         break;
2468                 }
2469
2470                 recalc_sigpending();
2471                 spin_unlock_irq(&current->sighand->siglock);
2472                 if (error)
2473                         goto out;
2474                 if (oset)
2475                         goto set_old;
2476         } else if (oset) {
2477                 old_set = current->blocked.sig[0];
2478         set_old:
2479                 error = -EFAULT;
2480                 if (copy_to_user(oset, &old_set, sizeof(*oset)))
2481                         goto out;
2482         }
2483         error = 0;
2484 out:
2485         return error;
2486 }
2487 #endif /* __ARCH_WANT_SYS_SIGPROCMASK */
2488
2489 #ifdef __ARCH_WANT_SYS_RT_SIGACTION
2490 asmlinkage long
2491 sys_rt_sigaction(int sig,
2492                  const struct sigaction __user *act,
2493                  struct sigaction __user *oact,
2494                  size_t sigsetsize)
2495 {
2496         struct k_sigaction new_sa, old_sa;
2497         int ret = -EINVAL;
2498
2499         /* XXX: Don't preclude handling different sized sigset_t's.  */
2500         if (sigsetsize != sizeof(sigset_t))
2501                 goto out;
2502
2503         if (act) {
2504                 if (copy_from_user(&new_sa.sa, act, sizeof(new_sa.sa)))
2505                         return -EFAULT;
2506         }
2507
2508         ret = do_sigaction(sig, act ? &new_sa : NULL, oact ? &old_sa : NULL);
2509
2510         if (!ret && oact) {
2511                 if (copy_to_user(oact, &old_sa.sa, sizeof(old_sa.sa)))
2512                         return -EFAULT;
2513         }
2514 out:
2515         return ret;
2516 }
2517 #endif /* __ARCH_WANT_SYS_RT_SIGACTION */
2518
2519 #ifdef __ARCH_WANT_SYS_SGETMASK
2520
2521 /*
2522  * For backwards compatibility.  Functionality superseded by sigprocmask.
2523  */
2524 asmlinkage long
2525 sys_sgetmask(void)
2526 {
2527         /* SMP safe */
2528         return current->blocked.sig[0];
2529 }
2530
2531 asmlinkage long
2532 sys_ssetmask(int newmask)
2533 {
2534         int old;
2535
2536         spin_lock_irq(&current->sighand->siglock);
2537         old = current->blocked.sig[0];
2538
2539         siginitset(&current->blocked, newmask & ~(sigmask(SIGKILL)|
2540                                                   sigmask(SIGSTOP)));
2541         recalc_sigpending();
2542         spin_unlock_irq(&current->sighand->siglock);
2543
2544         return old;
2545 }
2546 #endif /* __ARCH_WANT_SGETMASK */
2547
2548 #ifdef __ARCH_WANT_SYS_SIGNAL
2549 /*
2550  * For backwards compatibility.  Functionality superseded by sigaction.
2551  */
2552 asmlinkage unsigned long
2553 sys_signal(int sig, __sighandler_t handler)
2554 {
2555         struct k_sigaction new_sa, old_sa;
2556         int ret;
2557
2558         new_sa.sa.sa_handler = handler;
2559         new_sa.sa.sa_flags = SA_ONESHOT | SA_NOMASK;
2560         sigemptyset(&new_sa.sa.sa_mask);
2561
2562         ret = do_sigaction(sig, &new_sa, &old_sa);
2563
2564         return ret ? ret : (unsigned long)old_sa.sa.sa_handler;
2565 }
2566 #endif /* __ARCH_WANT_SYS_SIGNAL */
2567
2568 #ifdef __ARCH_WANT_SYS_PAUSE
2569
2570 asmlinkage long
2571 sys_pause(void)
2572 {
2573         current->state = TASK_INTERRUPTIBLE;
2574         schedule();
2575         return -ERESTARTNOHAND;
2576 }
2577
2578 #endif
2579
2580 #ifdef __ARCH_WANT_SYS_RT_SIGSUSPEND
2581 asmlinkage long sys_rt_sigsuspend(sigset_t __user *unewset, size_t sigsetsize)
2582 {
2583         sigset_t newset;
2584
2585         /* XXX: Don't preclude handling different sized sigset_t's.  */
2586         if (sigsetsize != sizeof(sigset_t))
2587                 return -EINVAL;
2588
2589         if (copy_from_user(&newset, unewset, sizeof(newset)))
2590                 return -EFAULT;
2591         sigdelsetmask(&newset, sigmask(SIGKILL)|sigmask(SIGSTOP));
2592
2593         spin_lock_irq(&current->sighand->siglock);
2594         current->saved_sigmask = current->blocked;
2595         current->blocked = newset;
2596         recalc_sigpending();
2597         spin_unlock_irq(&current->sighand->siglock);
2598
2599         current->state = TASK_INTERRUPTIBLE;
2600         schedule();
2601         set_thread_flag(TIF_RESTORE_SIGMASK);
2602         return -ERESTARTNOHAND;
2603 }
2604 #endif /* __ARCH_WANT_SYS_RT_SIGSUSPEND */
2605
2606 __attribute__((weak)) const char *arch_vma_name(struct vm_area_struct *vma)
2607 {
2608         return NULL;
2609 }
2610
2611 void __init signals_init(void)
2612 {
2613         sigqueue_cachep = KMEM_CACHE(sigqueue, SLAB_PANIC);
2614 }