SAFE public projects git trees. - safe/jmp/linux-2.6/blob - kernel/signal.c

   1 /*
   2  *  linux/kernel/signal.c
   3  *
   4  *  Copyright (C) 1991, 1992  Linus Torvalds
   5  *
   6  *  1997-11-02  Modified for POSIX.1b signals by Richard Henderson
   7  *
   8  *  2003-06-02  Jim Houston - Concurrent Computer Corp.
   9  *              Changes to use preallocated sigqueue structures
  10  *              to allow signals to be sent reliably.
  11  */
  12
  13 #include <linux/slab.h>
  14 #include <linux/module.h>
  15 #include <linux/init.h>
  16 #include <linux/sched.h>
  17 #include <linux/fs.h>
  18 #include <linux/tty.h>
  19 #include <linux/binfmts.h>
  20 #include <linux/security.h>
  21 #include <linux/syscalls.h>
  22 #include <linux/ptrace.h>
  23 #include <linux/signal.h>
  24 #include <linux/signalfd.h>
  25 #include <linux/capability.h>
  26 #include <linux/freezer.h>
  27 #include <linux/pid_namespace.h>
  28 #include <linux/nsproxy.h>
  29
  30 #include <asm/param.h>
  31 #include <asm/uaccess.h>
  32 #include <asm/unistd.h>
  33 #include <asm/siginfo.h>
  34 #include "audit.h"      /* audit_signal_info() */
  35
  36 /*
  37  * SLAB caches for signal bits.
  38  */
  39
  40 static struct kmem_cache *sigqueue_cachep;
  41
  42 static int __sig_ignored(struct task_struct *t, int sig)
  43 {
  44         void __user *handler;
  45
  46         /* Is it explicitly or implicitly ignored? */
  47
  48         handler = t->sighand->action[sig - 1].sa.sa_handler;
  49         return handler == SIG_IGN ||
  50                 (handler == SIG_DFL && sig_kernel_ignore(sig));
  51 }
  52
  53 static int sig_ignored(struct task_struct *t, int sig)
  54 {
  55         /*
  56          * Tracers always want to know about signals..
  57          */
  58         if (t->ptrace & PT_PTRACED)
  59                 return 0;
  60
  61         /*
  62          * Blocked signals are never ignored, since the
  63          * signal handler may change by the time it is
  64          * unblocked.
  65          */
  66         if (sigismember(&t->blocked, sig) || sigismember(&t->real_blocked, sig))
  67                 return 0;
  68
  69         return __sig_ignored(t, sig);
  70 }
  71
  72 /*
  73  * Re-calculate pending state from the set of locally pending
  74  * signals, globally pending signals, and blocked signals.
  75  */
  76 static inline int has_pending_signals(sigset_t *signal, sigset_t *blocked)
  77 {
  78         unsigned long ready;
  79         long i;
  80
  81         switch (_NSIG_WORDS) {
  82         default:
  83                 for (i = _NSIG_WORDS, ready = 0; --i >= 0 ;)
  84                         ready |= signal->sig[i] &~ blocked->sig[i];
  85                 break;
  86
  87         case 4: ready  = signal->sig[3] &~ blocked->sig[3];
  88                 ready |= signal->sig[2] &~ blocked->sig[2];
  89                 ready |= signal->sig[1] &~ blocked->sig[1];
  90                 ready |= signal->sig[0] &~ blocked->sig[0];
  91                 break;
  92
  93         case 2: ready  = signal->sig[1] &~ blocked->sig[1];
  94                 ready |= signal->sig[0] &~ blocked->sig[0];
  95                 break;
  96
  97         case 1: ready  = signal->sig[0] &~ blocked->sig[0];
  98         }
  99         return ready != 0;
 100 }
 101
 102 #define PENDING(p,b) has_pending_signals(&(p)->signal, (b))
 103
 104 static int recalc_sigpending_tsk(struct task_struct *t)
 105 {
 106         if (t->signal->group_stop_count > 0 ||
 107             PENDING(&t->pending, &t->blocked) ||
 108             PENDING(&t->signal->shared_pending, &t->blocked)) {
 109                 set_tsk_thread_flag(t, TIF_SIGPENDING);
 110                 return 1;
 111         }
 112         /*
 113          * We must never clear the flag in another thread, or in current
 114          * when it's possible the current syscall is returning -ERESTART*.
 115          * So we don't clear it here, and only callers who know they should do.
 116          */
 117         return 0;
 118 }
 119
 120 /*
 121  * After recalculating TIF_SIGPENDING, we need to make sure the task wakes up.
 122  * This is superfluous when called on current, the wakeup is a harmless no-op.
 123  */
 124 void recalc_sigpending_and_wake(struct task_struct *t)
 125 {
 126         if (recalc_sigpending_tsk(t))
 127                 signal_wake_up(t, 0);
 128 }
 129
 130 void recalc_sigpending(void)
 131 {
 132         if (!recalc_sigpending_tsk(current) && !freezing(current))
 133                 clear_thread_flag(TIF_SIGPENDING);
 134
 135 }
 136
 137 /* Given the mask, find the first available signal that should be serviced. */
 138
 139 int next_signal(struct sigpending *pending, sigset_t *mask)
 140 {
 141         unsigned long i, *s, *m, x;
 142         int sig = 0;
 143
 144         s = pending->signal.sig;
 145         m = mask->sig;
 146         switch (_NSIG_WORDS) {
 147         default:
 148                 for (i = 0; i < _NSIG_WORDS; ++i, ++s, ++m)
 149                         if ((x = *s &~ *m) != 0) {
 150                                 sig = ffz(~x) + i*_NSIG_BPW + 1;
 151                                 break;
 152                         }
 153                 break;
 154
 155         case 2: if ((x = s[0] &~ m[0]) != 0)
 156                         sig = 1;
 157                 else if ((x = s[1] &~ m[1]) != 0)
 158                         sig = _NSIG_BPW + 1;
 159                 else
 160                         break;
 161                 sig += ffz(~x);
 162                 break;
 163
 164         case 1: if ((x = *s &~ *m) != 0)
 165                         sig = ffz(~x) + 1;
 166                 break;
 167         }
 168
 169         return sig;
 170 }
 171
 172 static struct sigqueue *__sigqueue_alloc(struct task_struct *t, gfp_t flags,
 173                                          int override_rlimit)
 174 {
 175         struct sigqueue *q = NULL;
 176         struct user_struct *user;
 177
 178         /*
 179          * In order to avoid problems with "switch_user()", we want to make
 180          * sure that the compiler doesn't re-load "t->user"
 181          */
 182         user = t->user;
 183         barrier();
 184         atomic_inc(&user->sigpending);
 185         if (override_rlimit ||
 186             atomic_read(&user->sigpending) <=
 187                         t->signal->rlim[RLIMIT_SIGPENDING].rlim_cur)
 188                 q = kmem_cache_alloc(sigqueue_cachep, flags);
 189         if (unlikely(q == NULL)) {
 190                 atomic_dec(&user->sigpending);
 191         } else {
 192                 INIT_LIST_HEAD(&q->list);
 193                 q->flags = 0;
 194                 q->user = get_uid(user);
 195         }
 196         return(q);
 197 }
 198
 199 static void __sigqueue_free(struct sigqueue *q)
 200 {
 201         if (q->flags & SIGQUEUE_PREALLOC)
 202                 return;
 203         atomic_dec(&q->user->sigpending);
 204         free_uid(q->user);
 205         kmem_cache_free(sigqueue_cachep, q);
 206 }
 207
 208 void flush_sigqueue(struct sigpending *queue)
 209 {
 210         struct sigqueue *q;
 211
 212         sigemptyset(&queue->signal);
 213         while (!list_empty(&queue->list)) {
 214                 q = list_entry(queue->list.next, struct sigqueue , list);
 215                 list_del_init(&q->list);
 216                 __sigqueue_free(q);
 217         }
 218 }
 219
 220 /*
 221  * Flush all pending signals for a task.
 222  */
 223 void flush_signals(struct task_struct *t)
 224 {
 225         unsigned long flags;
 226
 227         spin_lock_irqsave(&t->sighand->siglock, flags);
 228         clear_tsk_thread_flag(t, TIF_SIGPENDING);
 229         flush_sigqueue(&t->pending);
 230         flush_sigqueue(&t->signal->shared_pending);
 231         spin_unlock_irqrestore(&t->sighand->siglock, flags);
 232 }
 233
 234 void ignore_signals(struct task_struct *t)
 235 {
 236         int i;
 237
 238         for (i = 0; i < _NSIG; ++i)
 239                 t->sighand->action[i].sa.sa_handler = SIG_IGN;
 240
 241         flush_signals(t);
 242 }
 243
 244 /*
 245  * Flush all handlers for a task.
 246  */
 247
 248 void
 249 flush_signal_handlers(struct task_struct *t, int force_default)
 250 {
 251         int i;
 252         struct k_sigaction *ka = &t->sighand->action[0];
 253         for (i = _NSIG ; i != 0 ; i--) {
 254                 if (force_default || ka->sa.sa_handler != SIG_IGN)
 255                         ka->sa.sa_handler = SIG_DFL;
 256                 ka->sa.sa_flags = 0;
 257                 sigemptyset(&ka->sa.sa_mask);
 258                 ka++;
 259         }
 260 }
 261
 262 int unhandled_signal(struct task_struct *tsk, int sig)
 263 {
 264         if (is_global_init(tsk))
 265                 return 1;
 266         if (tsk->ptrace & PT_PTRACED)
 267                 return 0;
 268         return (tsk->sighand->action[sig-1].sa.sa_handler == SIG_IGN) ||
 269                 (tsk->sighand->action[sig-1].sa.sa_handler == SIG_DFL);
 270 }
 271
 272
 273 /* Notify the system that a driver wants to block all signals for this
 274  * process, and wants to be notified if any signals at all were to be
 275  * sent/acted upon.  If the notifier routine returns non-zero, then the
 276  * signal will be acted upon after all.  If the notifier routine returns 0,
 277  * then then signal will be blocked.  Only one block per process is
 278  * allowed.  priv is a pointer to private data that the notifier routine
 279  * can use to determine if the signal should be blocked or not.  */
 280
 281 void
 282 block_all_signals(int (*notifier)(void *priv), void *priv, sigset_t *mask)
 283 {
 284         unsigned long flags;
 285
 286         spin_lock_irqsave(&current->sighand->siglock, flags);
 287         current->notifier_mask = mask;
 288         current->notifier_data = priv;
 289         current->notifier = notifier;
 290         spin_unlock_irqrestore(&current->sighand->siglock, flags);
 291 }
 292
 293 /* Notify the system that blocking has ended. */
 294
 295 void
 296 unblock_all_signals(void)
 297 {
 298         unsigned long flags;
 299
 300         spin_lock_irqsave(&current->sighand->siglock, flags);
 301         current->notifier = NULL;
 302         current->notifier_data = NULL;
 303         recalc_sigpending();
 304         spin_unlock_irqrestore(&current->sighand->siglock, flags);
 305 }
 306
 307 static int collect_signal(int sig, struct sigpending *list, siginfo_t *info)
 308 {
 309         struct sigqueue *q, *first = NULL;
 310         int still_pending = 0;
 311
 312         if (unlikely(!sigismember(&list->signal, sig)))
 313                 return 0;
 314
 315         /*
 316          * Collect the siginfo appropriate to this signal.  Check if
 317          * there is another siginfo for the same signal.
 318         */
 319         list_for_each_entry(q, &list->list, list) {
 320                 if (q->info.si_signo == sig) {
 321                         if (first) {
 322                                 still_pending = 1;
 323                                 break;
 324                         }
 325                         first = q;
 326                 }
 327         }
 328         if (first) {
 329                 list_del_init(&first->list);
 330                 copy_siginfo(info, &first->info);
 331                 __sigqueue_free(first);
 332                 if (!still_pending)
 333                         sigdelset(&list->signal, sig);
 334         } else {
 335
 336                 /* Ok, it wasn't in the queue.  This must be
 337                    a fast-pathed signal or we must have been
 338                    out of queue space.  So zero out the info.
 339                  */
 340                 sigdelset(&list->signal, sig);
 341                 info->si_signo = sig;
 342                 info->si_errno = 0;
 343                 info->si_code = 0;
 344                 info->si_pid = 0;
 345                 info->si_uid = 0;
 346         }
 347         return 1;
 348 }
 349
 350 static int __dequeue_signal(struct sigpending *pending, sigset_t *mask,
 351                         siginfo_t *info)
 352 {
 353         int sig = next_signal(pending, mask);
 354
 355         if (sig) {
 356                 if (current->notifier) {
 357                         if (sigismember(current->notifier_mask, sig)) {
 358                                 if (!(current->notifier)(current->notifier_data)) {
 359                                         clear_thread_flag(TIF_SIGPENDING);
 360                                         return 0;
 361                                 }
 362                         }
 363                 }
 364
 365                 if (!collect_signal(sig, pending, info))
 366                         sig = 0;
 367         }
 368
 369         return sig;
 370 }
 371
 372 /*
 373  * Dequeue a signal and return the element to the caller, which is
 374  * expected to free it.
 375  *
 376  * All callers have to hold the siglock.
 377  */
 378 int dequeue_signal(struct task_struct *tsk, sigset_t *mask, siginfo_t *info)
 379 {
 380         int signr;
 381
 382         /* We only dequeue private signals from ourselves, we don't let
 383          * signalfd steal them
 384          */
 385         signr = __dequeue_signal(&tsk->pending, mask, info);
 386         if (!signr) {
 387                 signr = __dequeue_signal(&tsk->signal->shared_pending,
 388                                          mask, info);
 389                 /*
 390                  * itimer signal ?
 391                  *
 392                  * itimers are process shared and we restart periodic
 393                  * itimers in the signal delivery path to prevent DoS
 394                  * attacks in the high resolution timer case. This is
 395                  * compliant with the old way of self restarting
 396                  * itimers, as the SIGALRM is a legacy signal and only
 397                  * queued once. Changing the restart behaviour to
 398                  * restart the timer in the signal dequeue path is
 399                  * reducing the timer noise on heavy loaded !highres
 400                  * systems too.
 401                  */
 402                 if (unlikely(signr == SIGALRM)) {
 403                         struct hrtimer *tmr = &tsk->signal->real_timer;
 404
 405                         if (!hrtimer_is_queued(tmr) &&
 406                             tsk->signal->it_real_incr.tv64 != 0) {
 407                                 hrtimer_forward(tmr, tmr->base->get_time(),
 408                                                 tsk->signal->it_real_incr);
 409                                 hrtimer_restart(tmr);
 410                         }
 411                 }
 412         }
 413
 414         recalc_sigpending();
 415         if (!signr)
 416                 return 0;
 417
 418         if (unlikely(sig_kernel_stop(signr))) {
 419                 /*
 420                  * Set a marker that we have dequeued a stop signal.  Our
 421                  * caller might release the siglock and then the pending
 422                  * stop signal it is about to process is no longer in the
 423                  * pending bitmasks, but must still be cleared by a SIGCONT
 424                  * (and overruled by a SIGKILL).  So those cases clear this
 425                  * shared flag after we've set it.  Note that this flag may
 426                  * remain set after the signal we return is ignored or
 427                  * handled.  That doesn't matter because its only purpose
 428                  * is to alert stop-signal processing code when another
 429                  * processor has come along and cleared the flag.
 430                  */
 431                 if (!(tsk->signal->flags & SIGNAL_GROUP_EXIT))
 432                         tsk->signal->flags |= SIGNAL_STOP_DEQUEUED;
 433         }
 434         if ((info->si_code & __SI_MASK) == __SI_TIMER && info->si_sys_private) {
 435                 /*
 436                  * Release the siglock to ensure proper locking order
 437                  * of timer locks outside of siglocks.  Note, we leave
 438                  * irqs disabled here, since the posix-timers code is
 439                  * about to disable them again anyway.
 440                  */
 441                 spin_unlock(&tsk->sighand->siglock);
 442                 do_schedule_next_timer(info);
 443                 spin_lock(&tsk->sighand->siglock);
 444         }
 445         return signr;
 446 }
 447
 448 /*
 449  * Tell a process that it has a new active signal..
 450  *
 451  * NOTE! we rely on the previous spin_lock to
 452  * lock interrupts for us! We can only be called with
 453  * "siglock" held, and the local interrupt must
 454  * have been disabled when that got acquired!
 455  *
 456  * No need to set need_resched since signal event passing
 457  * goes through ->blocked
 458  */
 459 void signal_wake_up(struct task_struct *t, int resume)
 460 {
 461         unsigned int mask;
 462
 463         set_tsk_thread_flag(t, TIF_SIGPENDING);
 464
 465         /*
 466          * For SIGKILL, we want to wake it up in the stopped/traced/killable
 467          * case. We don't check t->state here because there is a race with it
 468          * executing another processor and just now entering stopped state.
 469          * By using wake_up_state, we ensure the process will wake up and
 470          * handle its death signal.
 471          */
 472         mask = TASK_INTERRUPTIBLE;
 473         if (resume)
 474                 mask |= TASK_WAKEKILL;
 475         if (!wake_up_state(t, mask))
 476                 kick_process(t);
 477 }
 478
 479 /*
 480  * Remove signals in mask from the pending set and queue.
 481  * Returns 1 if any signals were found.
 482  *
 483  * All callers must be holding the siglock.
 484  *
 485  * This version takes a sigset mask and looks at all signals,
 486  * not just those in the first mask word.
 487  */
 488 static int rm_from_queue_full(sigset_t *mask, struct sigpending *s)
 489 {
 490         struct sigqueue *q, *n;
 491         sigset_t m;
 492
 493         sigandsets(&m, mask, &s->signal);
 494         if (sigisemptyset(&m))
 495                 return 0;
 496
 497         signandsets(&s->signal, &s->signal, mask);
 498         list_for_each_entry_safe(q, n, &s->list, list) {
 499                 if (sigismember(mask, q->info.si_signo)) {
 500                         list_del_init(&q->list);
 501                         __sigqueue_free(q);
 502                 }
 503         }
 504         return 1;
 505 }
 506 /*
 507  * Remove signals in mask from the pending set and queue.
 508  * Returns 1 if any signals were found.
 509  *
 510  * All callers must be holding the siglock.
 511  */
 512 static int rm_from_queue(unsigned long mask, struct sigpending *s)
 513 {
 514         struct sigqueue *q, *n;
 515
 516         if (!sigtestsetmask(&s->signal, mask))
 517                 return 0;
 518
 519         sigdelsetmask(&s->signal, mask);
 520         list_for_each_entry_safe(q, n, &s->list, list) {
 521                 if (q->info.si_signo < SIGRTMIN &&
 522                     (mask & sigmask(q->info.si_signo))) {
 523                         list_del_init(&q->list);
 524                         __sigqueue_free(q);
 525                 }
 526         }
 527         return 1;
 528 }
 529
 530 /*
 531  * Bad permissions for sending the signal
 532  */
 533 static int check_kill_permission(int sig, struct siginfo *info,
 534                                  struct task_struct *t)
 535 {
 536         int error;
 537
 538         if (!valid_signal(sig))
 539                 return -EINVAL;
 540
 541         if (info != SEND_SIG_NOINFO && (is_si_special(info) || SI_FROMKERNEL(info)))
 542                 return 0;
 543
 544         error = audit_signal_info(sig, t); /* Let audit system see the signal */
 545         if (error)
 546                 return error;
 547
 548         if (((sig != SIGCONT) || (task_session_nr(current) != task_session_nr(t)))
 549             && (current->euid ^ t->suid) && (current->euid ^ t->uid)
 550             && (current->uid ^ t->suid) && (current->uid ^ t->uid)
 551             && !capable(CAP_KILL))
 552                 return -EPERM;
 553
 554         return security_task_kill(t, info, sig, 0);
 555 }
 556
 557 /* forward decl */
 558 static void do_notify_parent_cldstop(struct task_struct *tsk, int why);
 559
 560 /*
 561  * Handle magic process-wide effects of stop/continue signals.
 562  * Unlike the signal actions, these happen immediately at signal-generation
 563  * time regardless of blocking, ignoring, or handling.  This does the
 564  * actual continuing for SIGCONT, but not the actual stopping for stop
 565  * signals.  The process stop is done as a signal action for SIG_DFL.
 566  */
 567 static void handle_stop_signal(int sig, struct task_struct *p)
 568 {
 569         struct task_struct *t;
 570
 571         if (p->signal->flags & SIGNAL_GROUP_EXIT)
 572                 /*
 573                  * The process is in the middle of dying already.
 574                  */
 575                 return;
 576
 577         if (sig_kernel_stop(sig)) {
 578                 /*
 579                  * This is a stop signal.  Remove SIGCONT from all queues.
 580                  */
 581                 rm_from_queue(sigmask(SIGCONT), &p->signal->shared_pending);
 582                 t = p;
 583                 do {
 584                         rm_from_queue(sigmask(SIGCONT), &t->pending);
 585                         t = next_thread(t);
 586                 } while (t != p);
 587         } else if (sig == SIGCONT) {
 588                 /*
 589                  * Remove all stop signals from all queues,
 590                  * and wake all threads.
 591                  */
 592                 if (unlikely(p->signal->group_stop_count > 0)) {
 593                         /*
 594                          * There was a group stop in progress.  We'll
 595                          * pretend it finished before we got here.  We are
 596                          * obliged to report it to the parent: if the
 597                          * SIGSTOP happened "after" this SIGCONT, then it
 598                          * would have cleared this pending SIGCONT.  If it
 599                          * happened "before" this SIGCONT, then the parent
 600                          * got the SIGCHLD about the stop finishing before
 601                          * the continue happened.  We do the notification
 602                          * now, and it's as if the stop had finished and
 603                          * the SIGCHLD was pending on entry to this kill.
 604                          */
 605                         p->signal->group_stop_count = 0;
 606                         p->signal->flags = SIGNAL_STOP_CONTINUED;
 607                         spin_unlock(&p->sighand->siglock);
 608                         do_notify_parent_cldstop(p, CLD_STOPPED);
 609                         spin_lock(&p->sighand->siglock);
 610                 }
 611                 rm_from_queue(SIG_KERNEL_STOP_MASK, &p->signal->shared_pending);
 612                 t = p;
 613                 do {
 614                         unsigned int state;
 615                         rm_from_queue(SIG_KERNEL_STOP_MASK, &t->pending);
 616
 617                         /*
 618                          * If there is a handler for SIGCONT, we must make
 619                          * sure that no thread returns to user mode before
 620                          * we post the signal, in case it was the only
 621                          * thread eligible to run the signal handler--then
 622                          * it must not do anything between resuming and
 623                          * running the handler.  With the TIF_SIGPENDING
 624                          * flag set, the thread will pause and acquire the
 625                          * siglock that we hold now and until we've queued
 626                          * the pending signal.
 627                          *
 628                          * Wake up the stopped thread _after_ setting
 629                          * TIF_SIGPENDING
 630                          */
 631                         state = __TASK_STOPPED;
 632                         if (sig_user_defined(t, SIGCONT) && !sigismember(&t->blocked, SIGCONT)) {
 633                                 set_tsk_thread_flag(t, TIF_SIGPENDING);
 634                                 state |= TASK_INTERRUPTIBLE;
 635                         }
 636                         wake_up_state(t, state);
 637
 638                         t = next_thread(t);
 639                 } while (t != p);
 640
 641                 if (p->signal->flags & SIGNAL_STOP_STOPPED) {
 642                         /*
 643                          * We were in fact stopped, and are now continued.
 644                          * Notify the parent with CLD_CONTINUED.
 645                          */
 646                         p->signal->flags = SIGNAL_STOP_CONTINUED;
 647                         p->signal->group_exit_code = 0;
 648                         spin_unlock(&p->sighand->siglock);
 649                         do_notify_parent_cldstop(p, CLD_CONTINUED);
 650                         spin_lock(&p->sighand->siglock);
 651                 } else {
 652                         /*
 653                          * We are not stopped, but there could be a stop
 654                          * signal in the middle of being processed after
 655                          * being removed from the queue.  Clear that too.
 656                          */
 657                         p->signal->flags = 0;
 658                 }
 659         } else if (sig == SIGKILL) {
 660                 /*
 661                  * Make sure that any pending stop signal already dequeued
 662                  * is undone by the wakeup for SIGKILL.
 663                  */
 664                 p->signal->flags = 0;
 665         }
 666 }
 667
 668 static inline int legacy_queue(struct sigpending *signals, int sig)
 669 {
 670         return (sig < SIGRTMIN) && sigismember(&signals->signal, sig);
 671 }
 672
 673 static int send_signal(int sig, struct siginfo *info, struct task_struct *t,
 674                         struct sigpending *signals)
 675 {
 676         struct sigqueue * q = NULL;
 677
 678         /*
 679          * Short-circuit ignored signals and support queuing
 680          * exactly one non-rt signal, so that we can get more
 681          * detailed information about the cause of the signal.
 682          */
 683         if (sig_ignored(t, sig) || legacy_queue(signals, sig))
 684                 return 0;
 685
 686         /*
 687          * Deliver the signal to listening signalfds. This must be called
 688          * with the sighand lock held.
 689          */
 690         signalfd_notify(t, sig);
 691
 692         /*
 693          * fast-pathed signals for kernel-internal things like SIGSTOP
 694          * or SIGKILL.
 695          */
 696         if (info == SEND_SIG_FORCED)
 697                 goto out_set;
 698
 699         /* Real-time signals must be queued if sent by sigqueue, or
 700            some other real-time mechanism.  It is implementation
 701            defined whether kill() does so.  We attempt to do so, on
 702            the principle of least surprise, but since kill is not
 703            allowed to fail with EAGAIN when low on memory we just
 704            make sure at least one signal gets delivered and don't
 705            pass on the info struct.  */
 706
 707         q = __sigqueue_alloc(t, GFP_ATOMIC, (sig < SIGRTMIN &&
 708                                              (is_si_special(info) ||
 709                                               info->si_code >= 0)));
 710         if (q) {
 711                 list_add_tail(&q->list, &signals->list);
 712                 switch ((unsigned long) info) {
 713                 case (unsigned long) SEND_SIG_NOINFO:
 714                         q->info.si_signo = sig;
 715                         q->info.si_errno = 0;
 716                         q->info.si_code = SI_USER;
 717                         q->info.si_pid = task_pid_vnr(current);
 718                         q->info.si_uid = current->uid;
 719                         break;
 720                 case (unsigned long) SEND_SIG_PRIV:
 721                         q->info.si_signo = sig;
 722                         q->info.si_errno = 0;
 723                         q->info.si_code = SI_KERNEL;
 724                         q->info.si_pid = 0;
 725                         q->info.si_uid = 0;
 726                         break;
 727                 default:
 728                         copy_siginfo(&q->info, info);
 729                         break;
 730                 }
 731         } else if (!is_si_special(info)) {
 732                 if (sig >= SIGRTMIN && info->si_code != SI_USER)
 733                 /*
 734                  * Queue overflow, abort.  We may abort if the signal was rt
 735                  * and sent by user using something other than kill().
 736                  */
 737                         return -EAGAIN;
 738         }
 739
 740 out_set:
 741         sigaddset(&signals->signal, sig);
 742         return 1;
 743 }
 744
 745 int print_fatal_signals;
 746
 747 static void print_fatal_signal(struct pt_regs *regs, int signr)
 748 {
 749         printk("%s/%d: potentially unexpected fatal signal %d.\n",
 750                 current->comm, task_pid_nr(current), signr);
 751
 752 #if defined(__i386__) && !defined(__arch_um__)
 753         printk("code at %08lx: ", regs->ip);
 754         {
 755                 int i;
 756                 for (i = 0; i < 16; i++) {
 757                         unsigned char insn;
 758
 759                         __get_user(insn, (unsigned char *)(regs->ip + i));
 760                         printk("%02x ", insn);
 761                 }
 762         }
 763 #endif
 764         printk("\n");
 765         show_regs(regs);
 766 }
 767
 768 static int __init setup_print_fatal_signals(char *str)
 769 {
 770         get_option (&str, &print_fatal_signals);
 771
 772         return 1;
 773 }
 774
 775 __setup("print-fatal-signals=", setup_print_fatal_signals);
 776
 777 static int
 778 specific_send_sig_info(int sig, struct siginfo *info, struct task_struct *t)
 779 {
 780         int ret;
 781
 782         BUG_ON(!irqs_disabled());
 783         assert_spin_locked(&t->sighand->siglock);
 784
 785         ret = send_signal(sig, info, t, &t->pending);
 786         if (ret <= 0)
 787                 return ret;
 788
 789         if (!sigismember(&t->blocked, sig))
 790                 signal_wake_up(t, sig == SIGKILL);
 791         return 0;
 792 }
 793
 794 /*
 795  * Force a signal that the process can't ignore: if necessary
 796  * we unblock the signal and change any SIG_IGN to SIG_DFL.
 797  *
 798  * Note: If we unblock the signal, we always reset it to SIG_DFL,
 799  * since we do not want to have a signal handler that was blocked
 800  * be invoked when user space had explicitly blocked it.
 801  *
 802  * We don't want to have recursive SIGSEGV's etc, for example.
 803  */
 804 int
 805 force_sig_info(int sig, struct siginfo *info, struct task_struct *t)
 806 {
 807         unsigned long int flags;
 808         int ret, blocked, ignored;
 809         struct k_sigaction *action;
 810
 811         spin_lock_irqsave(&t->sighand->siglock, flags);
 812         action = &t->sighand->action[sig-1];
 813         ignored = action->sa.sa_handler == SIG_IGN;
 814         blocked = sigismember(&t->blocked, sig);
 815         if (blocked || ignored) {
 816                 action->sa.sa_handler = SIG_DFL;
 817                 if (blocked) {
 818                         sigdelset(&t->blocked, sig);
 819                         recalc_sigpending_and_wake(t);
 820                 }
 821         }
 822         ret = specific_send_sig_info(sig, info, t);
 823         spin_unlock_irqrestore(&t->sighand->siglock, flags);
 824
 825         return ret;
 826 }
 827
 828 void
 829 force_sig_specific(int sig, struct task_struct *t)
 830 {
 831         force_sig_info(sig, SEND_SIG_FORCED, t);
 832 }
 833
 834 /*
 835  * Test if P wants to take SIG.  After we've checked all threads with this,
 836  * it's equivalent to finding no threads not blocking SIG.  Any threads not
 837  * blocking SIG were ruled out because they are not running and already
 838  * have pending signals.  Such threads will dequeue from the shared queue
 839  * as soon as they're available, so putting the signal on the shared queue
 840  * will be equivalent to sending it to one such thread.
 841  */
 842 static inline int wants_signal(int sig, struct task_struct *p)
 843 {
 844         if (sigismember(&p->blocked, sig))
 845                 return 0;
 846         if (p->flags & PF_EXITING)
 847                 return 0;
 848         if (sig == SIGKILL)
 849                 return 1;
 850         if (task_is_stopped_or_traced(p))
 851                 return 0;
 852         return task_curr(p) || !signal_pending(p);
 853 }
 854
 855 static void
 856 __group_complete_signal(int sig, struct task_struct *p)
 857 {
 858         struct task_struct *t;
 859
 860         /*
 861          * Now find a thread we can wake up to take the signal off the queue.
 862          *
 863          * If the main thread wants the signal, it gets first crack.
 864          * Probably the least surprising to the average bear.
 865          */
 866         if (wants_signal(sig, p))
 867                 t = p;
 868         else if (thread_group_empty(p))
 869                 /*
 870                  * There is just one thread and it does not need to be woken.
 871                  * It will dequeue unblocked signals before it runs again.
 872                  */
 873                 return;
 874         else {
 875                 /*
 876                  * Otherwise try to find a suitable thread.
 877                  */
 878                 t = p->signal->curr_target;
 879                 if (t == NULL)
 880                         /* restart balancing at this thread */
 881                         t = p->signal->curr_target = p;
 882
 883                 while (!wants_signal(sig, t)) {
 884                         t = next_thread(t);
 885                         if (t == p->signal->curr_target)
 886                                 /*
 887                                  * No thread needs to be woken.
 888                                  * Any eligible threads will see
 889                                  * the signal in the queue soon.
 890                                  */
 891                                 return;
 892                 }
 893                 p->signal->curr_target = t;
 894         }
 895
 896         /*
 897          * Found a killable thread.  If the signal will be fatal,
 898          * then start taking the whole group down immediately.
 899          */
 900         if (sig_fatal(p, sig) && !(p->signal->flags & SIGNAL_GROUP_EXIT) &&
 901             !sigismember(&t->real_blocked, sig) &&
 902             (sig == SIGKILL || !(t->ptrace & PT_PTRACED))) {
 903                 /*
 904                  * This signal will be fatal to the whole group.
 905                  */
 906                 if (!sig_kernel_coredump(sig)) {
 907                         /*
 908                          * Start a group exit and wake everybody up.
 909                          * This way we don't have other threads
 910                          * running and doing things after a slower
 911                          * thread has the fatal signal pending.
 912                          */
 913                         p->signal->flags = SIGNAL_GROUP_EXIT;
 914                         p->signal->group_exit_code = sig;
 915                         p->signal->group_stop_count = 0;
 916                         t = p;
 917                         do {
 918                                 sigaddset(&t->pending.signal, SIGKILL);
 919                                 signal_wake_up(t, 1);
 920                         } while_each_thread(p, t);
 921                         return;
 922                 }
 923         }
 924
 925         /*
 926          * The signal is already in the shared-pending queue.
 927          * Tell the chosen thread to wake up and dequeue it.
 928          */
 929         signal_wake_up(t, sig == SIGKILL);
 930         return;
 931 }
 932
 933 int
 934 __group_send_sig_info(int sig, struct siginfo *info, struct task_struct *p)
 935 {
 936         int ret;
 937
 938         assert_spin_locked(&p->sighand->siglock);
 939         handle_stop_signal(sig, p);
 940
 941         /*
 942          * Put this signal on the shared-pending queue, or fail with EAGAIN.
 943          * We always use the shared queue for process-wide signals,
 944          * to avoid several races.
 945          */
 946         ret = send_signal(sig, info, p, &p->signal->shared_pending);
 947         if (ret <= 0)
 948                 return ret;
 949
 950         __group_complete_signal(sig, p);
 951         return 0;
 952 }
 953
 954 /*
 955  * Nuke all other threads in the group.
 956  */
 957 void zap_other_threads(struct task_struct *p)
 958 {
 959         struct task_struct *t;
 960
 961         p->signal->group_stop_count = 0;
 962
 963         for (t = next_thread(p); t != p; t = next_thread(t)) {
 964                 /*
 965                  * Don't bother with already dead threads
 966                  */
 967                 if (t->exit_state)
 968                         continue;
 969
 970                 /* SIGKILL will be handled before any pending SIGSTOP */
 971                 sigaddset(&t->pending.signal, SIGKILL);
 972                 signal_wake_up(t, 1);
 973         }
 974 }
 975
 976 int __fatal_signal_pending(struct task_struct *tsk)
 977 {
 978         return sigismember(&tsk->pending.signal, SIGKILL);
 979 }
 980 EXPORT_SYMBOL(__fatal_signal_pending);
 981
 982 struct sighand_struct *lock_task_sighand(struct task_struct *tsk, unsigned long *flags)
 983 {
 984         struct sighand_struct *sighand;
 985
 986         rcu_read_lock();
 987         for (;;) {
 988                 sighand = rcu_dereference(tsk->sighand);
 989                 if (unlikely(sighand == NULL))
 990                         break;
 991
 992                 spin_lock_irqsave(&sighand->siglock, *flags);
 993                 if (likely(sighand == tsk->sighand))
 994                         break;
 995                 spin_unlock_irqrestore(&sighand->siglock, *flags);
 996         }
 997         rcu_read_unlock();
 998
 999         return sighand;
1000 }
1001
1002 int group_send_sig_info(int sig, struct siginfo *info, struct task_struct *p)
1003 {
1004         unsigned long flags;
1005         int ret;
1006
1007         ret = check_kill_permission(sig, info, p);
1008
1009         if (!ret && sig) {
1010                 ret = -ESRCH;
1011                 if (lock_task_sighand(p, &flags)) {
1012                         ret = __group_send_sig_info(sig, info, p);
1013                         unlock_task_sighand(p, &flags);
1014                 }
1015         }
1016
1017         return ret;
1018 }
1019
1020 /*
1021  * __kill_pgrp_info() sends a signal to a process group: this is what the tty
1022  * control characters do (^C, ^Z etc)
1023  */
1024
1025 int __kill_pgrp_info(int sig, struct siginfo *info, struct pid *pgrp)
1026 {
1027         struct task_struct *p = NULL;
1028         int retval, success;
1029
1030         success = 0;
1031         retval = -ESRCH;
1032         do_each_pid_task(pgrp, PIDTYPE_PGID, p) {
1033                 int err = group_send_sig_info(sig, info, p);
1034                 success |= !err;
1035                 retval = err;
1036         } while_each_pid_task(pgrp, PIDTYPE_PGID, p);
1037         return success ? 0 : retval;
1038 }
1039
1040 int kill_pid_info(int sig, struct siginfo *info, struct pid *pid)
1041 {
1042         int error = -ESRCH;
1043         struct task_struct *p;
1044
1045         rcu_read_lock();
1046         if (unlikely(sig_needs_tasklist(sig)))
1047                 read_lock(&tasklist_lock);
1048
1049 retry:
1050         p = pid_task(pid, PIDTYPE_PID);
1051         if (p) {
1052                 error = group_send_sig_info(sig, info, p);
1053                 if (unlikely(error == -ESRCH))
1054                         /*
1055                          * The task was unhashed in between, try again.
1056                          * If it is dead, pid_task() will return NULL,
1057                          * if we race with de_thread() it will find the
1058                          * new leader.
1059                          */
1060                         goto retry;
1061         }
1062
1063         if (unlikely(sig_needs_tasklist(sig)))
1064                 read_unlock(&tasklist_lock);
1065         rcu_read_unlock();
1066         return error;
1067 }
1068
1069 int
1070 kill_proc_info(int sig, struct siginfo *info, pid_t pid)
1071 {
1072         int error;
1073         rcu_read_lock();
1074         error = kill_pid_info(sig, info, find_vpid(pid));
1075         rcu_read_unlock();
1076         return error;
1077 }
1078
1079 /* like kill_pid_info(), but doesn't use uid/euid of "current" */
1080 int kill_pid_info_as_uid(int sig, struct siginfo *info, struct pid *pid,
1081                       uid_t uid, uid_t euid, u32 secid)
1082 {
1083         int ret = -EINVAL;
1084         struct task_struct *p;
1085
1086         if (!valid_signal(sig))
1087                 return ret;
1088
1089         read_lock(&tasklist_lock);
1090         p = pid_task(pid, PIDTYPE_PID);
1091         if (!p) {
1092                 ret = -ESRCH;
1093                 goto out_unlock;
1094         }
1095         if ((info == SEND_SIG_NOINFO || (!is_si_special(info) && SI_FROMUSER(info)))
1096             && (euid != p->suid) && (euid != p->uid)
1097             && (uid != p->suid) && (uid != p->uid)) {
1098                 ret = -EPERM;
1099                 goto out_unlock;
1100         }
1101         ret = security_task_kill(p, info, sig, secid);
1102         if (ret)
1103                 goto out_unlock;
1104         if (sig && p->sighand) {
1105                 unsigned long flags;
1106                 spin_lock_irqsave(&p->sighand->siglock, flags);
1107                 ret = __group_send_sig_info(sig, info, p);
1108                 spin_unlock_irqrestore(&p->sighand->siglock, flags);
1109         }
1110 out_unlock:
1111         read_unlock(&tasklist_lock);
1112         return ret;
1113 }
1114 EXPORT_SYMBOL_GPL(kill_pid_info_as_uid);
1115
1116 /*
1117  * kill_something_info() interprets pid in interesting ways just like kill(2).
1118  *
1119  * POSIX specifies that kill(-1,sig) is unspecified, but what we have
1120  * is probably wrong.  Should make it like BSD or SYSV.
1121  */
1122
1123 static int kill_something_info(int sig, struct siginfo *info, int pid)
1124 {
1125         int ret;
1126
1127         if (pid > 0) {
1128                 rcu_read_lock();
1129                 ret = kill_pid_info(sig, info, find_vpid(pid));
1130                 rcu_read_unlock();
1131                 return ret;
1132         }
1133
1134         read_lock(&tasklist_lock);
1135         if (pid != -1) {
1136                 ret = __kill_pgrp_info(sig, info,
1137                                 pid ? find_vpid(-pid) : task_pgrp(current));
1138         } else {
1139                 int retval = 0, count = 0;
1140                 struct task_struct * p;
1141
1142                 for_each_process(p) {
1143                         if (p->pid > 1 && !same_thread_group(p, current)) {
1144                                 int err = group_send_sig_info(sig, info, p);
1145                                 ++count;
1146                                 if (err != -EPERM)
1147                                         retval = err;
1148                         }
1149                 }
1150                 ret = count ? retval : -ESRCH;
1151         }
1152         read_unlock(&tasklist_lock);
1153
1154         return ret;
1155 }
1156
1157 /*
1158  * These are for backward compatibility with the rest of the kernel source.
1159  */
1160
1161 /*
1162  * These two are the most common entry points.  They send a signal
1163  * just to the specific thread.
1164  */
1165 int
1166 send_sig_info(int sig, struct siginfo *info, struct task_struct *p)
1167 {
1168         int ret;
1169         unsigned long flags;
1170
1171         /*
1172          * Make sure legacy kernel users don't send in bad values
1173          * (normal paths check this in check_kill_permission).
1174          */
1175         if (!valid_signal(sig))
1176                 return -EINVAL;
1177
1178         /*
1179          * We need the tasklist lock even for the specific
1180          * thread case (when we don't need to follow the group
1181          * lists) in order to avoid races with "p->sighand"
1182          * going away or changing from under us.
1183          */
1184         read_lock(&tasklist_lock);
1185         spin_lock_irqsave(&p->sighand->siglock, flags);
1186         ret = specific_send_sig_info(sig, info, p);
1187         spin_unlock_irqrestore(&p->sighand->siglock, flags);
1188         read_unlock(&tasklist_lock);
1189         return ret;
1190 }
1191
1192 #define __si_special(priv) \
1193         ((priv) ? SEND_SIG_PRIV : SEND_SIG_NOINFO)
1194
1195 int
1196 send_sig(int sig, struct task_struct *p, int priv)
1197 {
1198         return send_sig_info(sig, __si_special(priv), p);
1199 }
1200
1201 void
1202 force_sig(int sig, struct task_struct *p)
1203 {
1204         force_sig_info(sig, SEND_SIG_PRIV, p);
1205 }
1206
1207 /*
1208  * When things go south during signal handling, we
1209  * will force a SIGSEGV. And if the signal that caused
1210  * the problem was already a SIGSEGV, we'll want to
1211  * make sure we don't even try to deliver the signal..
1212  */
1213 int
1214 force_sigsegv(int sig, struct task_struct *p)
1215 {
1216         if (sig == SIGSEGV) {
1217                 unsigned long flags;
1218                 spin_lock_irqsave(&p->sighand->siglock, flags);
1219                 p->sighand->action[sig - 1].sa.sa_handler = SIG_DFL;
1220                 spin_unlock_irqrestore(&p->sighand->siglock, flags);
1221         }
1222         force_sig(SIGSEGV, p);
1223         return 0;
1224 }
1225
1226 int kill_pgrp(struct pid *pid, int sig, int priv)
1227 {
1228         int ret;
1229
1230         read_lock(&tasklist_lock);
1231         ret = __kill_pgrp_info(sig, __si_special(priv), pid);
1232         read_unlock(&tasklist_lock);
1233
1234         return ret;
1235 }
1236 EXPORT_SYMBOL(kill_pgrp);
1237
1238 int kill_pid(struct pid *pid, int sig, int priv)
1239 {
1240         return kill_pid_info(sig, __si_special(priv), pid);
1241 }
1242 EXPORT_SYMBOL(kill_pid);
1243
1244 int
1245 kill_proc(pid_t pid, int sig, int priv)
1246 {
1247         int ret;
1248
1249         rcu_read_lock();
1250         ret = kill_pid_info(sig, __si_special(priv), find_pid(pid));
1251         rcu_read_unlock();
1252         return ret;
1253 }
1254
1255 /*
1256  * These functions support sending signals using preallocated sigqueue
1257  * structures.  This is needed "because realtime applications cannot
1258  * afford to lose notifications of asynchronous events, like timer
1259  * expirations or I/O completions".  In the case of Posix Timers
1260  * we allocate the sigqueue structure from the timer_create.  If this
1261  * allocation fails we are able to report the failure to the application
1262  * with an EAGAIN error.
1263  */
1264
1265 struct sigqueue *sigqueue_alloc(void)
1266 {
1267         struct sigqueue *q;
1268
1269         if ((q = __sigqueue_alloc(current, GFP_KERNEL, 0)))
1270                 q->flags |= SIGQUEUE_PREALLOC;
1271         return(q);
1272 }
1273
1274 void sigqueue_free(struct sigqueue *q)
1275 {
1276         unsigned long flags;
1277         spinlock_t *lock = &current->sighand->siglock;
1278
1279         BUG_ON(!(q->flags & SIGQUEUE_PREALLOC));
1280         /*
1281          * If the signal is still pending remove it from the
1282          * pending queue. We must hold ->siglock while testing
1283          * q->list to serialize with collect_signal().
1284          */
1285         spin_lock_irqsave(lock, flags);
1286         if (!list_empty(&q->list))
1287                 list_del_init(&q->list);
1288         spin_unlock_irqrestore(lock, flags);
1289
1290         q->flags &= ~SIGQUEUE_PREALLOC;
1291         __sigqueue_free(q);
1292 }
1293
1294 static int do_send_sigqueue(int sig, struct sigqueue *q, struct task_struct *t,
1295                 struct sigpending *pending)
1296 {
1297         if (unlikely(!list_empty(&q->list))) {
1298                 /*
1299                  * If an SI_TIMER entry is already queue just increment
1300                  * the overrun count.
1301                  */
1302
1303                 BUG_ON(q->info.si_code != SI_TIMER);
1304                 q->info.si_overrun++;
1305                 return 0;
1306         }
1307
1308         if (sig_ignored(t, sig))
1309                 return 1;
1310
1311         signalfd_notify(t, sig);
1312         list_add_tail(&q->list, &pending->list);
1313         sigaddset(&pending->signal, sig);
1314         return 0;
1315 }
1316
1317 int send_sigqueue(int sig, struct sigqueue *q, struct task_struct *p)
1318 {
1319         unsigned long flags;
1320         int ret = -1;
1321
1322         BUG_ON(!(q->flags & SIGQUEUE_PREALLOC));
1323
1324         /*
1325          * The rcu based delayed sighand destroy makes it possible to
1326          * run this without tasklist lock held. The task struct itself
1327          * cannot go away as create_timer did get_task_struct().
1328          *
1329          * We return -1, when the task is marked exiting, so
1330          * posix_timer_event can redirect it to the group leader
1331          */
1332         rcu_read_lock();
1333
1334         if (!likely(lock_task_sighand(p, &flags)))
1335                 goto out_err;
1336
1337         ret = do_send_sigqueue(sig, q, p, &p->pending);
1338
1339         if (!sigismember(&p->blocked, sig))
1340                 signal_wake_up(p, sig == SIGKILL);
1341
1342         unlock_task_sighand(p, &flags);
1343 out_err:
1344         rcu_read_unlock();
1345
1346         return ret;
1347 }
1348
1349 int
1350 send_group_sigqueue(int sig, struct sigqueue *q, struct task_struct *p)
1351 {
1352         unsigned long flags;
1353         int ret;
1354
1355         BUG_ON(!(q->flags & SIGQUEUE_PREALLOC));
1356
1357         read_lock(&tasklist_lock);
1358         /* Since it_lock is held, p->sighand cannot be NULL. */
1359         spin_lock_irqsave(&p->sighand->siglock, flags);
1360         handle_stop_signal(sig, p);
1361
1362         ret = do_send_sigqueue(sig, q, p, &p->signal->shared_pending);
1363
1364         __group_complete_signal(sig, p);
1365
1366         spin_unlock_irqrestore(&p->sighand->siglock, flags);
1367         read_unlock(&tasklist_lock);
1368         return ret;
1369 }
1370
1371 /*
1372  * Wake up any threads in the parent blocked in wait* syscalls.
1373  */
1374 static inline void __wake_up_parent(struct task_struct *p,
1375                                     struct task_struct *parent)
1376 {
1377         wake_up_interruptible_sync(&parent->signal->wait_chldexit);
1378 }
1379
1380 /*
1381  * Let a parent know about the death of a child.
1382  * For a stopped/continued status change, use do_notify_parent_cldstop instead.
1383  */
1384
1385 void do_notify_parent(struct task_struct *tsk, int sig)
1386 {
1387         struct siginfo info;
1388         unsigned long flags;
1389         struct sighand_struct *psig;
1390
1391         BUG_ON(sig == -1);
1392
1393         /* do_notify_parent_cldstop should have been called instead.  */
1394         BUG_ON(task_is_stopped_or_traced(tsk));
1395
1396         BUG_ON(!tsk->ptrace &&
1397                (tsk->group_leader != tsk || !thread_group_empty(tsk)));
1398
1399         info.si_signo = sig;
1400         info.si_errno = 0;
1401         /*
1402          * we are under tasklist_lock here so our parent is tied to
1403          * us and cannot exit and release its namespace.
1404          *
1405          * the only it can is to switch its nsproxy with sys_unshare,
1406          * bu uncharing pid namespaces is not allowed, so we'll always
1407          * see relevant namespace
1408          *
1409          * write_lock() currently calls preempt_disable() which is the
1410          * same as rcu_read_lock(), but according to Oleg, this is not
1411          * correct to rely on this
1412          */
1413         rcu_read_lock();
1414         info.si_pid = task_pid_nr_ns(tsk, tsk->parent->nsproxy->pid_ns);
1415         rcu_read_unlock();
1416
1417         info.si_uid = tsk->uid;
1418
1419         /* FIXME: find out whether or not this is supposed to be c*time. */
1420         info.si_utime = cputime_to_jiffies(cputime_add(tsk->utime,
1421                                                        tsk->signal->utime));
1422         info.si_stime = cputime_to_jiffies(cputime_add(tsk->stime,
1423                                                        tsk->signal->stime));
1424
1425         info.si_status = tsk->exit_code & 0x7f;
1426         if (tsk->exit_code & 0x80)
1427                 info.si_code = CLD_DUMPED;
1428         else if (tsk->exit_code & 0x7f)
1429                 info.si_code = CLD_KILLED;
1430         else {
1431                 info.si_code = CLD_EXITED;
1432                 info.si_status = tsk->exit_code >> 8;
1433         }
1434
1435         psig = tsk->parent->sighand;
1436         spin_lock_irqsave(&psig->siglock, flags);
1437         if (!tsk->ptrace && sig == SIGCHLD &&
1438             (psig->action[SIGCHLD-1].sa.sa_handler == SIG_IGN ||
1439              (psig->action[SIGCHLD-1].sa.sa_flags & SA_NOCLDWAIT))) {
1440                 /*
1441                  * We are exiting and our parent doesn't care.  POSIX.1
1442                  * defines special semantics for setting SIGCHLD to SIG_IGN
1443                  * or setting the SA_NOCLDWAIT flag: we should be reaped
1444                  * automatically and not left for our parent's wait4 call.
1445                  * Rather than having the parent do it as a magic kind of
1446                  * signal handler, we just set this to tell do_exit that we
1447                  * can be cleaned up without becoming a zombie.  Note that
1448                  * we still call __wake_up_parent in this case, because a
1449                  * blocked sys_wait4 might now return -ECHILD.
1450                  *
1451                  * Whether we send SIGCHLD or not for SA_NOCLDWAIT
1452                  * is implementation-defined: we do (if you don't want
1453                  * it, just use SIG_IGN instead).
1454                  */
1455                 tsk->exit_signal = -1;
1456                 if (psig->action[SIGCHLD-1].sa.sa_handler == SIG_IGN)
1457                         sig = 0;
1458         }
1459         if (valid_signal(sig) && sig > 0)
1460                 __group_send_sig_info(sig, &info, tsk->parent);
1461         __wake_up_parent(tsk, tsk->parent);
1462         spin_unlock_irqrestore(&psig->siglock, flags);
1463 }
1464
1465 static void do_notify_parent_cldstop(struct task_struct *tsk, int why)
1466 {
1467         struct siginfo info;
1468         unsigned long flags;
1469         struct task_struct *parent;
1470         struct sighand_struct *sighand;
1471
1472         if (tsk->ptrace & PT_PTRACED)
1473                 parent = tsk->parent;
1474         else {
1475                 tsk = tsk->group_leader;
1476                 parent = tsk->real_parent;
1477         }
1478
1479         info.si_signo = SIGCHLD;
1480         info.si_errno = 0;
1481         /*
1482          * see comment in do_notify_parent() abot the following 3 lines
1483          */
1484         rcu_read_lock();
1485         info.si_pid = task_pid_nr_ns(tsk, tsk->parent->nsproxy->pid_ns);
1486         rcu_read_unlock();
1487
1488         info.si_uid = tsk->uid;
1489
1490         /* FIXME: find out whether or not this is supposed to be c*time. */
1491         info.si_utime = cputime_to_jiffies(tsk->utime);
1492         info.si_stime = cputime_to_jiffies(tsk->stime);
1493
1494         info.si_code = why;
1495         switch (why) {
1496         case CLD_CONTINUED:
1497                 info.si_status = SIGCONT;
1498                 break;
1499         case CLD_STOPPED:
1500                 info.si_status = tsk->signal->group_exit_code & 0x7f;
1501                 break;
1502         case CLD_TRAPPED:
1503                 info.si_status = tsk->exit_code & 0x7f;
1504                 break;
1505         default:
1506                 BUG();
1507         }
1508
1509         sighand = parent->sighand;
1510         spin_lock_irqsave(&sighand->siglock, flags);
1511         if (sighand->action[SIGCHLD-1].sa.sa_handler != SIG_IGN &&
1512             !(sighand->action[SIGCHLD-1].sa.sa_flags & SA_NOCLDSTOP))
1513                 __group_send_sig_info(SIGCHLD, &info, parent);
1514         /*
1515          * Even if SIGCHLD is not generated, we must wake up wait4 calls.
1516          */
1517         __wake_up_parent(tsk, parent);
1518         spin_unlock_irqrestore(&sighand->siglock, flags);
1519 }
1520
1521 static inline int may_ptrace_stop(void)
1522 {
1523         if (!likely(current->ptrace & PT_PTRACED))
1524                 return 0;
1525         /*
1526          * Are we in the middle of do_coredump?
1527          * If so and our tracer is also part of the coredump stopping
1528          * is a deadlock situation, and pointless because our tracer
1529          * is dead so don't allow us to stop.
1530          * If SIGKILL was already sent before the caller unlocked
1531          * ->siglock we must see ->core_waiters != 0. Otherwise it
1532          * is safe to enter schedule().
1533          */
1534         if (unlikely(current->mm->core_waiters) &&
1535             unlikely(current->mm == current->parent->mm))
1536                 return 0;
1537
1538         return 1;
1539 }
1540
1541 /*
1542  * Return nonzero if there is a SIGKILL that should be waking us up.
1543  * Called with the siglock held.
1544  */
1545 static int sigkill_pending(struct task_struct *tsk)
1546 {
1547         return ((sigismember(&tsk->pending.signal, SIGKILL) ||
1548                  sigismember(&tsk->signal->shared_pending.signal, SIGKILL)) &&
1549                 !unlikely(sigismember(&tsk->blocked, SIGKILL)));
1550 }
1551
1552 /*
1553  * This must be called with current->sighand->siglock held.
1554  *
1555  * This should be the path for all ptrace stops.
1556  * We always set current->last_siginfo while stopped here.
1557  * That makes it a way to test a stopped process for
1558  * being ptrace-stopped vs being job-control-stopped.
1559  *
1560  * If we actually decide not to stop at all because the tracer
1561  * is gone, we keep current->exit_code unless clear_code.
1562  */
1563 static void ptrace_stop(int exit_code, int clear_code, siginfo_t *info)
1564 {
1565         int killed = 0;
1566
1567         if (arch_ptrace_stop_needed(exit_code, info)) {
1568                 /*
1569                  * The arch code has something special to do before a
1570                  * ptrace stop.  This is allowed to block, e.g. for faults
1571                  * on user stack pages.  We can't keep the siglock while
1572                  * calling arch_ptrace_stop, so we must release it now.
1573                  * To preserve proper semantics, we must do this before
1574                  * any signal bookkeeping like checking group_stop_count.
1575                  * Meanwhile, a SIGKILL could come in before we retake the
1576                  * siglock.  That must prevent us from sleeping in TASK_TRACED.
1577                  * So after regaining the lock, we must check for SIGKILL.
1578                  */
1579                 spin_unlock_irq(&current->sighand->siglock);
1580                 arch_ptrace_stop(exit_code, info);
1581                 spin_lock_irq(&current->sighand->siglock);
1582                 killed = sigkill_pending(current);
1583         }
1584
1585         /*
1586          * If there is a group stop in progress,
1587          * we must participate in the bookkeeping.
1588          */
1589         if (current->signal->group_stop_count > 0)
1590                 --current->signal->group_stop_count;
1591
1592         current->last_siginfo = info;
1593         current->exit_code = exit_code;
1594
1595         /* Let the debugger run.  */
1596         __set_current_state(TASK_TRACED);
1597         spin_unlock_irq(&current->sighand->siglock);
1598         read_lock(&tasklist_lock);
1599         if (!unlikely(killed) && may_ptrace_stop()) {
1600                 do_notify_parent_cldstop(current, CLD_TRAPPED);
1601                 read_unlock(&tasklist_lock);
1602                 schedule();
1603         } else {
1604                 /*
1605                  * By the time we got the lock, our tracer went away.
1606                  * Don't drop the lock yet, another tracer may come.
1607                  */
1608                 __set_current_state(TASK_RUNNING);
1609                 if (clear_code)
1610                         current->exit_code = 0;
1611                 read_unlock(&tasklist_lock);
1612         }
1613
1614         /*
1615          * While in TASK_TRACED, we were considered "frozen enough".
1616          * Now that we woke up, it's crucial if we're supposed to be
1617          * frozen that we freeze now before running anything substantial.
1618          */
1619         try_to_freeze();
1620
1621         /*
1622          * We are back.  Now reacquire the siglock before touching
1623          * last_siginfo, so that we are sure to have synchronized with
1624          * any signal-sending on another CPU that wants to examine it.
1625          */
1626         spin_lock_irq(&current->sighand->siglock);
1627         current->last_siginfo = NULL;
1628
1629         /*
1630          * Queued signals ignored us while we were stopped for tracing.
1631          * So check for any that we should take before resuming user mode.
1632          * This sets TIF_SIGPENDING, but never clears it.
1633          */
1634         recalc_sigpending_tsk(current);
1635 }
1636
1637 void ptrace_notify(int exit_code)
1638 {
1639         siginfo_t info;
1640
1641         BUG_ON((exit_code & (0x7f | ~0xffff)) != SIGTRAP);
1642
1643         memset(&info, 0, sizeof info);
1644         info.si_signo = SIGTRAP;
1645         info.si_code = exit_code;
1646         info.si_pid = task_pid_vnr(current);
1647         info.si_uid = current->uid;
1648
1649         /* Let the debugger run.  */
1650         spin_lock_irq(&current->sighand->siglock);
1651         ptrace_stop(exit_code, 1, &info);
1652         spin_unlock_irq(&current->sighand->siglock);
1653 }
1654
1655 static void
1656 finish_stop(int stop_count)
1657 {
1658         /*
1659          * If there are no other threads in the group, or if there is
1660          * a group stop in progress and we are the last to stop,
1661          * report to the parent.  When ptraced, every thread reports itself.
1662          */
1663         if (stop_count == 0 || (current->ptrace & PT_PTRACED)) {
1664                 read_lock(&tasklist_lock);
1665                 do_notify_parent_cldstop(current, CLD_STOPPED);
1666                 read_unlock(&tasklist_lock);
1667         }
1668
1669         do {
1670                 schedule();
1671         } while (try_to_freeze());
1672         /*
1673          * Now we don't run again until continued.
1674          */
1675         current->exit_code = 0;
1676 }
1677
1678 /*
1679  * This performs the stopping for SIGSTOP and other stop signals.
1680  * We have to stop all threads in the thread group.
1681  * Returns nonzero if we've actually stopped and released the siglock.
1682  * Returns zero if we didn't stop and still hold the siglock.
1683  */
1684 static int do_signal_stop(int signr)
1685 {
1686         struct signal_struct *sig = current->signal;
1687         int stop_count;
1688
1689         if (sig->group_stop_count > 0) {
1690                 /*
1691                  * There is a group stop in progress.  We don't need to
1692                  * start another one.
1693                  */
1694                 stop_count = --sig->group_stop_count;
1695         } else {
1696                 struct task_struct *t;
1697
1698                 if (!likely(sig->flags & SIGNAL_STOP_DEQUEUED) ||
1699                     unlikely(signal_group_exit(sig)))
1700                         return 0;
1701                 /*
1702                  * There is no group stop already in progress.
1703                  * We must initiate one now.
1704                  */
1705                 sig->group_exit_code = signr;
1706
1707                 stop_count = 0;
1708                 for (t = next_thread(current); t != current; t = next_thread(t))
1709                         /*
1710                          * Setting state to TASK_STOPPED for a group
1711                          * stop is always done with the siglock held,
1712                          * so this check has no races.
1713                          */
1714                         if (!(t->flags & PF_EXITING) &&
1715                             !task_is_stopped_or_traced(t)) {
1716                                 stop_count++;
1717                                 signal_wake_up(t, 0);
1718                         }
1719                 sig->group_stop_count = stop_count;
1720         }
1721
1722         if (stop_count == 0)
1723                 sig->flags = SIGNAL_STOP_STOPPED;
1724         current->exit_code = sig->group_exit_code;
1725         __set_current_state(TASK_STOPPED);
1726
1727         spin_unlock_irq(&current->sighand->siglock);
1728         finish_stop(stop_count);
1729         return 1;
1730 }
1731
1732 static int ptrace_signal(int signr, siginfo_t *info,
1733                          struct pt_regs *regs, void *cookie)
1734 {
1735         if (!(current->ptrace & PT_PTRACED))
1736                 return signr;
1737
1738         ptrace_signal_deliver(regs, cookie);
1739
1740         /* Let the debugger run.  */
1741         ptrace_stop(signr, 0, info);
1742
1743         /* We're back.  Did the debugger cancel the sig?  */
1744         signr = current->exit_code;
1745         if (signr == 0)
1746                 return signr;
1747
1748         current->exit_code = 0;
1749
1750         /* Update the siginfo structure if the signal has
1751            changed.  If the debugger wanted something
1752            specific in the siginfo structure then it should
1753            have updated *info via PTRACE_SETSIGINFO.  */
1754         if (signr != info->si_signo) {
1755                 info->si_signo = signr;
1756                 info->si_errno = 0;
1757                 info->si_code = SI_USER;
1758                 info->si_pid = task_pid_vnr(current->parent);
1759                 info->si_uid = current->parent->uid;
1760         }
1761
1762         /* If the (new) signal is now blocked, requeue it.  */
1763         if (sigismember(&current->blocked, signr)) {
1764                 specific_send_sig_info(signr, info, current);
1765                 signr = 0;
1766         }
1767
1768         return signr;
1769 }
1770
1771 int get_signal_to_deliver(siginfo_t *info, struct k_sigaction *return_ka,
1772                           struct pt_regs *regs, void *cookie)
1773 {
1774         sigset_t *mask = &current->blocked;
1775         int signr = 0;
1776
1777 relock:
1778         /*
1779          * We'll jump back here after any time we were stopped in TASK_STOPPED.
1780          * While in TASK_STOPPED, we were considered "frozen enough".
1781          * Now that we woke up, it's crucial if we're supposed to be
1782          * frozen that we freeze now before running anything substantial.
1783          */
1784         try_to_freeze();
1785
1786         spin_lock_irq(&current->sighand->siglock);
1787         for (;;) {
1788                 struct k_sigaction *ka;
1789
1790                 if (unlikely(current->signal->group_stop_count > 0) &&
1791                     do_signal_stop(0))
1792                         goto relock;
1793
1794                 signr = dequeue_signal(current, mask, info);
1795
1796                 if (!signr)
1797                         break; /* will return 0 */
1798
1799                 if (signr != SIGKILL) {
1800                         signr = ptrace_signal(signr, info, regs, cookie);
1801                         if (!signr)
1802                                 continue;
1803                 }
1804
1805                 ka = &current->sighand->action[signr-1];
1806                 if (ka->sa.sa_handler == SIG_IGN) /* Do nothing.  */
1807                         continue;
1808                 if (ka->sa.sa_handler != SIG_DFL) {
1809                         /* Run the handler.  */
1810                         *return_ka = *ka;
1811
1812                         if (ka->sa.sa_flags & SA_ONESHOT)
1813                                 ka->sa.sa_handler = SIG_DFL;
1814
1815                         break; /* will return non-zero "signr" value */
1816                 }
1817
1818                 /*
1819                  * Now we are doing the default action for this signal.
1820                  */
1821                 if (sig_kernel_ignore(signr)) /* Default is nothing. */
1822                         continue;
1823
1824                 /*
1825                  * Global init gets no signals it doesn't want.
1826                  */
1827                 if (is_global_init(current))
1828                         continue;
1829
1830                 if (sig_kernel_stop(signr)) {
1831                         /*
1832                          * The default action is to stop all threads in
1833                          * the thread group.  The job control signals
1834                          * do nothing in an orphaned pgrp, but SIGSTOP
1835                          * always works.  Note that siglock needs to be
1836                          * dropped during the call to is_orphaned_pgrp()
1837                          * because of lock ordering with tasklist_lock.
1838                          * This allows an intervening SIGCONT to be posted.
1839                          * We need to check for that and bail out if necessary.
1840                          */
1841                         if (signr != SIGSTOP) {
1842                                 spin_unlock_irq(&current->sighand->siglock);
1843
1844                                 /* signals can be posted during this window */
1845
1846                                 if (is_current_pgrp_orphaned())
1847                                         goto relock;
1848
1849                                 spin_lock_irq(&current->sighand->siglock);
1850                         }
1851
1852                         if (likely(do_signal_stop(signr))) {
1853                                 /* It released the siglock.  */
1854                                 goto relock;
1855                         }
1856
1857                         /*
1858                          * We didn't actually stop, due to a race
1859                          * with SIGCONT or something like that.
1860                          */
1861                         continue;
1862                 }
1863
1864                 spin_unlock_irq(&current->sighand->siglock);
1865
1866                 /*
1867                  * Anything else is fatal, maybe with a core dump.
1868                  */
1869                 current->flags |= PF_SIGNALED;
1870                 if ((signr != SIGKILL) && print_fatal_signals)
1871                         print_fatal_signal(regs, signr);
1872                 if (sig_kernel_coredump(signr)) {
1873                         /*
1874                          * If it was able to dump core, this kills all
1875                          * other threads in the group and synchronizes with
1876                          * their demise.  If we lost the race with another
1877                          * thread getting here, it set group_exit_code
1878                          * first and our do_group_exit call below will use
1879                          * that value and ignore the one we pass it.
1880                          */
1881                         do_coredump((long)signr, signr, regs);
1882                 }
1883
1884                 /*
1885                  * Death signals, no core dump.
1886                  */
1887                 do_group_exit(signr);
1888                 /* NOTREACHED */
1889         }
1890         spin_unlock_irq(&current->sighand->siglock);
1891         return signr;
1892 }
1893
1894 void exit_signals(struct task_struct *tsk)
1895 {
1896         int group_stop = 0;
1897         struct task_struct *t;
1898
1899         if (thread_group_empty(tsk) || signal_group_exit(tsk->signal)) {
1900                 tsk->flags |= PF_EXITING;
1901                 return;
1902         }
1903
1904         spin_lock_irq(&tsk->sighand->siglock);
1905         /*
1906          * From now this task is not visible for group-wide signals,
1907          * see wants_signal(), do_signal_stop().
1908          */
1909         tsk->flags |= PF_EXITING;
1910         if (!signal_pending(tsk))
1911                 goto out;
1912
1913         /* It could be that __group_complete_signal() choose us to
1914          * notify about group-wide signal. Another thread should be
1915          * woken now to take the signal since we will not.
1916          */
1917         for (t = tsk; (t = next_thread(t)) != tsk; )
1918                 if (!signal_pending(t) && !(t->flags & PF_EXITING))
1919                         recalc_sigpending_and_wake(t);
1920
1921         if (unlikely(tsk->signal->group_stop_count) &&
1922                         !--tsk->signal->group_stop_count) {
1923                 tsk->signal->flags = SIGNAL_STOP_STOPPED;
1924                 group_stop = 1;
1925         }
1926 out:
1927         spin_unlock_irq(&tsk->sighand->siglock);
1928
1929         if (unlikely(group_stop)) {
1930                 read_lock(&tasklist_lock);
1931                 do_notify_parent_cldstop(tsk, CLD_STOPPED);
1932                 read_unlock(&tasklist_lock);
1933         }
1934 }
1935
1936 EXPORT_SYMBOL(recalc_sigpending);
1937 EXPORT_SYMBOL_GPL(dequeue_signal);
1938 EXPORT_SYMBOL(flush_signals);
1939 EXPORT_SYMBOL(force_sig);
1940 EXPORT_SYMBOL(kill_proc);
1941 EXPORT_SYMBOL(ptrace_notify);
1942 EXPORT_SYMBOL(send_sig);
1943 EXPORT_SYMBOL(send_sig_info);
1944 EXPORT_SYMBOL(sigprocmask);
1945 EXPORT_SYMBOL(block_all_signals);
1946 EXPORT_SYMBOL(unblock_all_signals);
1947
1948
1949 /*
1950  * System call entry points.
1951  */
1952
1953 asmlinkage long sys_restart_syscall(void)
1954 {
1955         struct restart_block *restart = &current_thread_info()->restart_block;
1956         return restart->fn(restart);
1957 }
1958
1959 long do_no_restart_syscall(struct restart_block *param)
1960 {
1961         return -EINTR;
1962 }
1963
1964 /*
1965  * We don't need to get the kernel lock - this is all local to this
1966  * particular thread.. (and that's good, because this is _heavily_
1967  * used by various programs)
1968  */
1969
1970 /*
1971  * This is also useful for kernel threads that want to temporarily
1972  * (or permanently) block certain signals.
1973  *
1974  * NOTE! Unlike the user-mode sys_sigprocmask(), the kernel
1975  * interface happily blocks "unblockable" signals like SIGKILL
1976  * and friends.
1977  */
1978 int sigprocmask(int how, sigset_t *set, sigset_t *oldset)
1979 {
1980         int error;
1981
1982         spin_lock_irq(&current->sighand->siglock);
1983         if (oldset)
1984                 *oldset = current->blocked;
1985
1986         error = 0;
1987         switch (how) {
1988         case SIG_BLOCK:
1989                 sigorsets(&current->blocked, &current->blocked, set);
1990                 break;
1991         case SIG_UNBLOCK:
1992                 signandsets(&current->blocked, &current->blocked, set);
1993                 break;
1994         case SIG_SETMASK:
1995                 current->blocked = *set;
1996                 break;
1997         default:
1998                 error = -EINVAL;
1999         }
2000         recalc_sigpending();
2001         spin_unlock_irq(&current->sighand->siglock);
2002
2003         return error;
2004 }
2005
2006 asmlinkage long
2007 sys_rt_sigprocmask(int how, sigset_t __user *set, sigset_t __user *oset, size_t sigsetsize)
2008 {
2009         int error = -EINVAL;
2010         sigset_t old_set, new_set;
2011
2012         /* XXX: Don't preclude handling different sized sigset_t's.  */
2013         if (sigsetsize != sizeof(sigset_t))
2014                 goto out;
2015
2016         if (set) {
2017                 error = -EFAULT;
2018                 if (copy_from_user(&new_set, set, sizeof(*set)))
2019                         goto out;
2020                 sigdelsetmask(&new_set, sigmask(SIGKILL)|sigmask(SIGSTOP));
2021
2022                 error = sigprocmask(how, &new_set, &old_set);
2023                 if (error)
2024                         goto out;
2025                 if (oset)
2026                         goto set_old;
2027         } else if (oset) {
2028                 spin_lock_irq(&current->sighand->siglock);
2029                 old_set = current->blocked;
2030                 spin_unlock_irq(&current->sighand->siglock);
2031
2032         set_old:
2033                 error = -EFAULT;
2034                 if (copy_to_user(oset, &old_set, sizeof(*oset)))
2035                         goto out;
2036         }
2037         error = 0;
2038 out:
2039         return error;
2040 }
2041
2042 long do_sigpending(void __user *set, unsigned long sigsetsize)
2043 {
2044         long error = -EINVAL;
2045         sigset_t pending;
2046
2047         if (sigsetsize > sizeof(sigset_t))
2048                 goto out;
2049
2050         spin_lock_irq(&current->sighand->siglock);
2051         sigorsets(&pending, &current->pending.signal,
2052                   &current->signal->shared_pending.signal);
2053         spin_unlock_irq(&current->sighand->siglock);
2054
2055         /* Outside the lock because only this thread touches it.  */
2056         sigandsets(&pending, &current->blocked, &pending);
2057
2058         error = -EFAULT;
2059         if (!copy_to_user(set, &pending, sigsetsize))
2060                 error = 0;
2061
2062 out:
2063         return error;
2064 }
2065
2066 asmlinkage long
2067 sys_rt_sigpending(sigset_t __user *set, size_t sigsetsize)
2068 {
2069         return do_sigpending(set, sigsetsize);
2070 }
2071
2072 #ifndef HAVE_ARCH_COPY_SIGINFO_TO_USER
2073
2074 int copy_siginfo_to_user(siginfo_t __user *to, siginfo_t *from)
2075 {
2076         int err;
2077
2078         if (!access_ok (VERIFY_WRITE, to, sizeof(siginfo_t)))
2079                 return -EFAULT;
2080         if (from->si_code < 0)
2081                 return __copy_to_user(to, from, sizeof(siginfo_t))
2082                         ? -EFAULT : 0;
2083         /*
2084          * If you change siginfo_t structure, please be sure
2085          * this code is fixed accordingly.
2086          * Please remember to update the signalfd_copyinfo() function
2087          * inside fs/signalfd.c too, in case siginfo_t changes.
2088          * It should never copy any pad contained in the structure
2089          * to avoid security leaks, but must copy the generic
2090          * 3 ints plus the relevant union member.
2091          */
2092         err = __put_user(from->si_signo, &to->si_signo);
2093         err |= __put_user(from->si_errno, &to->si_errno);
2094         err |= __put_user((short)from->si_code, &to->si_code);
2095         switch (from->si_code & __SI_MASK) {
2096         case __SI_KILL:
2097                 err |= __put_user(from->si_pid, &to->si_pid);
2098                 err |= __put_user(from->si_uid, &to->si_uid);
2099                 break;
2100         case __SI_TIMER:
2101                  err |= __put_user(from->si_tid, &to->si_tid);
2102                  err |= __put_user(from->si_overrun, &to->si_overrun);
2103                  err |= __put_user(from->si_ptr, &to->si_ptr);
2104                 break;
2105         case __SI_POLL:
2106                 err |= __put_user(from->si_band, &to->si_band);
2107                 err |= __put_user(from->si_fd, &to->si_fd);
2108                 break;
2109         case __SI_FAULT:
2110                 err |= __put_user(from->si_addr, &to->si_addr);
2111 #ifdef __ARCH_SI_TRAPNO
2112                 err |= __put_user(from->si_trapno, &to->si_trapno);
2113 #endif
2114                 break;
2115         case __SI_CHLD:
2116                 err |= __put_user(from->si_pid, &to->si_pid);
2117                 err |= __put_user(from->si_uid, &to->si_uid);
2118                 err |= __put_user(from->si_status, &to->si_status);
2119                 err |= __put_user(from->si_utime, &to->si_utime);
2120                 err |= __put_user(from->si_stime, &to->si_stime);
2121                 break;
2122         case __SI_RT: /* This is not generated by the kernel as of now. */
2123         case __SI_MESGQ: /* But this is */
2124                 err |= __put_user(from->si_pid, &to->si_pid);
2125                 err |= __put_user(from->si_uid, &to->si_uid);
2126                 err |= __put_user(from->si_ptr, &to->si_ptr);
2127                 break;
2128         default: /* this is just in case for now ... */
2129                 err |= __put_user(from->si_pid, &to->si_pid);
2130                 err |= __put_user(from->si_uid, &to->si_uid);
2131                 break;
2132         }
2133         return err;
2134 }
2135
2136 #endif
2137
2138 asmlinkage long
2139 sys_rt_sigtimedwait(const sigset_t __user *uthese,
2140                     siginfo_t __user *uinfo,
2141                     const struct timespec __user *uts,
2142                     size_t sigsetsize)
2143 {
2144         int ret, sig;
2145         sigset_t these;
2146         struct timespec ts;
2147         siginfo_t info;
2148         long timeout = 0;
2149
2150         /* XXX: Don't preclude handling different sized sigset_t's.  */
2151         if (sigsetsize != sizeof(sigset_t))
2152                 return -EINVAL;
2153
2154         if (copy_from_user(&these, uthese, sizeof(these)))
2155                 return -EFAULT;
2156
2157         /*
2158          * Invert the set of allowed signals to get those we
2159          * want to block.
2160          */
2161         sigdelsetmask(&these, sigmask(SIGKILL)|sigmask(SIGSTOP));
2162         signotset(&these);
2163
2164         if (uts) {
2165                 if (copy_from_user(&ts, uts, sizeof(ts)))
2166                         return -EFAULT;
2167                 if (ts.tv_nsec >= 1000000000L || ts.tv_nsec < 0
2168                     || ts.tv_sec < 0)
2169                         return -EINVAL;
2170         }
2171
2172         spin_lock_irq(&current->sighand->siglock);
2173         sig = dequeue_signal(current, &these, &info);
2174         if (!sig) {
2175                 timeout = MAX_SCHEDULE_TIMEOUT;
2176                 if (uts)
2177                         timeout = (timespec_to_jiffies(&ts)
2178                                    + (ts.tv_sec || ts.tv_nsec));
2179
2180                 if (timeout) {
2181                         /* None ready -- temporarily unblock those we're
2182                          * interested while we are sleeping in so that we'll
2183                          * be awakened when they arrive.  */
2184                         current->real_blocked = current->blocked;
2185                         sigandsets(&current->blocked, &current->blocked, &these);
2186                         recalc_sigpending();
2187                         spin_unlock_irq(&current->sighand->siglock);
2188
2189                         timeout = schedule_timeout_interruptible(timeout);
2190
2191                         spin_lock_irq(&current->sighand->siglock);
2192                         sig = dequeue_signal(current, &these, &info);
2193                         current->blocked = current->real_blocked;
2194                         siginitset(&current->real_blocked, 0);
2195                         recalc_sigpending();
2196                 }
2197         }
2198         spin_unlock_irq(&current->sighand->siglock);
2199
2200         if (sig) {
2201                 ret = sig;
2202                 if (uinfo) {
2203                         if (copy_siginfo_to_user(uinfo, &info))
2204                                 ret = -EFAULT;
2205                 }
2206         } else {
2207                 ret = -EAGAIN;
2208                 if (timeout)
2209                         ret = -EINTR;
2210         }
2211
2212         return ret;
2213 }
2214
2215 asmlinkage long
2216 sys_kill(int pid, int sig)
2217 {
2218         struct siginfo info;
2219
2220         info.si_signo = sig;
2221         info.si_errno = 0;
2222         info.si_code = SI_USER;
2223         info.si_pid = task_tgid_vnr(current);
2224         info.si_uid = current->uid;
2225
2226         return kill_something_info(sig, &info, pid);
2227 }
2228
2229 static int do_tkill(int tgid, int pid, int sig)
2230 {
2231         int error;
2232         struct siginfo info;
2233         struct task_struct *p;
2234
2235         error = -ESRCH;
2236         info.si_signo = sig;
2237         info.si_errno = 0;
2238         info.si_code = SI_TKILL;
2239         info.si_pid = task_tgid_vnr(current);
2240         info.si_uid = current->uid;
2241
2242         read_lock(&tasklist_lock);
2243         p = find_task_by_vpid(pid);
2244         if (p && (tgid <= 0 || task_tgid_vnr(p) == tgid)) {
2245                 error = check_kill_permission(sig, &info, p);
2246                 /*
2247                  * The null signal is a permissions and process existence
2248                  * probe.  No signal is actually delivered.
2249                  */
2250                 if (!error && sig && p->sighand) {
2251                         spin_lock_irq(&p->sighand->siglock);
2252                         handle_stop_signal(sig, p);
2253                         error = specific_send_sig_info(sig, &info, p);
2254                         spin_unlock_irq(&p->sighand->siglock);
2255                 }
2256         }
2257         read_unlock(&tasklist_lock);
2258
2259         return error;
2260 }
2261
2262 /**
2263  *  sys_tgkill - send signal to one specific thread
2264  *  @tgid: the thread group ID of the thread
2265  *  @pid: the PID of the thread
2266  *  @sig: signal to be sent
2267  *
2268  *  This syscall also checks the @tgid and returns -ESRCH even if the PID
2269  *  exists but it's not belonging to the target process anymore. This
2270  *  method solves the problem of threads exiting and PIDs getting reused.
2271  */
2272 asmlinkage long sys_tgkill(int tgid, int pid, int sig)
2273 {
2274         /* This is only valid for single tasks */
2275         if (pid <= 0 || tgid <= 0)
2276                 return -EINVAL;
2277
2278         return do_tkill(tgid, pid, sig);
2279 }
2280
2281 /*
2282  *  Send a signal to only one task, even if it's a CLONE_THREAD task.
2283  */
2284 asmlinkage long
2285 sys_tkill(int pid, int sig)
2286 {
2287         /* This is only valid for single tasks */
2288         if (pid <= 0)
2289                 return -EINVAL;
2290
2291         return do_tkill(0, pid, sig);
2292 }
2293
2294 asmlinkage long
2295 sys_rt_sigqueueinfo(int pid, int sig, siginfo_t __user *uinfo)
2296 {
2297         siginfo_t info;
2298
2299         if (copy_from_user(&info, uinfo, sizeof(siginfo_t)))
2300                 return -EFAULT;
2301
2302         /* Not even root can pretend to send signals from the kernel.
2303            Nor can they impersonate a kill(), which adds source info.  */
2304         if (info.si_code >= 0)
2305                 return -EPERM;
2306         info.si_signo = sig;
2307
2308         /* POSIX.1b doesn't mention process groups.  */
2309         return kill_proc_info(sig, &info, pid);
2310 }
2311
2312 int do_sigaction(int sig, struct k_sigaction *act, struct k_sigaction *oact)
2313 {
2314         struct task_struct *t = current;
2315         struct k_sigaction *k;
2316         sigset_t mask;
2317
2318         if (!valid_signal(sig) || sig < 1 || (act && sig_kernel_only(sig)))
2319                 return -EINVAL;
2320
2321         k = &t->sighand->action[sig-1];
2322
2323         spin_lock_irq(&current->sighand->siglock);
2324         if (oact)
2325                 *oact = *k;
2326
2327         if (act) {
2328                 sigdelsetmask(&act->sa.sa_mask,
2329                               sigmask(SIGKILL) | sigmask(SIGSTOP));
2330                 *k = *act;
2331                 /*
2332                  * POSIX 3.3.1.3:
2333                  *  "Setting a signal action to SIG_IGN for a signal that is
2334                  *   pending shall cause the pending signal to be discarded,
2335                  *   whether or not it is blocked."
2336                  *
2337                  *  "Setting a signal action to SIG_DFL for a signal that is
2338                  *   pending and whose default action is to ignore the signal
2339                  *   (for example, SIGCHLD), shall cause the pending signal to
2340                  *   be discarded, whether or not it is blocked"
2341                  */
2342                 if (__sig_ignored(t, sig)) {
2343                         sigemptyset(&mask);
2344                         sigaddset(&mask, sig);
2345                         rm_from_queue_full(&mask, &t->signal->shared_pending);
2346                         do {
2347                                 rm_from_queue_full(&mask, &t->pending);
2348                                 t = next_thread(t);
2349                         } while (t != current);
2350                 }
2351         }
2352
2353         spin_unlock_irq(&current->sighand->siglock);
2354         return 0;
2355 }
2356
2357 int
2358 do_sigaltstack (const stack_t __user *uss, stack_t __user *uoss, unsigned long sp)
2359 {
2360         stack_t oss;
2361         int error;
2362
2363         if (uoss) {
2364                 oss.ss_sp = (void __user *) current->sas_ss_sp;
2365                 oss.ss_size = current->sas_ss_size;
2366                 oss.ss_flags = sas_ss_flags(sp);
2367         }
2368
2369         if (uss) {
2370                 void __user *ss_sp;
2371                 size_t ss_size;
2372                 int ss_flags;
2373
2374                 error = -EFAULT;
2375                 if (!access_ok(VERIFY_READ, uss, sizeof(*uss))
2376                     || __get_user(ss_sp, &uss->ss_sp)
2377                     || __get_user(ss_flags, &uss->ss_flags)
2378                     || __get_user(ss_size, &uss->ss_size))
2379                         goto out;
2380
2381                 error = -EPERM;
2382                 if (on_sig_stack(sp))
2383                         goto out;
2384
2385                 error = -EINVAL;
2386                 /*
2387                  *
2388                  * Note - this code used to test ss_flags incorrectly
2389                  *        old code may have been written using ss_flags==0
2390                  *        to mean ss_flags==SS_ONSTACK (as this was the only
2391                  *        way that worked) - this fix preserves that older
2392                  *        mechanism
2393                  */
2394                 if (ss_flags != SS_DISABLE && ss_flags != SS_ONSTACK && ss_flags != 0)
2395                         goto out;
2396
2397                 if (ss_flags == SS_DISABLE) {
2398                         ss_size = 0;
2399                         ss_sp = NULL;
2400                 } else {
2401                         error = -ENOMEM;
2402                         if (ss_size < MINSIGSTKSZ)
2403                                 goto out;
2404                 }
2405
2406                 current->sas_ss_sp = (unsigned long) ss_sp;
2407                 current->sas_ss_size = ss_size;
2408         }
2409
2410         if (uoss) {
2411                 error = -EFAULT;
2412                 if (copy_to_user(uoss, &oss, sizeof(oss)))
2413                         goto out;
2414         }
2415
2416         error = 0;
2417 out:
2418         return error;
2419 }
2420
2421 #ifdef __ARCH_WANT_SYS_SIGPENDING
2422
2423 asmlinkage long
2424 sys_sigpending(old_sigset_t __user *set)
2425 {
2426         return do_sigpending(set, sizeof(*set));
2427 }
2428
2429 #endif
2430
2431 #ifdef __ARCH_WANT_SYS_SIGPROCMASK
2432 /* Some platforms have their own version with special arguments others
2433    support only sys_rt_sigprocmask.  */
2434
2435 asmlinkage long
2436 sys_sigprocmask(int how, old_sigset_t __user *set, old_sigset_t __user *oset)
2437 {
2438         int error;
2439         old_sigset_t old_set, new_set;
2440
2441         if (set) {
2442                 error = -EFAULT;
2443                 if (copy_from_user(&new_set, set, sizeof(*set)))
2444                         goto out;
2445                 new_set &= ~(sigmask(SIGKILL) | sigmask(SIGSTOP));
2446
2447                 spin_lock_irq(&current->sighand->siglock);
2448                 old_set = current->blocked.sig[0];
2449
2450                 error = 0;
2451                 switch (how) {
2452                 default:
2453                         error = -EINVAL;
2454                         break;
2455                 case SIG_BLOCK:
2456                         sigaddsetmask(&current->blocked, new_set);
2457                         break;
2458                 case SIG_UNBLOCK:
2459                         sigdelsetmask(&current->blocked, new_set);
2460                         break;
2461                 case SIG_SETMASK:
2462                         current->blocked.sig[0] = new_set;
2463                         break;
2464                 }
2465
2466                 recalc_sigpending();
2467                 spin_unlock_irq(&current->sighand->siglock);
2468                 if (error)
2469                         goto out;
2470                 if (oset)
2471                         goto set_old;
2472         } else if (oset) {
2473                 old_set = current->blocked.sig[0];
2474         set_old:
2475                 error = -EFAULT;
2476                 if (copy_to_user(oset, &old_set, sizeof(*oset)))
2477                         goto out;
2478         }
2479         error = 0;
2480 out:
2481         return error;
2482 }
2483 #endif /* __ARCH_WANT_SYS_SIGPROCMASK */
2484
2485 #ifdef __ARCH_WANT_SYS_RT_SIGACTION
2486 asmlinkage long
2487 sys_rt_sigaction(int sig,
2488                  const struct sigaction __user *act,
2489                  struct sigaction __user *oact,
2490                  size_t sigsetsize)
2491 {
2492         struct k_sigaction new_sa, old_sa;
2493         int ret = -EINVAL;
2494
2495         /* XXX: Don't preclude handling different sized sigset_t's.  */
2496         if (sigsetsize != sizeof(sigset_t))
2497                 goto out;
2498
2499         if (act) {
2500                 if (copy_from_user(&new_sa.sa, act, sizeof(new_sa.sa)))
2501                         return -EFAULT;
2502         }
2503
2504         ret = do_sigaction(sig, act ? &new_sa : NULL, oact ? &old_sa : NULL);
2505
2506         if (!ret && oact) {
2507                 if (copy_to_user(oact, &old_sa.sa, sizeof(old_sa.sa)))
2508                         return -EFAULT;
2509         }
2510 out:
2511         return ret;
2512 }
2513 #endif /* __ARCH_WANT_SYS_RT_SIGACTION */
2514
2515 #ifdef __ARCH_WANT_SYS_SGETMASK
2516
2517 /*
2518  * For backwards compatibility.  Functionality superseded by sigprocmask.
2519  */
2520 asmlinkage long
2521 sys_sgetmask(void)
2522 {
2523         /* SMP safe */
2524         return current->blocked.sig[0];
2525 }
2526
2527 asmlinkage long
2528 sys_ssetmask(int newmask)
2529 {
2530         int old;
2531
2532         spin_lock_irq(&current->sighand->siglock);
2533         old = current->blocked.sig[0];
2534
2535         siginitset(&current->blocked, newmask & ~(sigmask(SIGKILL)|
2536                                                   sigmask(SIGSTOP)));
2537         recalc_sigpending();
2538         spin_unlock_irq(&current->sighand->siglock);
2539
2540         return old;
2541 }
2542 #endif /* __ARCH_WANT_SGETMASK */
2543
2544 #ifdef __ARCH_WANT_SYS_SIGNAL
2545 /*
2546  * For backwards compatibility.  Functionality superseded by sigaction.
2547  */
2548 asmlinkage unsigned long
2549 sys_signal(int sig, __sighandler_t handler)
2550 {
2551         struct k_sigaction new_sa, old_sa;
2552         int ret;
2553
2554         new_sa.sa.sa_handler = handler;
2555         new_sa.sa.sa_flags = SA_ONESHOT | SA_NOMASK;
2556         sigemptyset(&new_sa.sa.sa_mask);
2557
2558         ret = do_sigaction(sig, &new_sa, &old_sa);
2559
2560         return ret ? ret : (unsigned long)old_sa.sa.sa_handler;
2561 }
2562 #endif /* __ARCH_WANT_SYS_SIGNAL */
2563
2564 #ifdef __ARCH_WANT_SYS_PAUSE
2565
2566 asmlinkage long
2567 sys_pause(void)
2568 {
2569         current->state = TASK_INTERRUPTIBLE;
2570         schedule();
2571         return -ERESTARTNOHAND;
2572 }
2573
2574 #endif
2575
2576 #ifdef __ARCH_WANT_SYS_RT_SIGSUSPEND
2577 asmlinkage long sys_rt_sigsuspend(sigset_t __user *unewset, size_t sigsetsize)
2578 {
2579         sigset_t newset;
2580
2581         /* XXX: Don't preclude handling different sized sigset_t's.  */
2582         if (sigsetsize != sizeof(sigset_t))
2583                 return -EINVAL;
2584
2585         if (copy_from_user(&newset, unewset, sizeof(newset)))
2586                 return -EFAULT;
2587         sigdelsetmask(&newset, sigmask(SIGKILL)|sigmask(SIGSTOP));
2588
2589         spin_lock_irq(&current->sighand->siglock);
2590         current->saved_sigmask = current->blocked;
2591         current->blocked = newset;
2592         recalc_sigpending();
2593         spin_unlock_irq(&current->sighand->siglock);
2594
2595         current->state = TASK_INTERRUPTIBLE;
2596         schedule();
2597         set_thread_flag(TIF_RESTORE_SIGMASK);
2598         return -ERESTARTNOHAND;
2599 }
2600 #endif /* __ARCH_WANT_SYS_RT_SIGSUSPEND */
2601
2602 __attribute__((weak)) const char *arch_vma_name(struct vm_area_struct *vma)
2603 {
2604         return NULL;
2605 }
2606
2607 void __init signals_init(void)
2608 {
2609         sigqueue_cachep = KMEM_CACHE(sigqueue, SLAB_PANIC);
2610 }