perf: Do the big rename: Performance Counters -> Performance Events

[safe/jmp/linux-2.6] / include / linux / sched.h
diff --git a/include/linux/sched.h b/include/linux/sched.h

index 2c36f62..8b265a8 100644 (file)
--- a/include/linux/sched.h
+++ b/include/linux/sched.h
@@ -38,6 +38,8 @@
  #define SCHED_BATCH            3
  /* SCHED_ISO: reserved but not implemented yet */
  #define SCHED_IDLE             5
+/* Can be ORed in to make sure the process is reverted back to SCHED_NORMAL on fork */
+#define SCHED_RESET_ON_FORK     0x40000000
  
  #ifdef __KERNEL__
  
@@ -68,7 +70,7 @@ struct sched_param {
  #include <linux/smp.h>
  #include <linux/sem.h>
  #include <linux/signal.h>
-#include <linux/fs_struct.h>
+#include <linux/path.h>
  #include <linux/compiler.h>
  #include <linux/completion.h>
  #include <linux/pid.h>
@@ -77,6 +79,7 @@ struct sched_param {
  #include <linux/proportions.h>
  #include <linux/seccomp.h>
  #include <linux/rcupdate.h>
+#include <linux/rculist.h>
  #include <linux/rtmutex.h>
  
  #include <linux/time.h>
@@ -91,12 +94,13 @@ struct sched_param {
  
  #include <asm/processor.h>
  
-struct mem_cgroup;
  struct exec_domain;
  struct futex_pi_state;
  struct robust_list_head;
  struct bio;
-struct bts_tracer;
+struct fs_struct;
+struct bts_context;
+struct perf_event_context;
  
  /*
   * List of flags we want to share for kernel threads,
@@ -115,6 +119,7 @@ struct bts_tracer;
   *    11 bit fractions.
   */
  extern unsigned long avenrun[];                /* Load averages */
+extern void get_avenrun(unsigned long *loads, unsigned long offset, int shift);
  
  #define FSHIFT         11              /* nr of bits of precision */
  #define FIXED_1                (1<<FSHIFT)     /* 1.0 as fixed-point */
@@ -134,8 +139,11 @@ DECLARE_PER_CPU(unsigned long, process_counts);
  extern int nr_processes(void);
  extern unsigned long nr_running(void);
  extern unsigned long nr_uninterruptible(void);
-extern unsigned long nr_active(void);
  extern unsigned long nr_iowait(void);
+extern void calc_global_load(void);
+extern u64 cpu_nr_migrations(int cpu);
+
+extern unsigned long get_parent_ip(unsigned long addr);
  
  struct seq_file;
  struct cfs_rq;
@@ -182,6 +190,7 @@ extern unsigned long long time_sync_thresh;
  /* in tsk->state again */
  #define TASK_DEAD              64
  #define TASK_WAKEKILL          128
+#define TASK_WAKING            256
  
  /* Convenience macros for the sake of set_task_state */
  #define TASK_KILLABLE          (TASK_WAKEKILL | TASK_UNINTERRUPTIBLE)
@@ -202,7 +211,8 @@ extern unsigned long long time_sync_thresh;
  #define task_is_stopped_or_traced(task)        \
                         ((task->state & (__TASK_STOPPED | __TASK_TRACED)) != 0)
  #define task_contributes_to_load(task) \
-                               ((task->state & TASK_UNINTERRUPTIBLE) != 0)
+                               ((task->state & TASK_UNINTERRUPTIBLE) != 0 && \
+                                (task->flags & PF_FREEZING) == 0)
  
  #define __set_task_state(tsk, state_value)             \
         do { (tsk)->state = (state_value); } while (0)
@@ -253,6 +263,7 @@ extern void task_rq_unlock_wait(struct task_struct *p);
  extern cpumask_var_t nohz_cpu_mask;
  #if defined(CONFIG_SMP) && defined(CONFIG_NO_HZ)
  extern int select_nohz_load_balancer(int cpu);
+extern int get_nohz_load_balancer(void);
  #else
  static inline int select_nohz_load_balancer(int cpu)
  {
@@ -297,17 +308,11 @@ extern int proc_dosoftlockup_thresh(struct ctl_table *table, int write,
                                     struct file *filp, void __user *buffer,
                                     size_t *lenp, loff_t *ppos);
  extern unsigned int  softlockup_panic;
-extern unsigned long sysctl_hung_task_check_count;
-extern unsigned long sysctl_hung_task_timeout_secs;
-extern unsigned long sysctl_hung_task_warnings;
  extern int softlockup_thresh;
  #else
  static inline void softlockup_tick(void)
  {
  }
-static inline void spawn_softlockup_task(void)
-{
-}
  static inline void touch_softlockup_watchdog(void)
  {
  }
@@ -316,6 +321,15 @@ static inline void touch_all_softlockup_watchdogs(void)
  }
  #endif
  
+#ifdef CONFIG_DETECT_HUNG_TASK
+extern unsigned int  sysctl_hung_task_panic;
+extern unsigned long sysctl_hung_task_check_count;
+extern unsigned long sysctl_hung_task_timeout_secs;
+extern unsigned long sysctl_hung_task_warnings;
+extern int proc_dohung_task_timeout_secs(struct ctl_table *table, int write,
+                                        struct file *filp, void __user *buffer,
+                                        size_t *lenp, loff_t *ppos);
+#endif
  
  /* Attach to any functions which should be ignored in wchan output. */
  #define __sched                __attribute__((__section__(".sched.text")))
@@ -331,13 +345,27 @@ extern signed long schedule_timeout(signed long timeout);
  extern signed long schedule_timeout_interruptible(signed long timeout);
  extern signed long schedule_timeout_killable(signed long timeout);
  extern signed long schedule_timeout_uninterruptible(signed long timeout);
+asmlinkage void __schedule(void);
  asmlinkage void schedule(void);
+extern int mutex_spin_on_owner(struct mutex *lock, struct thread_info *owner);
  
  struct nsproxy;
  struct user_namespace;
  
-/* Maximum number of active map areas.. This is a random (large) number */
-#define DEFAULT_MAX_MAP_COUNT  65536
+/*
+ * Default maximum number of active map areas, this limits the number of vmas
+ * per mm struct. Users can overwrite this number by sysctl but there is a
+ * problem.
+ *
+ * When a program's coredump is generated in ELF format, a section is created
+ * per vma. In ELF, the number of sections is represented as an unsigned short.
+ * This means the number of sections should be smaller than 65535 at coredump.
+ * Because the kernel adds some informative sections to the image of the program
+ * when generating a coredump, we need some margin. The number of extra sections
+ * is 1-3 now and depends on arch. We use "5" as a safe margin here.
+ */
+#define MAPCOUNT_ELF_CORE_MARGIN       (5)
+#define DEFAULT_MAX_MAP_COUNT  (USHORT_MAX - MAPCOUNT_ELF_CORE_MARGIN)
  
  extern int sysctl_max_map_count;
  
@@ -389,8 +417,15 @@ extern void arch_unmap_area_topdown(struct mm_struct *, unsigned long);
                 (mm)->hiwater_vm = (mm)->total_vm;      \
  } while (0)
  
-#define get_mm_hiwater_rss(mm) max((mm)->hiwater_rss, get_mm_rss(mm))
-#define get_mm_hiwater_vm(mm)  max((mm)->hiwater_vm, (mm)->total_vm)
+static inline unsigned long get_mm_hiwater_rss(struct mm_struct *mm)
+{
+       return max(mm->hiwater_rss, get_mm_rss(mm));
+}
+
+static inline unsigned long get_mm_hiwater_vm(struct mm_struct *mm)
+{
+       return max(mm->hiwater_vm, mm->total_vm);
+}
  
  extern void set_dumpable(struct mm_struct *mm, int value);
  extern int get_dumpable(struct mm_struct *mm);
@@ -466,6 +501,15 @@ struct task_cputime {
                 .sum_exec_runtime = 0,                          \
         }
  
+/*
+ * Disable preemption until the scheduler is running.
+ * Reset by start_kernel()->sched_init()->init_idle().
+ *
+ * We include PREEMPT_ACTIVE to prevent cond_resched() from working
+ * before the scheduler is active -- see should_resched().
+ */
+#define INIT_PREEMPT_COUNT     (1 + PREEMPT_ACTIVE)
+
  /**
   * struct thread_group_cputimer - thread group interval timer counts
   * @cputime:           thread group interval timers.
@@ -538,25 +582,8 @@ struct signal_struct {
  
         struct list_head cpu_timers[3];
  
-       /* job control IDs */
-
-       /*
-        * pgrp and session fields are deprecated.
-        * use the task_session_Xnr and task_pgrp_Xnr routines below
-        */
-
-       union {
-               pid_t pgrp __deprecated;
-               pid_t __pgrp;
-       };
-
         struct pid *tty_old_pgrp;
  
-       union {
-               pid_t session __deprecated;
-               pid_t __session;
-       };
-
         /* boolean value for session group leader */
         int leader;
  
@@ -670,9 +697,13 @@ struct user_struct {
         struct task_group *tg;
  #ifdef CONFIG_SYSFS
         struct kobject kobj;
-       struct work_struct work;
+       struct delayed_work work;
  #endif
  #endif
+
+#ifdef CONFIG_PERF_EVENTS
+       atomic_long_t locked_vm;
+#endif
  };
  
  extern int uids_sysfs_init(void);
@@ -768,18 +799,19 @@ enum cpu_idle_type {
  #define SCHED_LOAD_SCALE_FUZZ  SCHED_LOAD_SCALE
  
  #ifdef CONFIG_SMP
-#define SD_LOAD_BALANCE                1       /* Do load balancing on this domain. */
-#define SD_BALANCE_NEWIDLE     2       /* Balance when about to become idle */
-#define SD_BALANCE_EXEC                4       /* Balance on exec */
-#define SD_BALANCE_FORK                8       /* Balance on fork, clone */
-#define SD_WAKE_IDLE           16      /* Wake to idle CPU on task wakeup */
-#define SD_WAKE_AFFINE         32      /* Wake task to waking CPU */
-#define SD_WAKE_BALANCE                64      /* Perform balancing at task wakeup */
-#define SD_SHARE_CPUPOWER      128     /* Domain members share cpu power */
-#define SD_POWERSAVINGS_BALANCE        256     /* Balance for power savings */
-#define SD_SHARE_PKG_RESOURCES 512     /* Domain members share cpu pkg resources */
-#define SD_SERIALIZE           1024    /* Only a single load balancing instance */
-#define SD_WAKE_IDLE_FAR       2048    /* Gain latency sacrificing cache hit */
+#define SD_LOAD_BALANCE                0x0001  /* Do load balancing on this domain. */
+#define SD_BALANCE_NEWIDLE     0x0002  /* Balance when about to become idle */
+#define SD_BALANCE_EXEC                0x0004  /* Balance on exec */
+#define SD_BALANCE_FORK                0x0008  /* Balance on fork, clone */
+#define SD_BALANCE_WAKE                0x0010  /* Balance on wakeup */
+#define SD_WAKE_AFFINE         0x0020  /* Wake task to waking CPU */
+#define SD_PREFER_LOCAL                0x0040  /* Prefer to keep tasks local to this domain */
+#define SD_SHARE_CPUPOWER      0x0080  /* Domain members share cpu power */
+#define SD_POWERSAVINGS_BALANCE        0x0100  /* Balance for power savings */
+#define SD_SHARE_PKG_RESOURCES 0x0200  /* Domain members share cpu pkg resources */
+#define SD_SERIALIZE           0x0400  /* Only a single load balancing instance */
+
+#define SD_PREFER_SIBLING      0x1000  /* Prefer to place tasks in a sibling domain */
  
  enum powersavings_balance_level {
         POWERSAVINGS_BALANCE_NONE = 0,  /* No power saving load balance */
@@ -799,7 +831,7 @@ static inline int sd_balance_for_mc_power(void)
         if (sched_smt_power_savings)
                 return SD_POWERSAVINGS_BALANCE;
  
-       return 0;
+       return SD_PREFER_SIBLING;
  }
  
  static inline int sd_balance_for_package_power(void)
@@ -807,7 +839,7 @@ static inline int sd_balance_for_package_power(void)
         if (sched_mc_power_savings | sched_smt_power_savings)
                 return SD_POWERSAVINGS_BALANCE;
  
-       return 0;
+       return SD_PREFER_SIBLING;
  }
  
  /*
@@ -829,17 +861,21 @@ struct sched_group {
  
         /*
          * CPU power of this group, SCHED_LOAD_SCALE being max power for a
-        * single CPU. This is read only (except for setup, hotplug CPU).
-        * Note : Never change cpu_power without recompute its reciprocal
+        * single CPU.
          */
-       unsigned int __cpu_power;
+       unsigned int cpu_power;
+
         /*
-        * reciprocal value of cpu_power to avoid expensive divides
-        * (see include/linux/reciprocal_div.h)
+        * The CPUs this group covers.
+        *
+        * NOTE: this field is variable length. (Allocated dynamically
+        * by attaching extra space to the end of the structure,
+        * depending on how many CPUs the kernel has booted up with)
+        *
+        * It is also embedded into static data structures at build
+        * time. (See 'struct static_sched_group' in kernel/sched.c)
          */
-       u32 reciprocal_cpu_power;
-
-       unsigned long cpumask[];
+       unsigned long cpumask[0];
  };
  
  static inline struct cpumask *sched_group_cpus(struct sched_group *sg)
@@ -880,6 +916,7 @@ struct sched_domain {
         unsigned int newidle_idx;
         unsigned int wake_idx;
         unsigned int forkexec_idx;
+       unsigned int smt_gain;
         int flags;                      /* See SD_* */
         enum sched_domain_level level;
  
@@ -925,8 +962,17 @@ struct sched_domain {
         char *name;
  #endif
  
-       /* span of all CPUs in this domain */
-       unsigned long span[];
+       /*
+        * Span of all CPUs in this domain.
+        *
+        * NOTE: this field is variable length. (Allocated dynamically
+        * by attaching extra space to the end of the structure,
+        * depending on how many CPUs the kernel has booted up with)
+        *
+        * It is also embedded into static data structures at build
+        * time. (See 'struct static_sched_domain' in kernel/sched.c)
+        */
+       unsigned long span[0];
  };
  
  static inline struct cpumask *sched_domain_span(struct sched_domain *sd)
@@ -946,6 +992,9 @@ static inline int test_sd_parent(struct sched_domain *sd, int flag)
         return 0;
  }
  
+unsigned long default_scale_freq_power(struct sched_domain *sd, int cpu);
+unsigned long default_scale_smt_power(struct sched_domain *sd, int cpu);
+
  #else /* CONFIG_SMP */
  
  struct sched_domain_attr;
@@ -957,6 +1006,7 @@ partition_sched_domains(int ndoms_new, struct cpumask *doms_new,
  }
  #endif /* !CONFIG_SMP */
  
+
  struct io_context;                     /* See blkdev.h */
  
  
@@ -974,6 +1024,12 @@ struct uts_namespace;
  struct rq;
  struct sched_domain;
  
+/*
+ * wake flags
+ */
+#define WF_SYNC                0x01            /* waker goes to sleep after wakeup */
+#define WF_FORK                0x02            /* child wakeup after fork */
+
  struct sched_class {
         const struct sched_class *next;
  
@@ -981,13 +1037,13 @@ struct sched_class {
         void (*dequeue_task) (struct rq *rq, struct task_struct *p, int sleep);
         void (*yield_task) (struct rq *rq);
  
-       void (*check_preempt_curr) (struct rq *rq, struct task_struct *p, int sync);
+       void (*check_preempt_curr) (struct rq *rq, struct task_struct *p, int flags);
  
         struct task_struct * (*pick_next_task) (struct rq *rq);
         void (*put_prev_task) (struct rq *rq, struct task_struct *p);
  
  #ifdef CONFIG_SMP
-       int  (*select_task_rq)(struct task_struct *p, int sync);
+       int  (*select_task_rq)(struct task_struct *p, int sd_flag, int flags);
  
         unsigned long (*load_balance) (struct rq *this_rq, int this_cpu,
                         struct rq *busiest, unsigned long max_load_move,
@@ -1052,11 +1108,20 @@ struct sched_entity {
         u64                     last_wakeup;
         u64                     avg_overlap;
  
+       u64                     nr_migrations;
+
+       u64                     start_runtime;
+       u64                     avg_wakeup;
+
+       u64                     avg_running;
+
  #ifdef CONFIG_SCHEDSTATS
         u64                     wait_start;
         u64                     wait_max;
         u64                     wait_count;
         u64                     wait_sum;
+       u64                     iowait_count;
+       u64                     iowait_sum;
  
         u64                     sleep_start;
         u64                     sleep_max;
@@ -1067,7 +1132,6 @@ struct sched_entity {
         u64                     exec_max;
         u64                     slice_max;
  
-       u64                     nr_migrations;
         u64                     nr_migrations_cold;
         u64                     nr_failed_migrations_affine;
         u64                     nr_failed_migrations_running;
@@ -1111,6 +1175,8 @@ struct sched_rt_entity {
  #endif
  };
  
+struct rcu_node;
+
  struct task_struct {
         volatile long state;    /* -1 unrunnable, 0 runnable, >0 stopped */
         void *stack;
@@ -1154,16 +1220,19 @@ struct task_struct {
         unsigned int policy;
         cpumask_t cpus_allowed;
  
-#ifdef CONFIG_PREEMPT_RCU
+#ifdef CONFIG_TREE_PREEMPT_RCU
         int rcu_read_lock_nesting;
-       int rcu_flipctr_idx;
-#endif /* #ifdef CONFIG_PREEMPT_RCU */
+       char rcu_read_unlock_special;
+       struct rcu_node *rcu_blocked_node;
+       struct list_head rcu_node_entry;
+#endif /* #ifdef CONFIG_TREE_PREEMPT_RCU */
  
  #if defined(CONFIG_SCHEDSTATS) || defined(CONFIG_TASK_DELAY_ACCT)
         struct sched_info sched_info;
  #endif
  
         struct list_head tasks;
+       struct plist_node pushable_tasks;
  
         struct mm_struct *mm, *active_mm;
  
@@ -1177,6 +1246,12 @@ struct task_struct {
         unsigned did_exec:1;
         unsigned in_execve:1;   /* Tell the LSMs that the process is doing an
                                  * execve */
+       unsigned in_iowait:1;
+
+
+       /* Revert to default priority/policy when forking */
+       unsigned sched_reset_on_fork:1;
+
         pid_t pid;
         pid_t tgid;
  
@@ -1184,6 +1259,7 @@ struct task_struct {
         /* Canary value for the -fstack-protector gcc feature */
         unsigned long stack_canary;
  #endif
+
         /* 
          * pointers to (original) parent process, youngest child, younger sibling,
          * older sibling, respectively.  (p->father can be replaced with 
@@ -1206,18 +1282,11 @@ struct task_struct {
         struct list_head ptraced;
         struct list_head ptrace_entry;
  
-#ifdef CONFIG_X86_PTRACE_BTS
         /*
          * This is the tracer handle for the ptrace BTS extension.
          * This field actually belongs to the ptracer task.
          */
-       struct bts_tracer *bts;
-       /*
-        * The buffer to hold the BTS data.
-        */
-       void *bts_buffer;
-       size_t bts_size;
-#endif /* CONFIG_X86_PTRACE_BTS */
+       struct bts_context *bts;
  
         /* PID/PID hash table linkage. */
         struct pid_link pids[PIDTYPE_MAX];
@@ -1244,7 +1313,10 @@ struct task_struct {
                                          * credentials (COW) */
         const struct cred *cred;        /* effective (overridable) subjective task
                                          * credentials (COW) */
-       struct mutex cred_exec_mutex;   /* execve vs ptrace cred calculation mutex */
+       struct mutex cred_guard_mutex;  /* guard against foreign influences on
+                                        * credential calculations
+                                        * (notably, ptrace) */
+       struct cred *replacement_session_keyring; /* for KEYCTL_SESSION_TO_PARENT */
  
         char comm[TASK_COMM_LEN]; /* executable name excluding path
                                      - access with [gs]et_task_comm (which lock
@@ -1256,9 +1328,8 @@ struct task_struct {
  /* ipc stuff */
         struct sysv_sem sysvsem;
  #endif
-#ifdef CONFIG_DETECT_SOFTLOCKUP
+#ifdef CONFIG_DETECT_HUNG_TASK
  /* hung task detection */
-       unsigned long last_switch_timestamp;
         unsigned long last_switch_count;
  #endif
  /* CPU-specific state of this task */
@@ -1292,9 +1363,15 @@ struct task_struct {
  /* Thread group tracking */
         u32 parent_exec_id;
         u32 self_exec_id;
-/* Protection of (de-)allocation: mm, files, fs, tty, keyrings */
+/* Protection of (de-)allocation: mm, files, fs, tty, keyrings, mems_allowed,
+ * mempolicy */
         spinlock_t alloc_lock;
  
+#ifdef CONFIG_GENERIC_HARDIRQS
+       /* IRQ handler threads */
+       struct irqaction *irqaction;
+#endif
+
         /* Protection of the PI data structures: */
         spinlock_t pi_lock;
  
@@ -1330,6 +1407,7 @@ struct task_struct {
         int lockdep_depth;
         unsigned int lockdep_recursion;
         struct held_lock held_locks[MAX_LOCK_DEPTH];
+       gfp_t lockdep_reclaim_gfp;
  #endif
  
  /* journalling filesystem info */
@@ -1354,8 +1432,7 @@ struct task_struct {
         cputime_t acct_timexpd; /* stime + utime since last update */
  #endif
  #ifdef CONFIG_CPUSETS
-       nodemask_t mems_allowed;
-       int cpuset_mems_generation;
+       nodemask_t mems_allowed;        /* Protected by alloc_lock */
         int cpuset_mem_spread_rotor;
  #endif
  #ifdef CONFIG_CGROUPS
@@ -1372,8 +1449,13 @@ struct task_struct {
         struct list_head pi_state_list;
         struct futex_pi_state *pi_state_cache;
  #endif
+#ifdef CONFIG_PERF_EVENTS
+       struct perf_event_context *perf_event_ctxp;
+       struct mutex perf_event_mutex;
+       struct list_head perf_event_list;
+#endif
  #ifdef CONFIG_NUMA
-       struct mempolicy *mempolicy;
+       struct mempolicy *mempolicy;    /* Protected by alloc_lock */
         short il_next;
  #endif
         atomic_t fs_excl;       /* holding fs exclusive resources */
@@ -1407,6 +1489,8 @@ struct task_struct {
         int curr_ret_stack;
         /* Stack of return addresses for return function tracing */
         struct ftrace_ret_stack *ret_stack;
+       /* time stamp for last schedule */
+       unsigned long long ftrace_timestamp;
         /*
          * Number of functions that haven't been traced
          * because of depth overrun.
@@ -1418,7 +1502,9 @@ struct task_struct {
  #ifdef CONFIG_TRACING
         /* state flags for use by tracers */
         unsigned long trace;
-#endif
+       /* bitmask of trace recursion */
+       unsigned long trace_recursion;
+#endif /* CONFIG_TRACING */
  };
  
  /* Future-safe accessor for struct task_struct's cpus_allowed. */
@@ -1455,16 +1541,6 @@ static inline int rt_task(struct task_struct *p)
         return rt_prio(p->prio);
  }
  
-static inline void set_task_session(struct task_struct *tsk, pid_t session)
-{
-       tsk->signal->__session = session;
-}
-
-static inline void set_task_pgrp(struct task_struct *tsk, pid_t pgrp)
-{
-       tsk->signal->__pgrp = pgrp;
-}
-
  static inline struct pid *task_pid(struct task_struct *task)
  {
         return task->pids[PIDTYPE_PID].pid;
@@ -1475,6 +1551,11 @@ static inline struct pid *task_tgid(struct task_struct *task)
         return task->group_leader->pids[PIDTYPE_PID].pid;
  }
  
+/*
+ * Without tasklist or rcu lock it is not safe to dereference
+ * the result of task_pgrp/task_session even if task == current,
+ * we can race with another thread doing sys_setsid/sys_setpgid.
+ */
  static inline struct pid *task_pgrp(struct task_struct *task)
  {
         return task->group_leader->pids[PIDTYPE_PGID].pid;
@@ -1500,17 +1581,23 @@ struct pid_namespace;
   *
   * see also pid_nr() etc in include/linux/pid.h
   */
+pid_t __task_pid_nr_ns(struct task_struct *task, enum pid_type type,
+                       struct pid_namespace *ns);
  
  static inline pid_t task_pid_nr(struct task_struct *tsk)
  {
         return tsk->pid;
  }
  
-pid_t task_pid_nr_ns(struct task_struct *tsk, struct pid_namespace *ns);
+static inline pid_t task_pid_nr_ns(struct task_struct *tsk,
+                                       struct pid_namespace *ns)
+{
+       return __task_pid_nr_ns(tsk, PIDTYPE_PID, ns);
+}
  
  static inline pid_t task_pid_vnr(struct task_struct *tsk)
  {
-       return pid_vnr(task_pid(tsk));
+       return __task_pid_nr_ns(tsk, PIDTYPE_PID, NULL);
  }
  
  
@@ -1527,31 +1614,34 @@ static inline pid_t task_tgid_vnr(struct task_struct *tsk)
  }
  
  
-static inline pid_t task_pgrp_nr(struct task_struct *tsk)
+static inline pid_t task_pgrp_nr_ns(struct task_struct *tsk,
+                                       struct pid_namespace *ns)
  {
-       return tsk->signal->__pgrp;
+       return __task_pid_nr_ns(tsk, PIDTYPE_PGID, ns);
  }
  
-pid_t task_pgrp_nr_ns(struct task_struct *tsk, struct pid_namespace *ns);
-
  static inline pid_t task_pgrp_vnr(struct task_struct *tsk)
  {
-       return pid_vnr(task_pgrp(tsk));
+       return __task_pid_nr_ns(tsk, PIDTYPE_PGID, NULL);
  }
  
  
-static inline pid_t task_session_nr(struct task_struct *tsk)
+static inline pid_t task_session_nr_ns(struct task_struct *tsk,
+                                       struct pid_namespace *ns)
  {
-       return tsk->signal->__session;
+       return __task_pid_nr_ns(tsk, PIDTYPE_SID, ns);
  }
  
-pid_t task_session_nr_ns(struct task_struct *tsk, struct pid_namespace *ns);
-
  static inline pid_t task_session_vnr(struct task_struct *tsk)
  {
-       return pid_vnr(task_session(tsk));
+       return __task_pid_nr_ns(tsk, PIDTYPE_SID, NULL);
  }
  
+/* obsolete, do not use */
+static inline pid_t task_pgrp_nr(struct task_struct *tsk)
+{
+       return task_pgrp_nr_ns(tsk, &init_pid_ns);
+}
  
  /**
   * pid_alive - check that a task structure is not stale
@@ -1616,6 +1706,7 @@ extern cputime_t task_gtime(struct task_struct *p);
  #define PF_MEMALLOC    0x00000800      /* Allocating memory */
  #define PF_FLUSHER     0x00001000      /* responsible for disk writeback */
  #define PF_USED_MATH   0x00002000      /* if unset the fpu must be initialized before use */
+#define PF_FREEZING    0x00004000      /* freeze in progress. do not account to load */
  #define PF_NOFREEZE    0x00008000      /* this thread should not be frozen */
  #define PF_FROZEN      0x00010000      /* frozen for system suspend */
  #define PF_FSTRANS     0x00020000      /* inside a filesystem transaction */
@@ -1658,6 +1749,28 @@ extern cputime_t task_gtime(struct task_struct *p);
  #define tsk_used_math(p) ((p)->flags & PF_USED_MATH)
  #define used_math() tsk_used_math(current)
  
+#ifdef CONFIG_TREE_PREEMPT_RCU
+
+#define RCU_READ_UNLOCK_BLOCKED (1 << 0) /* blocked while in RCU read-side. */
+#define RCU_READ_UNLOCK_NEED_QS (1 << 1) /* RCU core needs CPU response. */
+#define RCU_READ_UNLOCK_GOT_QS  (1 << 2) /* CPU has responded to RCU core. */
+
+static inline void rcu_copy_process(struct task_struct *p)
+{
+       p->rcu_read_lock_nesting = 0;
+       p->rcu_read_unlock_special = 0;
+       p->rcu_blocked_node = NULL;
+       INIT_LIST_HEAD(&p->rcu_node_entry);
+}
+
+#else
+
+static inline void rcu_copy_process(struct task_struct *p)
+{
+}
+
+#endif
+
  #ifdef CONFIG_SMP
  extern int set_cpus_allowed_ptr(struct task_struct *p,
                                 const struct cpumask *new_mask);
@@ -1675,6 +1788,16 @@ static inline int set_cpus_allowed(struct task_struct *p, cpumask_t new_mask)
         return set_cpus_allowed_ptr(p, &new_mask);
  }
  
+/*
+ * Architectures can set this to 1 if they have specified
+ * CONFIG_HAVE_UNSTABLE_SCHED_CLOCK in their arch Kconfig,
+ * but then during bootup it turns out that sched_clock()
+ * is reliable after all:
+ */
+#ifdef CONFIG_HAVE_UNSTABLE_SCHED_CLOCK
+extern int sched_clock_stable;
+#endif
+
  extern unsigned long long sched_clock(void);
  
  extern void sched_clock_init(void);
@@ -1737,16 +1860,29 @@ extern unsigned int sysctl_sched_min_granularity;
  extern unsigned int sysctl_sched_wakeup_granularity;
  extern unsigned int sysctl_sched_shares_ratelimit;
  extern unsigned int sysctl_sched_shares_thresh;
-#ifdef CONFIG_SCHED_DEBUG
  extern unsigned int sysctl_sched_child_runs_first;
+#ifdef CONFIG_SCHED_DEBUG
  extern unsigned int sysctl_sched_features;
  extern unsigned int sysctl_sched_migration_cost;
  extern unsigned int sysctl_sched_nr_migrate;
+extern unsigned int sysctl_sched_time_avg;
+extern unsigned int sysctl_timer_migration;
  
  int sched_nr_latency_handler(struct ctl_table *table, int write,
                 struct file *file, void __user *buffer, size_t *length,
                 loff_t *ppos);
  #endif
+#ifdef CONFIG_SCHED_DEBUG
+static inline unsigned int get_sysctl_timer_migration(void)
+{
+       return sysctl_timer_migration;
+}
+#else
+static inline unsigned int get_sysctl_timer_migration(void)
+{
+       return 1;
+}
+#endif
  extern unsigned int sysctl_sched_rt_period;
  extern int sysctl_sched_rt_runtime;
  
@@ -1813,9 +1949,6 @@ extern struct pid_namespace init_pid_ns;
  /*
   * find a task by one of its numerical ids
   *
- * find_task_by_pid_type_ns():
- *      it is the most generic call - it finds a task by all id,
- *      type and namespace specified
   * find_task_by_pid_ns():
   *      finds a task by its pid in the specified namespace
   * find_task_by_vpid():
@@ -1824,9 +1957,6 @@ extern struct pid_namespace init_pid_ns;
   * see also find_vpid() etc in include/linux/pid.h
   */
  
-extern struct task_struct *find_task_by_pid_type_ns(int type, int pid,
-               struct pid_namespace *ns);
-
  extern struct task_struct *find_task_by_vpid(pid_t nr);
  extern struct task_struct *find_task_by_pid_ns(pid_t nr,
                 struct pid_namespace *ns);
@@ -1861,6 +1991,7 @@ extern void sched_dead(struct task_struct *p);
  
  extern void proc_caches_init(void);
  extern void flush_signals(struct task_struct *);
+extern void __flush_signals(struct task_struct *);
  extern void ignore_signals(struct task_struct *);
  extern void flush_signal_handlers(struct task_struct *, int force_default);
  extern int dequeue_signal(struct task_struct *tsk, sigset_t *mask, siginfo_t *info);
@@ -1951,7 +2082,8 @@ extern void mm_release(struct task_struct *, struct mm_struct *);
  /* Allocate a new mm structure and copy contents from tsk->mm */
  extern struct mm_struct *dup_mm(struct task_struct *tsk);
  
-extern int  copy_thread(int, unsigned long, unsigned long, unsigned long, struct task_struct *, struct pt_regs *);
+extern int copy_thread(unsigned long, unsigned long, unsigned long,
+                       struct task_struct *, struct pt_regs *);
  extern void flush_thread(void);
  extern void exit_thread(void);
  
@@ -1976,8 +2108,10 @@ extern void set_task_comm(struct task_struct *tsk, char *from);
  extern char *get_task_comm(char *to, struct task_struct *tsk);
  
  #ifdef CONFIG_SMP
+extern void wait_task_context_switch(struct task_struct *p);
  extern unsigned long wait_task_inactive(struct task_struct *, long match_state);
  #else
+static inline void wait_task_context_switch(struct task_struct *p) {}
  static inline unsigned long wait_task_inactive(struct task_struct *p,
                                                long match_state)
  {
@@ -1985,12 +2119,13 @@ static inline unsigned long wait_task_inactive(struct task_struct *p,
  }
  #endif
  
-#define next_task(p)   list_entry(rcu_dereference((p)->tasks.next), struct task_struct, tasks)
+#define next_task(p) \
+       list_entry_rcu((p)->tasks.next, struct task_struct, tasks)
  
  #define for_each_process(p) \
         for (p = &init_task ; (p = next_task(p)) != &init_task ; )
  
-extern bool is_single_threaded(struct task_struct *);
+extern bool current_is_single_threaded(void);
  
  /*
   * Careful: do_each_thread/while_each_thread is a double loop so
@@ -2024,8 +2159,8 @@ int same_thread_group(struct task_struct *p1, struct task_struct *p2)
  
  static inline struct task_struct *next_thread(const struct task_struct *p)
  {
-       return list_entry(rcu_dereference(p->thread_group.next),
-                         struct task_struct, thread_group);
+       return list_entry_rcu(p->thread_group.next,
+                             struct task_struct, thread_group);
  }
  
  static inline int thread_group_empty(struct task_struct *p)
@@ -2036,6 +2171,11 @@ static inline int thread_group_empty(struct task_struct *p)
  #define delay_group_leader(p) \
                 (thread_group_leader(p) && !thread_group_empty(p))
  
+static inline int task_detached(struct task_struct *p)
+{
+       return p->exit_signal == -1;
+}
+
  /*
   * Protects ->fs, ->files, ->mm, ->group_info, ->comm, keyring
   * subscriptions and synchronises with wait4().  Also used in procfs.  Also
@@ -2092,6 +2232,19 @@ static inline int object_is_on_stack(void *obj)
  
  extern void thread_info_cache_init(void);
  
+#ifdef CONFIG_DEBUG_STACK_USAGE
+static inline unsigned long stack_not_used(struct task_struct *p)
+{
+       unsigned long *n = end_of_stack(p);
+
+       do {    /* Skip over canary */
+               n++;
+       } while (!*n);
+
+       return (unsigned long)n - (unsigned long)end_of_stack(p);
+}
+#endif
+
  /* set thread flags in other task's structures
   * - see asm/thread_info.h for TIF_xxxx flags available
   */
@@ -2135,6 +2288,12 @@ static inline int test_tsk_need_resched(struct task_struct *tsk)
         return unlikely(test_tsk_thread_flag(tsk,TIF_NEED_RESCHED));
  }
  
+static inline int restart_syscall(void)
+{
+       set_tsk_thread_flag(current, TIF_SIGPENDING);
+       return -ERESTARTNOINTR;
+}
+
  static inline int signal_pending(struct task_struct *p)
  {
         return unlikely(test_tsk_thread_flag(p,TIF_SIGPENDING));
@@ -2170,23 +2329,31 @@ static inline int need_resched(void)
   * cond_resched_softirq() will enable bhs before scheduling.
   */
  extern int _cond_resched(void);
-#ifdef CONFIG_PREEMPT_BKL
-static inline int cond_resched(void)
-{
-       return 0;
-}
+
+#define cond_resched() ({                      \
+       __might_sleep(__FILE__, __LINE__, 0);   \
+       _cond_resched();                        \
+})
+
+extern int __cond_resched_lock(spinlock_t *lock);
+
+#ifdef CONFIG_PREEMPT
+#define PREEMPT_LOCK_OFFSET    PREEMPT_OFFSET
  #else
-static inline int cond_resched(void)
-{
-       return _cond_resched();
-}
+#define PREEMPT_LOCK_OFFSET    0
  #endif
-extern int cond_resched_lock(spinlock_t * lock);
-extern int cond_resched_softirq(void);
-static inline int cond_resched_bkl(void)
-{
-       return _cond_resched();
-}
+
+#define cond_resched_lock(lock) ({                             \
+       __might_sleep(__FILE__, __LINE__, PREEMPT_LOCK_OFFSET); \
+       __cond_resched_lock(lock);                              \
+})
+
+extern int __cond_resched_softirq(void);
+
+#define cond_resched_softirq() ({                              \
+       __might_sleep(__FILE__, __LINE__, SOFTIRQ_OFFSET);      \
+       __cond_resched_softirq();                               \
+})
  
  /*
   * Does a critical section need to be broken due to another
@@ -2345,6 +2512,13 @@ static inline void inc_syscw(struct task_struct *tsk)
  #define TASK_SIZE_OF(tsk)      TASK_SIZE
  #endif
  
+/*
+ * Call the function if the target task is executing on a CPU right now:
+ */
+extern void task_oncpu_function_call(struct task_struct *p,
+                                    void (*func) (void *info), void *info);
+
+
  #ifdef CONFIG_MM_OWNER
  extern void mm_update_next_owner(struct mm_struct *mm);
  extern void mm_init_owner(struct mm_struct *mm, struct task_struct *p);