diff --git a/kernel/perf_event.c b/kernel/perf_event.c
index 9425c96..e73e53c 100644
--- a/kernel/perf_event.c
+++ b/kernel/perf_event.c
@@ -36,7 +36,7 @@
 /*
  * Each CPU has a list of per CPU events:
  */
-DEFINE_PER_CPU(struct perf_cpu_context, perf_cpu_context);
+static DEFINE_PER_CPU(struct perf_cpu_context, perf_cpu_context);
 
 int perf_max_events __read_mostly = 1;
 static int perf_reserved_percpu __read_mostly;
@@ -338,7 +338,16 @@ list_del_event(struct perf_event *event, struct perf_event_context *ctx)
                event->group_leader->nr_siblings--;
 
        update_event_times(event);
-       event->state = PERF_EVENT_STATE_OFF;
+
+       /*
+        * If event was in error state, then keep it
+        * that way, otherwise bogus counts will be
+        * returned on read(). The only way to get out
+        * of error state is by explicit re-enabling
+        * of the event
+        */
+       if (event->state > PERF_EVENT_STATE_OFF)
+               event->state = PERF_EVENT_STATE_OFF;
 
        /*
         * If this was a group event with sibling events then
@@ -467,7 +476,7 @@ static void perf_event_remove_from_context(struct perf_event *event)
        if (!task) {
                /*
                 * Per cpu events are removed via an smp call and
-                * the removal is always sucessful.
+                * the removal is always successful.
                 */
                smp_call_function_single(event->cpu,
                                         __perf_event_remove_from_context,
@@ -558,7 +567,7 @@ static void __perf_event_disable(void *info)
  * is the current context on this CPU and preemption is disabled,
  * hence we can't get into perf_event_task_sched_out for this context.
  */
-static void perf_event_disable(struct perf_event *event)
+void perf_event_disable(struct perf_event *event)
 {
        struct perf_event_context *ctx = event->ctx;
        struct task_struct *task = ctx->task;
@@ -836,7 +845,7 @@ perf_install_in_context(struct perf_event_context *ctx,
        if (!task) {
                /*
                 * Per cpu events are installed via an smp call and
-                * the install is always sucessful.
+                * the install is always successful.
                 */
                smp_call_function_single(cpu, __perf_install_in_context,
                                         event, 1);
@@ -962,7 +971,7 @@ static void __perf_event_enable(void *info)
  * perf_event_for_each_child or perf_event_for_each as described
  * for perf_event_disable.
  */
-static void perf_event_enable(struct perf_event *event)
+void perf_event_enable(struct perf_event *event)
 {
        struct perf_event_context *ctx = event->ctx;
        struct task_struct *task = ctx->task;
@@ -1570,7 +1579,6 @@ static void
 __perf_event_init_context(struct perf_event_context *ctx,
                            struct task_struct *task)
 {
-       memset(ctx, 0, sizeof(*ctx));
        spin_lock_init(&ctx->lock);
        mutex_init(&ctx->mutex);
        INIT_LIST_HEAD(&ctx->group_list);
@@ -1645,7 +1653,7 @@ static struct perf_event_context *find_get_context(pid_t pid, int cpu)
        }
 
        if (!ctx) {
-               ctx = kmalloc(sizeof(struct perf_event_context), GFP_KERNEL);
+               ctx = kzalloc(sizeof(struct perf_event_context), GFP_KERNEL);
                err = -ENOMEM;
                if (!ctx)
                        goto errout;
@@ -1831,7 +1839,7 @@ static int perf_event_read_group(struct perf_event *event,
 
                size = n * sizeof(u64);
 
-               if (copy_to_user(buf + size, values, size)) {
+               if (copy_to_user(buf + ret, values, size)) {
                        ret = -EFAULT;
                        goto unlock;
                }
@@ -2201,6 +2209,7 @@ static void perf_mmap_data_free(struct perf_mmap_data *data)
        perf_mmap_free_page((unsigned long)data->user_page);
        for (i = 0; i < data->nr_pages; i++)
                perf_mmap_free_page((unsigned long)data->data_pages[i]);
+       kfree(data);
 }
 
 #else
@@ -2241,6 +2250,7 @@ static void perf_mmap_data_free_work(struct work_struct *work)
                perf_mmap_unmark_page(base + (i * PAGE_SIZE));
 
        vfree(base);
+       kfree(data);
 }
 
 static void perf_mmap_data_free(struct perf_mmap_data *data)
@@ -2346,7 +2356,6 @@ static void perf_mmap_data_free_rcu(struct rcu_head *rcu_head)
 
        data = container_of(rcu_head, struct perf_mmap_data, rcu_head);
        perf_mmap_data_free(data);
-       kfree(data);
 }
 
 static void perf_mmap_data_release(struct perf_event *event)
@@ -3914,7 +3923,7 @@ void perf_swevent_put_recursion_context(int rctx)
 {
        struct perf_cpu_context *cpuctx = &__get_cpu_var(perf_cpu_context);
        barrier();
-       cpuctx->recursion[rctx]++;
+       cpuctx->recursion[rctx]--;
        put_cpu_var(perf_cpu_context);
 }
 EXPORT_SYMBOL_GPL(perf_swevent_put_recursion_context);
@@ -4001,6 +4010,8 @@ static enum hrtimer_restart perf_swevent_hrtimer(struct hrtimer *hrtimer)
        event->pmu->read(event);
 
        data.addr = 0;
+       data.raw = NULL;
+       data.period = event->hw.last_period;
        regs = get_irq_regs();
        /*
         * In case we exclude kernel IPs or are somehow not in interrupt
@@ -4069,8 +4080,7 @@ static void cpu_clock_perf_event_update(struct perf_event *event)
        u64 now;
 
        now = cpu_clock(cpu);
-       prev = atomic64_read(&event->hw.prev_count);
-       atomic64_set(&event->hw.prev_count, now);
+       prev = atomic64_xchg(&event->hw.prev_count, now);
        atomic64_add(now - prev, &event->count);
 }
 
@@ -4275,15 +4285,8 @@ static void bp_perf_event_destroy(struct perf_event *event)
 static const struct pmu *bp_perf_event_init(struct perf_event *bp)
 {
        int err;
-       /*
-        * The breakpoint is already filled if we haven't created the counter
-        * through perf syscall
-        * FIXME: manage to get trigerred to NULL if it comes from syscalls
-        */
-       if (!bp->callback)
-               err = register_perf_hw_breakpoint(bp);
-       else
-               err = __register_perf_hw_breakpoint(bp);
+
+       err = register_perf_hw_breakpoint(bp);
        if (err)
                return ERR_PTR(err);
 
@@ -4297,16 +4300,13 @@ void perf_bp_event(struct perf_event *bp, void *data)
        struct perf_sample_data sample;
        struct pt_regs *regs = data;
 
+       sample.raw = NULL;
        sample.addr = bp->attr.bp_addr;
 
        if (!perf_exclude_event(bp, regs))
                perf_swevent_add(bp, 1, 1, &sample, regs);
 }
 #else
-static void bp_perf_event_destroy(struct perf_event *event)
-{
-}
-
 static const struct pmu *bp_perf_event_init(struct perf_event *bp)
 {
        return NULL;
@@ -4383,7 +4383,7 @@ perf_event_alloc(struct perf_event_attr *attr,
                   struct perf_event_context *ctx,
                   struct perf_event *group_leader,
                   struct perf_event *parent_event,
-                  perf_callback_t callback,
+                  perf_overflow_handler_t overflow_handler,
                   gfp_t gfpflags)
 {
        const struct pmu *pmu;
@@ -4426,10 +4426,10 @@ perf_event_alloc(struct perf_event_attr *attr,
 
        event->state            = PERF_EVENT_STATE_INACTIVE;
 
-       if (!callback && parent_event)
-               callback = parent_event->callback;
+       if (!overflow_handler && parent_event)
+               overflow_handler = parent_event->overflow_handler;
        
-       event->callback = callback;
+       event->overflow_handler = overflow_handler;
 
        if (attr->disabled)
                event->state = PERF_EVENT_STATE_OFF;
@@ -4769,7 +4769,8 @@ err_put_context:
  */
 struct perf_event *
 perf_event_create_kernel_counter(struct perf_event_attr *attr, int cpu,
-                                pid_t pid, perf_callback_t callback)
+                                pid_t pid,
+                                perf_overflow_handler_t overflow_handler)
 {
        struct perf_event *event;
        struct perf_event_context *ctx;
@@ -4780,14 +4781,17 @@ perf_event_create_kernel_counter(struct perf_event_attr *attr, int cpu,
         */
 
        ctx = find_get_context(pid, cpu);
-       if (IS_ERR(ctx))
-               return NULL;
+       if (IS_ERR(ctx)) {
+               err = PTR_ERR(ctx);
+               goto err_exit;
+       }
 
        event = perf_event_alloc(attr, cpu, ctx, NULL,
-                                    NULL, callback, GFP_KERNEL);
-       err = PTR_ERR(event);
-       if (IS_ERR(event))
+                                NULL, overflow_handler, GFP_KERNEL);
+       if (IS_ERR(event)) {
+               err = PTR_ERR(event);
                goto err_put_context;
+       }
 
        event->filp = NULL;
        WARN_ON_ONCE(ctx->parent_ctx);
@@ -4804,11 +4808,10 @@ perf_event_create_kernel_counter(struct perf_event_attr *attr, int cpu,
 
        return event;
 
-err_put_context:
-       if (err < 0)
-               put_ctx(ctx);
-
-       return NULL;
+ err_put_context:
+       put_ctx(ctx);
+ err_exit:
+       return ERR_PTR(err);
 }
 EXPORT_SYMBOL_GPL(perf_event_create_kernel_counter);
 
@@ -5081,7 +5084,7 @@ again:
  */
 int perf_event_init_task(struct task_struct *child)
 {
-       struct perf_event_context *child_ctx, *parent_ctx;
+       struct perf_event_context *child_ctx = NULL, *parent_ctx;
        struct perf_event_context *cloned_ctx;
        struct perf_event *event;
        struct task_struct *parent = current;
@@ -5097,20 +5100,6 @@ int perf_event_init_task(struct task_struct *child)
                return 0;
 
        /*
-        * This is executed from the parent task context, so inherit
-        * events that have been marked for cloning.
-        * First allocate and initialize a context for the child.
-        */
-
-       child_ctx = kmalloc(sizeof(struct perf_event_context), GFP_KERNEL);
-       if (!child_ctx)
-               return -ENOMEM;
-
-       __perf_event_init_context(child_ctx, child);
-       child->perf_event_ctxp = child_ctx;
-       get_task_struct(child);
-
-       /*
         * If the parent's context is a clone, pin it so it won't get
         * swapped under us.
         */
@@ -5140,6 +5129,26 @@ int perf_event_init_task(struct task_struct *child)
                        continue;
                }
 
+               if (!child->perf_event_ctxp) {
+                       /*
+                        * This is executed from the parent task context, so
+                        * inherit events that have been marked for cloning.
+                        * First allocate and initialize a context for the
+                        * child.
+                        */
+
+                       child_ctx = kzalloc(sizeof(struct perf_event_context),
+                                           GFP_KERNEL);
+                       if (!child_ctx) {
+                               ret = -ENOMEM;
+                               goto exit;
+                       }
+
+                       __perf_event_init_context(child_ctx, child);
+                       child->perf_event_ctxp = child_ctx;
+                       get_task_struct(child);
+               }
+
                ret = inherit_group(event, parent, parent_ctx,
                                             child, child_ctx);
                if (ret) {
@@ -5168,6 +5177,7 @@ int perf_event_init_task(struct task_struct *child)
                get_ctx(child_ctx->parent_ctx);
        }
 
+exit:
        mutex_unlock(&parent_ctx->mutex);
 
        perf_unpin_context(parent_ctx);
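
Note on the perf_event_create_kernel_counter() hunks above: the function now
reports failure with ERR_PTR(err) instead of returning NULL, so in-kernel
users must test the result with IS_ERR() rather than a NULL check. Below is a
minimal sketch of a hypothetical caller, assuming the post-patch signature
(attr, cpu, pid, overflow_handler); create_cycle_counter_on() is illustrative
only and not part of this patch.

	#include <linux/perf_event.h>
	#include <linux/err.h>

	/*
	 * Hypothetical helper: create a per-CPU cycle counter on @cpu.
	 * pid == -1 requests a per-CPU (rather than per-task) context,
	 * and a NULL overflow handler is allowed by perf_event_alloc().
	 */
	static struct perf_event *create_cycle_counter_on(int cpu)
	{
		struct perf_event_attr attr = {
			.type	= PERF_TYPE_HARDWARE,
			.config	= PERF_COUNT_HW_CPU_CYCLES,
			.size	= sizeof(struct perf_event_attr),
		};
		struct perf_event *event;

		event = perf_event_create_kernel_counter(&attr, cpu, -1, NULL);

		/* After this patch: failure is ERR_PTR(err), never NULL */
		if (IS_ERR(event)) {
			pr_warn("cycle counter on cpu %d failed: %ld\n",
				cpu, PTR_ERR(event));
			return NULL;	/* or propagate PTR_ERR(event) */
		}

		return event;
	}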