Release 4.11 drivers/oprofile/buffer_sync.c
/**
* @file buffer_sync.c
*
* @remark Copyright 2002-2009 OProfile authors
* @remark Read the file COPYING
*
* @author John Levon <levon@movementarian.org>
* @author Barry Kasindorf
* @author Robert Richter <robert.richter@amd.com>
*
* This is the core of the buffer management. Each
* CPU buffer is processed and entered into the
* global event buffer. Such processing is necessary
* in several circumstances, mentioned below.
*
* The processing does the job of converting the
* transitory EIP value into a persistent dentry/offset
* value that the profiler can record at its leisure.
*
* See fs/dcookies.c for a description of the dentry/offset
* objects.
*/
#include <linux/file.h>
#include <linux/mm.h>
#include <linux/workqueue.h>
#include <linux/notifier.h>
#include <linux/dcookies.h>
#include <linux/profile.h>
#include <linux/module.h>
#include <linux/fs.h>
#include <linux/oprofile.h>
#include <linux/sched.h>
#include <linux/sched/mm.h>
#include <linux/sched/task.h>
#include <linux/gfp.h>
#include "oprofile_stats.h"
#include "event_buffer.h"
#include "cpu_buffer.h"
#include "buffer_sync.h"
static LIST_HEAD(dying_tasks);
static LIST_HEAD(dead_tasks);
static cpumask_var_t marked_cpus;
static DEFINE_SPINLOCK(task_mortuary);
static void process_task_mortuary(void);
/* Take ownership of the task struct and place it on the
* list for processing. Only after two full buffer syncs
* does the task eventually get freed, because by then
* we are sure we will not reference it again.
* Can be invoked from softirq via RCU callback due to
* call_rcu() of the task struct, hence the _irqsave.
*/
static int
task_free_notify(struct notifier_block *self, unsigned long val, void *data)
{
unsigned long flags;
struct task_struct *task = data;
spin_lock_irqsave(&task_mortuary, flags);
list_add(&task->tasks, &dying_tasks);
spin_unlock_irqrestore(&task_mortuary, flags);
return NOTIFY_OK;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 50 | 83.33% | 2 | 66.67% |
Paul E. McKenney | 10 | 16.67% | 1 | 33.33% |
Total | 60 | 100.00% | 3 | 100.00% |
/* The task is on its way out. A sync of the buffer means we can catch
* any remaining samples for this task.
*/
static int
task_exit_notify(struct notifier_block *self, unsigned long val, void *data)
{
/* To avoid latency problems, we only process the current CPU,
* hoping that most samples for the task are on this CPU
*/
sync_buffer(raw_smp_processor_id());
return 0;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 28 | 96.55% | 2 | 66.67% |
Ingo Molnar | 1 | 3.45% | 1 | 33.33% |
Total | 29 | 100.00% | 3 | 100.00% |
/* The task is about to try a do_munmap(). We peek at what it's going to
* do, and if it's an executable region, process the samples first, so
* we don't lose any. This does not have to be exact, it's a QoI issue
* only.
*/
static int
munmap_notify(struct notifier_block *self, unsigned long val, void *data)
{
unsigned long addr = (unsigned long)data;
struct mm_struct *mm = current->mm;
struct vm_area_struct *mpnt;
down_read(&mm->mmap_sem);
mpnt = find_vma(mm, addr);
if (mpnt && mpnt->vm_file && (mpnt->vm_flags & VM_EXEC)) {
up_read(&mm->mmap_sem);
/* To avoid latency problems, we only process the current CPU,
* hoping that most samples for the task are on this CPU
*/
sync_buffer(raw_smp_processor_id());
return 0;
}
up_read(&mm->mmap_sem);
return 0;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 106 | 99.07% | 2 | 66.67% |
Ingo Molnar | 1 | 0.93% | 1 | 33.33% |
Total | 107 | 100.00% | 3 | 100.00% |
/* We need to be told about new modules so we don't attribute to a previously
* loaded module, or drop the samples on the floor.
*/
static int
module_load_notify(struct notifier_block *self, unsigned long val, void *data)
{
#ifdef CONFIG_MODULES
if (val != MODULE_STATE_COMING)
return 0;
/* FIXME: should we process all CPU buffers ? */
mutex_lock(&buffer_mutex);
add_event_entry(ESCAPE_CODE);
add_event_entry(MODULE_LOADED_CODE);
mutex_unlock(&buffer_mutex);
#endif
return 0;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 55 | 93.22% | 3 | 75.00% |
Markus Armbruster | 4 | 6.78% | 1 | 25.00% |
Total | 59 | 100.00% | 4 | 100.00% |
static struct notifier_block task_free_nb = {
.notifier_call = task_free_notify,
};
static struct notifier_block task_exit_nb = {
.notifier_call = task_exit_notify,
};
static struct notifier_block munmap_nb = {
.notifier_call = munmap_notify,
};
static struct notifier_block module_load_nb = {
.notifier_call = module_load_notify,
};
static void free_all_tasks(void)
{
/* make sure we don't leak task structs */
process_task_mortuary();
process_task_mortuary();
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
Robert Richter | 15 | 100.00% | 1 | 100.00% |
Total | 15 | 100.00% | 1 | 100.00% |
int sync_start(void)
{
int err;
if (!zalloc_cpumask_var(&marked_cpus, GFP_KERNEL))
return -ENOMEM;
err = task_handoff_register(&task_free_nb);
if (err)
goto out1;
err = profile_event_register(PROFILE_TASK_EXIT, &task_exit_nb);
if (err)
goto out2;
err = profile_event_register(PROFILE_MUNMAP, &munmap_nb);
if (err)
goto out3;
err = register_module_notifier(&module_load_nb);
if (err)
goto out4;
start_cpu_work();
out:
return err;
out4:
profile_event_unregister(PROFILE_MUNMAP, &munmap_nb);
out3:
profile_event_unregister(PROFILE_TASK_EXIT, &task_exit_nb);
out2:
task_handoff_unregister(&task_free_nb);
free_all_tasks();
out1:
free_cpumask_var(marked_cpus);
goto out;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 105 | 76.09% | 3 | 37.50% |
Robert Richter | 25 | 18.12% | 3 | 37.50% |
Andrew Morton | 7 | 5.07% | 1 | 12.50% |
Li Zefan | 1 | 0.72% | 1 | 12.50% |
Total | 138 | 100.00% | 8 | 100.00% |
void sync_stop(void)
{
end_cpu_work();
unregister_module_notifier(&module_load_nb);
profile_event_unregister(PROFILE_MUNMAP, &munmap_nb);
profile_event_unregister(PROFILE_TASK_EXIT, &task_exit_nb);
task_handoff_unregister(&task_free_nb);
barrier(); /* do all of the above first */
flush_cpu_work();
free_all_tasks();
free_cpumask_var(marked_cpus);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 37 | 69.81% | 4 | 44.44% |
Robert Richter | 15 | 28.30% | 4 | 44.44% |
Tejun Heo | 1 | 1.89% | 1 | 11.11% |
Total | 53 | 100.00% | 9 | 100.00% |
/* Optimisation. We can manage without taking the dcookie sem
* because we cannot reach this code without at least one
* dcookie user still being registered (namely, the reader
* of the event buffer). */
static inline unsigned long fast_get_dcookie(const struct path *path)
{
unsigned long cookie;
if (path->dentry->d_flags & DCACHE_COOKIE)
return (unsigned long)path->dentry;
get_dcookie(path, &cookie);
return cookie;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 37 | 77.08% | 2 | 40.00% |
Jan Blunck | 7 | 14.58% | 1 | 20.00% |
Nicholas Piggin | 3 | 6.25% | 1 | 20.00% |
Al Viro | 1 | 2.08% | 1 | 20.00% |
Total | 48 | 100.00% | 5 | 100.00% |
/* Look up the dcookie for the task's mm->exe_file,
* which corresponds loosely to "application name". This is
* not strictly necessary but allows oprofile to associate
* shared-library samples with particular applications
*/
static unsigned long get_exec_dcookie(struct mm_struct *mm)
{
unsigned long cookie = NO_COOKIE;
struct file *exe_file;
if (!mm)
goto done;
exe_file = get_mm_exe_file(mm);
if (!exe_file)
goto done;
cookie = fast_get_dcookie(&exe_file->f_path);
fput(exe_file);
done:
return cookie;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 33 | 50.00% | 3 | 42.86% |
Davidlohr Bueso A | 29 | 43.94% | 1 | 14.29% |
Konstantin Khlebnikov | 2 | 3.03% | 1 | 14.29% |
Josef 'Jeff' Sipek | 1 | 1.52% | 1 | 14.29% |
Jan Blunck | 1 | 1.52% | 1 | 14.29% |
Total | 66 | 100.00% | 7 | 100.00% |
/* Convert the EIP value of a sample into a persistent dentry/offset
* pair that can then be added to the global event buffer. We make
* sure to do this lookup before a mm->mmap modification happens so
* we don't lose track.
*
* The caller must ensure the mm is not nil (ie: not a kernel thread).
*/
static unsigned long
lookup_dcookie(struct mm_struct *mm, unsigned long addr, off_t *offset)
{
unsigned long cookie = NO_COOKIE;
struct vm_area_struct *vma;
down_read(&mm->mmap_sem);
for (vma = find_vma(mm, addr); vma; vma = vma->vm_next) {
if (addr < vma->vm_start || addr >= vma->vm_end)
continue;
if (vma->vm_file) {
cookie = fast_get_dcookie(&vma->vm_file->f_path);
*offset = (vma->vm_pgoff << PAGE_SHIFT) + addr -
vma->vm_start;
} else {
/* must be an anonymous map */
*offset = addr;
}
break;
}
if (!vma)
cookie = INVALID_COOKIE;
up_read(&mm->mmap_sem);
return cookie;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 124 | 87.32% | 3 | 50.00% |
Davidlohr Bueso A | 16 | 11.27% | 1 | 16.67% |
Josef 'Jeff' Sipek | 1 | 0.70% | 1 | 16.67% |
Jan Blunck | 1 | 0.70% | 1 | 16.67% |
Total | 142 | 100.00% | 6 | 100.00% |
static unsigned long last_cookie = INVALID_COOKIE;
static void add_cpu_switch(int i)
{
add_event_entry(ESCAPE_CODE);
add_event_entry(CPU_SWITCH_CODE);
add_event_entry(i);
last_cookie = INVALID_COOKIE;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 28 | 100.00% | 2 | 100.00% |
Total | 28 | 100.00% | 2 | 100.00% |
static void add_kernel_ctx_switch(unsigned int in_kernel)
{
add_event_entry(ESCAPE_CODE);
if (in_kernel)
add_event_entry(KERNEL_ENTER_SWITCH_CODE);
else
add_event_entry(KERNEL_EXIT_SWITCH_CODE);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 30 | 100.00% | 2 | 100.00% |
Total | 30 | 100.00% | 2 | 100.00% |
static void
add_user_ctx_switch(struct task_struct const *task, unsigned long cookie)
{
add_event_entry(ESCAPE_CODE);
add_event_entry(CTX_SWITCH_CODE);
add_event_entry(task->pid);
add_event_entry(cookie);
/* Another code for daemon back-compat */
add_event_entry(ESCAPE_CODE);
add_event_entry(CTX_TGID_CODE);
add_event_entry(task->tgid);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 56 | 100.00% | 4 | 100.00% |
Total | 56 | 100.00% | 4 | 100.00% |
static void add_cookie_switch(unsigned long cookie)
{
add_event_entry(ESCAPE_CODE);
add_event_entry(COOKIE_SWITCH_CODE);
add_event_entry(cookie);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 25 | 100.00% | 2 | 100.00% |
Total | 25 | 100.00% | 2 | 100.00% |
static void add_trace_begin(void)
{
add_event_entry(ESCAPE_CODE);
add_event_entry(TRACE_BEGIN_CODE);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
Greg Banks | 18 | 100.00% | 1 | 100.00% |
Total | 18 | 100.00% | 1 | 100.00% |
static void add_data(struct op_entry *entry, struct mm_struct *mm)
{
unsigned long code, pc, val;
unsigned long cookie;
off_t offset;
if (!op_cpu_buffer_get_data(entry, &code))
return;
if (!op_cpu_buffer_get_data(entry, &pc))
return;
if (!op_cpu_buffer_get_size(entry))
return;
if (mm) {
cookie = lookup_dcookie(mm, pc, &offset);
if (cookie == NO_COOKIE)
offset = pc;
if (cookie == INVALID_COOKIE) {
atomic_inc(&oprofile_stats.sample_lost_no_mapping);
offset = pc;
}
if (cookie != last_cookie) {
add_cookie_switch(cookie);
last_cookie = cookie;
}
} else
offset = pc;
add_event_entry(ESCAPE_CODE);
add_event_entry(code);
add_event_entry(offset); /* Offset from Dcookie */
while (op_cpu_buffer_get_data(entry, &val))
add_event_entry(val);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
Barry Kasindorf | 108 | 65.45% | 1 | 16.67% |
Robert Richter | 57 | 34.55% | 5 | 83.33% |
Total | 165 | 100.00% | 6 | 100.00% |
static inline void add_sample_entry(unsigned long offset, unsigned long event)
{
add_event_entry(offset);
add_event_entry(event);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 24 | 96.00% | 1 | 50.00% |
Robert Richter | 1 | 4.00% | 1 | 50.00% |
Total | 25 | 100.00% | 2 | 100.00% |
/*
* Add a sample to the global event buffer. If possible the
* sample is converted into a persistent dentry/offset pair
* for later lookup from userspace. Return 0 on failure.
*/
static int
add_sample(struct mm_struct *mm, struct op_sample *s, int in_kernel)
{
unsigned long cookie;
off_t offset;
if (in_kernel) {
add_sample_entry(s->eip, s->event);
return 1;
}
/* add userspace sample */
if (!mm) {
atomic_inc(&oprofile_stats.sample_lost_no_mm);
return 0;
}
cookie = lookup_dcookie(mm, s->eip, &offset);
if (cookie == INVALID_COOKIE) {
atomic_inc(&oprofile_stats.sample_lost_no_mapping);
return 0;
}
if (cookie != last_cookie) {
add_cookie_switch(cookie);
last_cookie = cookie;
}
add_sample_entry(offset, s->event);
return 1;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 77 | 60.63% | 4 | 66.67% |
Robert Richter | 43 | 33.86% | 1 | 16.67% |
Greg Banks | 7 | 5.51% | 1 | 16.67% |
Total | 127 | 100.00% | 6 | 100.00% |
static void release_mm(struct mm_struct *mm)
{
if (!mm)
return;
mmput(mm);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 22 | 100.00% | 2 | 100.00% |
Total | 22 | 100.00% | 2 | 100.00% |
static inline int is_code(unsigned long val)
{
return val == ESCAPE_CODE;
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 14 | 87.50% | 1 | 50.00% |
Greg Banks | 2 | 12.50% | 1 | 50.00% |
Total | 16 | 100.00% | 2 | 100.00% |
/* Move tasks along towards death. Any tasks on dead_tasks
* will definitely have no remaining references in any
* CPU buffers at this point, because we use two lists,
* and to have reached the list, it must have gone through
* one full sync already.
*/
static void process_task_mortuary(void)
{
unsigned long flags;
LIST_HEAD(local_dead_tasks);
struct task_struct *task;
struct task_struct *ttask;
spin_lock_irqsave(&task_mortuary, flags);
list_splice_init(&dead_tasks, &local_dead_tasks);
list_splice_init(&dying_tasks, &dead_tasks);
spin_unlock_irqrestore(&task_mortuary, flags);
list_for_each_entry_safe(task, ttask, &local_dead_tasks, tasks) {
list_del(&task->tasks);
free_task(task);
}
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 49 | 56.98% | 1 | 33.33% |
Paul E. McKenney | 36 | 41.86% | 1 | 33.33% |
Adrian Bunk | 1 | 1.16% | 1 | 33.33% |
Total | 86 | 100.00% | 3 | 100.00% |
static void mark_done(int cpu)
{
int i;
cpumask_set_cpu(cpu, marked_cpus);
for_each_online_cpu(i) {
if (!cpumask_test_cpu(i, marked_cpus))
return;
}
/* All CPUs have been processed at least once,
* we can process the mortuary once
*/
process_task_mortuary();
cpumask_clear(marked_cpus);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 42 | 93.33% | 1 | 50.00% |
Rusty Russell | 3 | 6.67% | 1 | 50.00% |
Total | 45 | 100.00% | 2 | 100.00% |
/* FIXME: this is not sufficient if we implement syscall barrier backtrace
* traversal, the code switch to sb_sample_start at first kernel enter/exit
* switch so we need a fifth state and some special handling in sync_buffer()
*/
typedef enum {
sb_bt_ignore = -2,
sb_buffer_start,
sb_bt_start,
sb_sample_start,
}
sync_buffer_state;
/* Sync one of the CPU's buffers into the global event buffer.
* Here we need to go through each batch of samples punctuated
* by context switch notes, taking the task's mmap_sem and doing
* lookup in task->mm->mmap to convert EIP into dcookie/offset
* value.
*/
void sync_buffer(int cpu)
{
struct mm_struct *mm = NULL;
struct mm_struct *oldmm;
unsigned long val;
struct task_struct *new;
unsigned long cookie = 0;
int in_kernel = 1;
sync_buffer_state state = sb_buffer_start;
unsigned int i;
unsigned long available;
unsigned long flags;
struct op_entry entry;
struct op_sample *sample;
mutex_lock(&buffer_mutex);
add_cpu_switch(cpu);
op_cpu_buffer_reset(cpu);
available = op_cpu_buffer_entries(cpu);
for (i = 0; i < available; ++i) {
sample = op_cpu_buffer_read_entry(&entry, cpu);
if (!sample)
break;
if (is_code(sample->eip)) {
flags = sample->event;
if (flags & TRACE_BEGIN) {
state = sb_bt_start;
add_trace_begin();
}
if (flags & KERNEL_CTX_SWITCH) {
/* kernel/userspace switch */
in_kernel = flags & IS_KERNEL;
if (state == sb_buffer_start)
state = sb_sample_start;
add_kernel_ctx_switch(flags & IS_KERNEL);
}
if (flags & USER_CTX_SWITCH
&& op_cpu_buffer_get_data(&entry, &val)) {
/* userspace context switch */
new = (struct task_struct *)val;
oldmm = mm;
release_mm(oldmm);
mm = get_task_mm(new);
if (mm != oldmm)
cookie = get_exec_dcookie(mm);
add_user_ctx_switch(new, cookie);
}
if (op_cpu_buffer_get_size(&entry))
add_data(&entry, mm);
continue;
}
if (state < sb_bt_start)
/* ignore sample */
continue;
if (add_sample(mm, sample, in_kernel))
continue;
/* ignore backtraces if failed to add a sample */
if (state == sb_bt_start) {
state = sb_bt_ignore;
atomic_inc(&oprofile_stats.bt_lost_no_mapping);
}
}
release_mm(mm);
mark_done(cpu);
mutex_unlock(&buffer_mutex);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 144 | 44.86% | 7 | 30.43% |
Robert Richter | 122 | 38.01% | 10 | 43.48% |
Greg Banks | 40 | 12.46% | 1 | 4.35% |
Barry Kasindorf | 9 | 2.80% | 2 | 8.70% |
Markus Armbruster | 4 | 1.25% | 1 | 4.35% |
Mika Kukkonen | 1 | 0.31% | 1 | 4.35% |
Davidlohr Bueso A | 1 | 0.31% | 1 | 4.35% |
Total | 321 | 100.00% | 23 | 100.00% |
/* The function can be used to add a buffer worth of data directly to
* the kernel buffer. The buffer is assumed to be a circular buffer.
* Take the entries from index start and end at index end, wrapping
* at max_entries.
*/
void oprofile_put_buff(unsigned long *buf, unsigned int start,
unsigned int stop, unsigned int max)
{
int i;
i = start;
mutex_lock(&buffer_mutex);
while (i != stop) {
add_event_entry(buf[i++]);
if (i >= max)
i = 0;
}
mutex_unlock(&buffer_mutex);
}
Contributors
Person | Tokens | Prop | Commits | CommitProp |
Carl E. Love | 68 | 100.00% | 1 | 100.00% |
Total | 68 | 100.00% | 1 | 100.00% |
Overall Contributors
Person | Tokens | Prop | Commits | CommitProp |
John Levon | 1202 | 62.83% | 16 | 27.12% |
Robert Richter | 280 | 14.64% | 18 | 30.51% |
Barry Kasindorf | 117 | 6.12% | 2 | 3.39% |
Greg Banks | 84 | 4.39% | 1 | 1.69% |
Carl E. Love | 69 | 3.61% | 1 | 1.69% |
Davidlohr Bueso A | 50 | 2.61% | 1 | 1.69% |
Paul E. McKenney | 47 | 2.46% | 1 | 1.69% |
Jan Blunck | 9 | 0.47% | 1 | 1.69% |
Markus Armbruster | 8 | 0.42% | 1 | 1.69% |
Ingo Molnar | 8 | 0.42% | 3 | 5.08% |
Andrew Morton | 7 | 0.37% | 1 | 1.69% |
Tejun Heo | 4 | 0.21% | 2 | 3.39% |
Rusty Russell | 4 | 0.21% | 1 | 1.69% |
Thomas Gleixner | 4 | 0.21% | 1 | 1.69% |
Bob Nelson | 3 | 0.16% | 1 | 1.69% |
Adrian Bunk | 3 | 0.16% | 1 | 1.69% |
Konstantin Khlebnikov | 3 | 0.16% | 1 | 1.69% |
Alexey Dobriyan | 3 | 0.16% | 1 | 1.69% |
Nicholas Piggin | 3 | 0.16% | 1 | 1.69% |
Josef 'Jeff' Sipek | 2 | 0.10% | 1 | 1.69% |
Mika Kukkonen | 1 | 0.05% | 1 | 1.69% |
Al Viro | 1 | 0.05% | 1 | 1.69% |
Li Zefan | 1 | 0.05% | 1 | 1.69% |
Total | 1913 | 100.00% | 59 | 100.00% |
Information contained on this website is for historical information purposes only and does not indicate or represent copyright ownership.