Merge branch 'perf-fixes-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/linux-2.6-tip
* 'perf-fixes-for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/tip/linux-2.6-tip: perf symbols: Remove incorrect open-coded container_of() perf record: Handle restrictive permissions in /proc/{kallsyms,modules} x86/kprobes: Prevent kprobes to probe on save_args() irq_work: Drop cmpxchg() result perf: Fix owner-list vs exit x86, hw_nmi: Move backtrace_mask declaration under ARCH_HAS_NMI_WATCHDOG tracing: Fix recursive user stack trace perf,hw_breakpoint: Initialize hardware api earlier x86: Ignore trap bits on single step exceptions tracing: Force arch_local_irq_* notrace for paravirt tracing: Fix module use of trace_bprintk()
This commit is contained in:
commit
d2f30c73ab
@ -824,27 +824,27 @@ static __always_inline void arch_spin_unlock(struct arch_spinlock *lock)
|
|||||||
#define __PV_IS_CALLEE_SAVE(func) \
|
#define __PV_IS_CALLEE_SAVE(func) \
|
||||||
((struct paravirt_callee_save) { func })
|
((struct paravirt_callee_save) { func })
|
||||||
|
|
||||||
static inline unsigned long arch_local_save_flags(void)
|
static inline notrace unsigned long arch_local_save_flags(void)
|
||||||
{
|
{
|
||||||
return PVOP_CALLEE0(unsigned long, pv_irq_ops.save_fl);
|
return PVOP_CALLEE0(unsigned long, pv_irq_ops.save_fl);
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline void arch_local_irq_restore(unsigned long f)
|
static inline notrace void arch_local_irq_restore(unsigned long f)
|
||||||
{
|
{
|
||||||
PVOP_VCALLEE1(pv_irq_ops.restore_fl, f);
|
PVOP_VCALLEE1(pv_irq_ops.restore_fl, f);
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline void arch_local_irq_disable(void)
|
static inline notrace void arch_local_irq_disable(void)
|
||||||
{
|
{
|
||||||
PVOP_VCALLEE0(pv_irq_ops.irq_disable);
|
PVOP_VCALLEE0(pv_irq_ops.irq_disable);
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline void arch_local_irq_enable(void)
|
static inline notrace void arch_local_irq_enable(void)
|
||||||
{
|
{
|
||||||
PVOP_VCALLEE0(pv_irq_ops.irq_enable);
|
PVOP_VCALLEE0(pv_irq_ops.irq_enable);
|
||||||
}
|
}
|
||||||
|
|
||||||
static inline unsigned long arch_local_irq_save(void)
|
static inline notrace unsigned long arch_local_irq_save(void)
|
||||||
{
|
{
|
||||||
unsigned long f;
|
unsigned long f;
|
||||||
|
|
||||||
|
@ -17,15 +17,16 @@
|
|||||||
#include <linux/nmi.h>
|
#include <linux/nmi.h>
|
||||||
#include <linux/module.h>
|
#include <linux/module.h>
|
||||||
|
|
||||||
/* For reliability, we're prepared to waste bits here. */
|
|
||||||
static DECLARE_BITMAP(backtrace_mask, NR_CPUS) __read_mostly;
|
|
||||||
|
|
||||||
u64 hw_nmi_get_sample_period(void)
|
u64 hw_nmi_get_sample_period(void)
|
||||||
{
|
{
|
||||||
return (u64)(cpu_khz) * 1000 * 60;
|
return (u64)(cpu_khz) * 1000 * 60;
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef ARCH_HAS_NMI_WATCHDOG
|
#ifdef ARCH_HAS_NMI_WATCHDOG
|
||||||
|
|
||||||
|
/* For reliability, we're prepared to waste bits here. */
|
||||||
|
static DECLARE_BITMAP(backtrace_mask, NR_CPUS) __read_mostly;
|
||||||
|
|
||||||
void arch_trigger_all_cpu_backtrace(void)
|
void arch_trigger_all_cpu_backtrace(void)
|
||||||
{
|
{
|
||||||
int i;
|
int i;
|
||||||
|
@ -295,6 +295,7 @@ ENDPROC(native_usergs_sysret64)
|
|||||||
.endm
|
.endm
|
||||||
|
|
||||||
/* save partial stack frame */
|
/* save partial stack frame */
|
||||||
|
.pushsection .kprobes.text, "ax"
|
||||||
ENTRY(save_args)
|
ENTRY(save_args)
|
||||||
XCPT_FRAME
|
XCPT_FRAME
|
||||||
cld
|
cld
|
||||||
@ -334,6 +335,7 @@ ENTRY(save_args)
|
|||||||
ret
|
ret
|
||||||
CFI_ENDPROC
|
CFI_ENDPROC
|
||||||
END(save_args)
|
END(save_args)
|
||||||
|
.popsection
|
||||||
|
|
||||||
ENTRY(save_rest)
|
ENTRY(save_rest)
|
||||||
PARTIAL_FRAME 1 REST_SKIP+8
|
PARTIAL_FRAME 1 REST_SKIP+8
|
||||||
|
@ -433,6 +433,10 @@ static int __kprobes hw_breakpoint_handler(struct die_args *args)
|
|||||||
dr6_p = (unsigned long *)ERR_PTR(args->err);
|
dr6_p = (unsigned long *)ERR_PTR(args->err);
|
||||||
dr6 = *dr6_p;
|
dr6 = *dr6_p;
|
||||||
|
|
||||||
|
/* If it's a single step, TRAP bits are random */
|
||||||
|
if (dr6 & DR_STEP)
|
||||||
|
return NOTIFY_DONE;
|
||||||
|
|
||||||
/* Do an early return if no trap bits are set in DR6 */
|
/* Do an early return if no trap bits are set in DR6 */
|
||||||
if ((dr6 & DR_TRAP_BITS) == 0)
|
if ((dr6 & DR_TRAP_BITS) == 0)
|
||||||
return NOTIFY_DONE;
|
return NOTIFY_DONE;
|
||||||
|
@ -33,6 +33,8 @@ enum bp_type_idx {
|
|||||||
|
|
||||||
#ifdef CONFIG_HAVE_HW_BREAKPOINT
|
#ifdef CONFIG_HAVE_HW_BREAKPOINT
|
||||||
|
|
||||||
|
extern int __init init_hw_breakpoint(void);
|
||||||
|
|
||||||
static inline void hw_breakpoint_init(struct perf_event_attr *attr)
|
static inline void hw_breakpoint_init(struct perf_event_attr *attr)
|
||||||
{
|
{
|
||||||
memset(attr, 0, sizeof(*attr));
|
memset(attr, 0, sizeof(*attr));
|
||||||
@ -108,6 +110,8 @@ static inline struct arch_hw_breakpoint *counter_arch_bp(struct perf_event *bp)
|
|||||||
|
|
||||||
#else /* !CONFIG_HAVE_HW_BREAKPOINT */
|
#else /* !CONFIG_HAVE_HW_BREAKPOINT */
|
||||||
|
|
||||||
|
static inline int __init init_hw_breakpoint(void) { return 0; }
|
||||||
|
|
||||||
static inline struct perf_event *
|
static inline struct perf_event *
|
||||||
register_user_hw_breakpoint(struct perf_event_attr *attr,
|
register_user_hw_breakpoint(struct perf_event_attr *attr,
|
||||||
perf_overflow_handler_t triggered,
|
perf_overflow_handler_t triggered,
|
||||||
|
@ -620,7 +620,7 @@ static struct pmu perf_breakpoint = {
|
|||||||
.read = hw_breakpoint_pmu_read,
|
.read = hw_breakpoint_pmu_read,
|
||||||
};
|
};
|
||||||
|
|
||||||
static int __init init_hw_breakpoint(void)
|
int __init init_hw_breakpoint(void)
|
||||||
{
|
{
|
||||||
unsigned int **task_bp_pinned;
|
unsigned int **task_bp_pinned;
|
||||||
int cpu, err_cpu;
|
int cpu, err_cpu;
|
||||||
@ -655,6 +655,5 @@ static int __init init_hw_breakpoint(void)
|
|||||||
|
|
||||||
return -ENOMEM;
|
return -ENOMEM;
|
||||||
}
|
}
|
||||||
core_initcall(init_hw_breakpoint);
|
|
||||||
|
|
||||||
|
|
||||||
|
@ -145,7 +145,9 @@ void irq_work_run(void)
|
|||||||
* Clear the BUSY bit and return to the free state if
|
* Clear the BUSY bit and return to the free state if
|
||||||
* no-one else claimed it meanwhile.
|
* no-one else claimed it meanwhile.
|
||||||
*/
|
*/
|
||||||
cmpxchg(&entry->next, next_flags(NULL, IRQ_WORK_BUSY), NULL);
|
(void)cmpxchg(&entry->next,
|
||||||
|
next_flags(NULL, IRQ_WORK_BUSY),
|
||||||
|
NULL);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
EXPORT_SYMBOL_GPL(irq_work_run);
|
EXPORT_SYMBOL_GPL(irq_work_run);
|
||||||
|
@ -2326,6 +2326,18 @@ static void find_module_sections(struct module *mod, struct load_info *info)
|
|||||||
kmemleak_scan_area(mod->trace_events, sizeof(*mod->trace_events) *
|
kmemleak_scan_area(mod->trace_events, sizeof(*mod->trace_events) *
|
||||||
mod->num_trace_events, GFP_KERNEL);
|
mod->num_trace_events, GFP_KERNEL);
|
||||||
#endif
|
#endif
|
||||||
|
#ifdef CONFIG_TRACING
|
||||||
|
mod->trace_bprintk_fmt_start = section_objs(info, "__trace_printk_fmt",
|
||||||
|
sizeof(*mod->trace_bprintk_fmt_start),
|
||||||
|
&mod->num_trace_bprintk_fmt);
|
||||||
|
/*
|
||||||
|
* This section contains pointers to allocated objects in the trace
|
||||||
|
* code and not scanning it leads to false positives.
|
||||||
|
*/
|
||||||
|
kmemleak_scan_area(mod->trace_bprintk_fmt_start,
|
||||||
|
sizeof(*mod->trace_bprintk_fmt_start) *
|
||||||
|
mod->num_trace_bprintk_fmt, GFP_KERNEL);
|
||||||
|
#endif
|
||||||
#ifdef CONFIG_FTRACE_MCOUNT_RECORD
|
#ifdef CONFIG_FTRACE_MCOUNT_RECORD
|
||||||
/* sechdrs[0].sh_size is always zero */
|
/* sechdrs[0].sh_size is always zero */
|
||||||
mod->ftrace_callsites = section_objs(info, "__mcount_loc",
|
mod->ftrace_callsites = section_objs(info, "__mcount_loc",
|
||||||
|
@ -31,6 +31,7 @@
|
|||||||
#include <linux/kernel_stat.h>
|
#include <linux/kernel_stat.h>
|
||||||
#include <linux/perf_event.h>
|
#include <linux/perf_event.h>
|
||||||
#include <linux/ftrace_event.h>
|
#include <linux/ftrace_event.h>
|
||||||
|
#include <linux/hw_breakpoint.h>
|
||||||
|
|
||||||
#include <asm/irq_regs.h>
|
#include <asm/irq_regs.h>
|
||||||
|
|
||||||
@ -2234,11 +2235,6 @@ int perf_event_release_kernel(struct perf_event *event)
|
|||||||
raw_spin_unlock_irq(&ctx->lock);
|
raw_spin_unlock_irq(&ctx->lock);
|
||||||
mutex_unlock(&ctx->mutex);
|
mutex_unlock(&ctx->mutex);
|
||||||
|
|
||||||
mutex_lock(&event->owner->perf_event_mutex);
|
|
||||||
list_del_init(&event->owner_entry);
|
|
||||||
mutex_unlock(&event->owner->perf_event_mutex);
|
|
||||||
put_task_struct(event->owner);
|
|
||||||
|
|
||||||
free_event(event);
|
free_event(event);
|
||||||
|
|
||||||
return 0;
|
return 0;
|
||||||
@ -2251,9 +2247,43 @@ EXPORT_SYMBOL_GPL(perf_event_release_kernel);
|
|||||||
static int perf_release(struct inode *inode, struct file *file)
|
static int perf_release(struct inode *inode, struct file *file)
|
||||||
{
|
{
|
||||||
struct perf_event *event = file->private_data;
|
struct perf_event *event = file->private_data;
|
||||||
|
struct task_struct *owner;
|
||||||
|
|
||||||
file->private_data = NULL;
|
file->private_data = NULL;
|
||||||
|
|
||||||
|
rcu_read_lock();
|
||||||
|
owner = ACCESS_ONCE(event->owner);
|
||||||
|
/*
|
||||||
|
* Matches the smp_wmb() in perf_event_exit_task(). If we observe
|
||||||
|
* !owner it means the list deletion is complete and we can indeed
|
||||||
|
* free this event, otherwise we need to serialize on
|
||||||
|
* owner->perf_event_mutex.
|
||||||
|
*/
|
||||||
|
smp_read_barrier_depends();
|
||||||
|
if (owner) {
|
||||||
|
/*
|
||||||
|
* Since delayed_put_task_struct() also drops the last
|
||||||
|
* task reference we can safely take a new reference
|
||||||
|
* while holding the rcu_read_lock().
|
||||||
|
*/
|
||||||
|
get_task_struct(owner);
|
||||||
|
}
|
||||||
|
rcu_read_unlock();
|
||||||
|
|
||||||
|
if (owner) {
|
||||||
|
mutex_lock(&owner->perf_event_mutex);
|
||||||
|
/*
|
||||||
|
* We have to re-check the event->owner field, if it is cleared
|
||||||
|
* we raced with perf_event_exit_task(), acquiring the mutex
|
||||||
|
* ensured they're done, and we can proceed with freeing the
|
||||||
|
* event.
|
||||||
|
*/
|
||||||
|
if (event->owner)
|
||||||
|
list_del_init(&event->owner_entry);
|
||||||
|
mutex_unlock(&owner->perf_event_mutex);
|
||||||
|
put_task_struct(owner);
|
||||||
|
}
|
||||||
|
|
||||||
return perf_event_release_kernel(event);
|
return perf_event_release_kernel(event);
|
||||||
}
|
}
|
||||||
|
|
||||||
@ -5677,7 +5707,7 @@ SYSCALL_DEFINE5(perf_event_open,
|
|||||||
mutex_unlock(&ctx->mutex);
|
mutex_unlock(&ctx->mutex);
|
||||||
|
|
||||||
event->owner = current;
|
event->owner = current;
|
||||||
get_task_struct(current);
|
|
||||||
mutex_lock(¤t->perf_event_mutex);
|
mutex_lock(¤t->perf_event_mutex);
|
||||||
list_add_tail(&event->owner_entry, ¤t->perf_event_list);
|
list_add_tail(&event->owner_entry, ¤t->perf_event_list);
|
||||||
mutex_unlock(¤t->perf_event_mutex);
|
mutex_unlock(¤t->perf_event_mutex);
|
||||||
@ -5745,12 +5775,6 @@ perf_event_create_kernel_counter(struct perf_event_attr *attr, int cpu,
|
|||||||
++ctx->generation;
|
++ctx->generation;
|
||||||
mutex_unlock(&ctx->mutex);
|
mutex_unlock(&ctx->mutex);
|
||||||
|
|
||||||
event->owner = current;
|
|
||||||
get_task_struct(current);
|
|
||||||
mutex_lock(¤t->perf_event_mutex);
|
|
||||||
list_add_tail(&event->owner_entry, ¤t->perf_event_list);
|
|
||||||
mutex_unlock(¤t->perf_event_mutex);
|
|
||||||
|
|
||||||
return event;
|
return event;
|
||||||
|
|
||||||
err_free:
|
err_free:
|
||||||
@ -5901,8 +5925,24 @@ again:
|
|||||||
*/
|
*/
|
||||||
void perf_event_exit_task(struct task_struct *child)
|
void perf_event_exit_task(struct task_struct *child)
|
||||||
{
|
{
|
||||||
|
struct perf_event *event, *tmp;
|
||||||
int ctxn;
|
int ctxn;
|
||||||
|
|
||||||
|
mutex_lock(&child->perf_event_mutex);
|
||||||
|
list_for_each_entry_safe(event, tmp, &child->perf_event_list,
|
||||||
|
owner_entry) {
|
||||||
|
list_del_init(&event->owner_entry);
|
||||||
|
|
||||||
|
/*
|
||||||
|
* Ensure the list deletion is visible before we clear
|
||||||
|
* the owner, closes a race against perf_release() where
|
||||||
|
* we need to serialize on the owner->perf_event_mutex.
|
||||||
|
*/
|
||||||
|
smp_wmb();
|
||||||
|
event->owner = NULL;
|
||||||
|
}
|
||||||
|
mutex_unlock(&child->perf_event_mutex);
|
||||||
|
|
||||||
for_each_task_context_nr(ctxn)
|
for_each_task_context_nr(ctxn)
|
||||||
perf_event_exit_task_context(child, ctxn);
|
perf_event_exit_task_context(child, ctxn);
|
||||||
}
|
}
|
||||||
@ -6321,6 +6361,8 @@ perf_cpu_notify(struct notifier_block *self, unsigned long action, void *hcpu)
|
|||||||
|
|
||||||
void __init perf_event_init(void)
|
void __init perf_event_init(void)
|
||||||
{
|
{
|
||||||
|
int ret;
|
||||||
|
|
||||||
perf_event_init_all_cpus();
|
perf_event_init_all_cpus();
|
||||||
init_srcu_struct(&pmus_srcu);
|
init_srcu_struct(&pmus_srcu);
|
||||||
perf_pmu_register(&perf_swevent);
|
perf_pmu_register(&perf_swevent);
|
||||||
@ -6328,4 +6370,7 @@ void __init perf_event_init(void)
|
|||||||
perf_pmu_register(&perf_task_clock);
|
perf_pmu_register(&perf_task_clock);
|
||||||
perf_tp_register();
|
perf_tp_register();
|
||||||
perf_cpu_notifier(perf_cpu_notify);
|
perf_cpu_notifier(perf_cpu_notify);
|
||||||
|
|
||||||
|
ret = init_hw_breakpoint();
|
||||||
|
WARN(ret, "hw_breakpoint initialization failed with: %d", ret);
|
||||||
}
|
}
|
||||||
|
@ -1283,6 +1283,8 @@ void trace_dump_stack(void)
|
|||||||
__ftrace_trace_stack(global_trace.buffer, flags, 3, preempt_count());
|
__ftrace_trace_stack(global_trace.buffer, flags, 3, preempt_count());
|
||||||
}
|
}
|
||||||
|
|
||||||
|
static DEFINE_PER_CPU(int, user_stack_count);
|
||||||
|
|
||||||
void
|
void
|
||||||
ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
|
ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
|
||||||
{
|
{
|
||||||
@ -1301,6 +1303,18 @@ ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
|
|||||||
if (unlikely(in_nmi()))
|
if (unlikely(in_nmi()))
|
||||||
return;
|
return;
|
||||||
|
|
||||||
|
/*
|
||||||
|
* prevent recursion, since the user stack tracing may
|
||||||
|
* trigger other kernel events.
|
||||||
|
*/
|
||||||
|
preempt_disable();
|
||||||
|
if (__this_cpu_read(user_stack_count))
|
||||||
|
goto out;
|
||||||
|
|
||||||
|
__this_cpu_inc(user_stack_count);
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK,
|
event = trace_buffer_lock_reserve(buffer, TRACE_USER_STACK,
|
||||||
sizeof(*entry), flags, pc);
|
sizeof(*entry), flags, pc);
|
||||||
if (!event)
|
if (!event)
|
||||||
@ -1318,6 +1332,11 @@ ftrace_trace_userstack(struct ring_buffer *buffer, unsigned long flags, int pc)
|
|||||||
save_stack_trace_user(&trace);
|
save_stack_trace_user(&trace);
|
||||||
if (!filter_check_discard(call, entry, buffer, event))
|
if (!filter_check_discard(call, entry, buffer, event))
|
||||||
ring_buffer_unlock_commit(buffer, event);
|
ring_buffer_unlock_commit(buffer, event);
|
||||||
|
|
||||||
|
__this_cpu_dec(user_stack_count);
|
||||||
|
|
||||||
|
out:
|
||||||
|
preempt_enable();
|
||||||
}
|
}
|
||||||
|
|
||||||
#ifdef UNUSED
|
#ifdef UNUSED
|
||||||
|
@ -697,17 +697,18 @@ static int __cmd_record(int argc, const char **argv)
|
|||||||
if (err < 0)
|
if (err < 0)
|
||||||
err = event__synthesize_kernel_mmap(process_synthesized_event,
|
err = event__synthesize_kernel_mmap(process_synthesized_event,
|
||||||
session, machine, "_stext");
|
session, machine, "_stext");
|
||||||
if (err < 0) {
|
if (err < 0)
|
||||||
pr_err("Couldn't record kernel reference relocation symbol.\n");
|
pr_err("Couldn't record kernel reference relocation symbol\n"
|
||||||
return err;
|
"Symbol resolution may be skewed if relocation was used (e.g. kexec).\n"
|
||||||
}
|
"Check /proc/kallsyms permission or run as root.\n");
|
||||||
|
|
||||||
err = event__synthesize_modules(process_synthesized_event,
|
err = event__synthesize_modules(process_synthesized_event,
|
||||||
session, machine);
|
session, machine);
|
||||||
if (err < 0) {
|
if (err < 0)
|
||||||
pr_err("Couldn't record kernel reference relocation symbol.\n");
|
pr_err("Couldn't record kernel module information.\n"
|
||||||
return err;
|
"Symbol resolution may be skewed if relocation was used (e.g. kexec).\n"
|
||||||
}
|
"Check /proc/modules permission or run as root.\n");
|
||||||
|
|
||||||
if (perf_guest)
|
if (perf_guest)
|
||||||
perf_session__process_machines(session, event__synthesize_guest_os);
|
perf_session__process_machines(session, event__synthesize_guest_os);
|
||||||
|
|
||||||
|
@ -295,7 +295,9 @@ static void symbols__insert_by_name(struct rb_root *self, struct symbol *sym)
|
|||||||
{
|
{
|
||||||
struct rb_node **p = &self->rb_node;
|
struct rb_node **p = &self->rb_node;
|
||||||
struct rb_node *parent = NULL;
|
struct rb_node *parent = NULL;
|
||||||
struct symbol_name_rb_node *symn = ((void *)sym) - sizeof(*parent), *s;
|
struct symbol_name_rb_node *symn, *s;
|
||||||
|
|
||||||
|
symn = container_of(sym, struct symbol_name_rb_node, sym);
|
||||||
|
|
||||||
while (*p != NULL) {
|
while (*p != NULL) {
|
||||||
parent = *p;
|
parent = *p;
|
||||||
|
Loading…
Reference in New Issue
Block a user