Return-Path: Received: (majordomo@vger.kernel.org) by vger.kernel.org via listexpand id S1753492AbaKEDM1 (ORCPT ); Tue, 4 Nov 2014 22:12:27 -0500 Received: from mga01.intel.com ([192.55.52.88]:23387 "EHLO mga01.intel.com" rhost-flags-OK-OK-OK-OK) by vger.kernel.org with ESMTP id S1753332AbaKEDKl (ORCPT ); Tue, 4 Nov 2014 22:10:41 -0500 X-ExtLoop1: 1 X-IronPort-AV: E=Sophos;i="5.07,317,1413270000"; d="scan'208";a="617287007" From: Kan Liang To: a.p.zijlstra@chello.nl, eranian@google.com Cc: linux-kernel@vger.kernel.org, mingo@redhat.com, paulus@samba.org, acme@kernel.org, jolsa@redhat.com, ak@linux.intel.com, Kan Liang Subject: [PATCH V7 11/17] perf, core: expose LBR call stack to user perf tool Date: Tue, 4 Nov 2014 21:56:07 -0500 Message-Id: <1415156173-10035-12-git-send-email-kan.liang@intel.com> X-Mailer: git-send-email 1.8.3.2 In-Reply-To: <1415156173-10035-1-git-send-email-kan.liang@intel.com> References: <1415156173-10035-1-git-send-email-kan.liang@intel.com> Sender: linux-kernel-owner@vger.kernel.org List-ID: X-Mailing-List: linux-kernel@vger.kernel.org From: Yan, Zheng With LBR call stack feature enable, there are two call chain data sources, traditional frame pointer and LBR call stack. This patch extends the perf_callchain_entry struct to mark the available call chain source. The frame pointer is still output as PERF_SAMPLE_CALLCHAIN data format. The LBR call stack data will be output as PERF_SAMPLE_BRANCH_STACK data format. Note: The LBR call stack is only available for user callchain. The kernel is always got from frame pointers. The user space perf tool also need to be changed to handle these two sources. Signed-off-by: Kan Liang Signed-off-by: Yan, Zheng --- arch/x86/kernel/cpu/perf_event.c | 7 +++++++ arch/x86/kernel/cpu/perf_event_intel.c | 2 +- arch/x86/kernel/cpu/perf_event_intel_ds.c | 2 +- arch/x86/kernel/cpu/perf_event_intel_lbr.c | 2 ++ include/linux/perf_event.h | 14 +++++++++++++- kernel/events/callchain.c | 1 + kernel/events/core.c | 22 +++++++++++++++++----- 7 files changed, 42 insertions(+), 8 deletions(-) diff --git a/arch/x86/kernel/cpu/perf_event.c b/arch/x86/kernel/cpu/perf_event.c index 1fd9492..646e705 100644 --- a/arch/x86/kernel/cpu/perf_event.c +++ b/arch/x86/kernel/cpu/perf_event.c @@ -2041,6 +2041,10 @@ perf_callchain_user32(struct pt_regs *regs, struct perf_callchain_entry *entry) perf_callchain_store(entry, cs_base + frame.return_address); fp = compat_ptr(ss_base + frame.next_frame); } + + if (fp != compat_ptr(regs->bp)) + entry->source |= PERF_FP_CALLCHAIN; + return 1; } #else @@ -2093,6 +2097,9 @@ perf_callchain_user(struct perf_callchain_entry *entry, struct pt_regs *regs) perf_callchain_store(entry, frame.return_address); fp = frame.next_frame; } + + if (fp != (void __user *)regs->bp) + entry->source |= PERF_FP_CALLCHAIN; } /* diff --git a/arch/x86/kernel/cpu/perf_event_intel.c b/arch/x86/kernel/cpu/perf_event_intel.c index 5f449fb..b35e23d 100644 --- a/arch/x86/kernel/cpu/perf_event_intel.c +++ b/arch/x86/kernel/cpu/perf_event_intel.c @@ -1404,7 +1404,7 @@ again: perf_sample_data_init(&data, 0, event->hw.last_period); - if (has_branch_stack(event)) + if (needs_branch_stack(event)) data.br_stack = &cpuc->lbr_stack; if (perf_event_overflow(event, &data, regs)) diff --git a/arch/x86/kernel/cpu/perf_event_intel_ds.c b/arch/x86/kernel/cpu/perf_event_intel_ds.c index 46211bc..517fd26 100644 --- a/arch/x86/kernel/cpu/perf_event_intel_ds.c +++ b/arch/x86/kernel/cpu/perf_event_intel_ds.c @@ -907,7 +907,7 @@ static void __intel_pmu_pebs_event(struct perf_event *event, data.txn = intel_hsw_transaction(pebs); } - if (has_branch_stack(event)) + if (needs_branch_stack(event)) data.br_stack = &cpuc->lbr_stack; if (perf_event_overflow(event, &data, ®s)) diff --git a/arch/x86/kernel/cpu/perf_event_intel_lbr.c b/arch/x86/kernel/cpu/perf_event_intel_lbr.c index 8c72efa..a9e3a0d 100644 --- a/arch/x86/kernel/cpu/perf_event_intel_lbr.c +++ b/arch/x86/kernel/cpu/perf_event_intel_lbr.c @@ -746,6 +746,8 @@ intel_pmu_lbr_filter(struct cpu_hw_events *cpuc) int i, j, type; bool compress = false; + cpuc->lbr_stack.user_callstack = branch_user_callstack(br_sel); + /* if sampling all branches, then nothing to filter */ if ((br_sel & X86_BR_ALL) == X86_BR_ALL) return; diff --git a/include/linux/perf_event.h b/include/linux/perf_event.h index 0d67460..c42f4ec 100644 --- a/include/linux/perf_event.h +++ b/include/linux/perf_event.h @@ -55,7 +55,16 @@ struct perf_guest_info_callbacks { #include #include +/* + * From Haswell, the existing Last Branch Record facility can + * also be used to record call chains. + * source: indicates the available call chains source. + */ +#define PERF_FP_CALLCHAIN 0x01 +#define PERF_LBR_CALLCHAIN 0x02 + struct perf_callchain_entry { + __u64 source; __u64 nr; __u64 ip[PERF_MAX_STACK_DEPTH]; }; @@ -67,7 +76,9 @@ struct perf_raw_record { /* * branch stack layout: - * nr: number of taken branches stored in entries[] + * user_callstack: LBR is enhanced to support call stack profiling. + * user_callstack indicates if it's call stack info. + * nr: number of taken branches stored in entries[] * * Note that nr can vary from sample to sample * branches (to, from) are stored from most recent @@ -75,6 +86,7 @@ struct perf_raw_record { * recent branch. */ struct perf_branch_stack { + bool user_callstack; __u64 nr; struct perf_branch_entry entries[0]; }; diff --git a/kernel/events/callchain.c b/kernel/events/callchain.c index d659487..0fc5924 100644 --- a/kernel/events/callchain.c +++ b/kernel/events/callchain.c @@ -175,6 +175,7 @@ perf_callchain(struct perf_event *event, struct pt_regs *regs) if (!entry) goto exit_put; + entry->source = 0; entry->nr = 0; if (kernel && !user_mode(regs)) { diff --git a/kernel/events/core.c b/kernel/events/core.c index 3f3e43d..27f9596 100644 --- a/kernel/events/core.c +++ b/kernel/events/core.c @@ -4793,7 +4793,7 @@ void perf_output_sample(struct perf_output_handle *handle, if (sample_type & PERF_SAMPLE_CALLCHAIN) { if (data->callchain) { - int size = 1; + int size = 2; if (data->callchain) size += data->callchain->nr; @@ -4824,7 +4824,9 @@ void perf_output_sample(struct perf_output_handle *handle, } } - if (sample_type & PERF_SAMPLE_BRANCH_STACK) { + /* LBR can be used for call stack, so it may be enabled implicitly. */ + if ((sample_type & PERF_SAMPLE_BRANCH_STACK) || + (data->br_stack && data->br_stack->user_callstack)) { if (data->br_stack) { size_t size; @@ -4908,13 +4910,21 @@ void perf_prepare_sample(struct perf_event_header *header, data->ip = perf_instruction_pointer(regs); if (sample_type & PERF_SAMPLE_CALLCHAIN) { - int size = 1; + int size = 2; data->callchain = perf_callchain(event, regs); - if (data->callchain) + if (data->callchain) { size += data->callchain->nr; + if (data->br_stack && + data->br_stack->user_callstack && + !(sample_type & PERF_SAMPLE_BRANCH_STACK) && + !(sample_type & PERF_SAMPLE_STACK_USER)) + data->callchain->source |= + PERF_LBR_CALLCHAIN; + } + header->size += size * sizeof(u64); } @@ -4930,7 +4940,9 @@ void perf_prepare_sample(struct perf_event_header *header, header->size += size; } - if (sample_type & PERF_SAMPLE_BRANCH_STACK) { + /* LBR can be used for call stack, so it may be enabled implicitly. */ + if ((sample_type & PERF_SAMPLE_BRANCH_STACK) || + (data->br_stack && data->br_stack->user_callstack)) { int size = sizeof(u64); /* nr */ if (data->br_stack) { size += data->br_stack->nr -- 1.8.3.2 -- To unsubscribe from this list: send the line "unsubscribe linux-kernel" in the body of a message to majordomo@vger.kernel.org More majordomo info at http://vger.kernel.org/majordomo-info.html Please read the FAQ at http://www.tux.org/lkml/