mirror of
https://github.com/torvalds/linux.git
synced 2024-12-04 18:13:04 +00:00
1f8cbb9c83
git commit dc7ee00d47
("s390: lowcore stack pointer offsets") introduced a regression with regard to perf_callchain_kernel(). The stack pointer for the asynchronous stack in the lowcore now has an additional offset applied. This offset needs to be taken into account when calculating the low and high addresses of the stack. This bug was already partially fixed with 9cc5c206d9
("s390/dumpstack: fix address ranges for asynchronous and panic stack"). This patch also fixes it for the perf_event code. Fixes: dc7ee00d47
("s390: lowcore stack pointer offsets") Signed-off-by: Heiko Carstens <heiko.carstens@de.ibm.com> Signed-off-by: Martin Schwidefsky <schwidefsky@de.ibm.com>
325 lines
7.9 KiB
C
325 lines
7.9 KiB
C
/*
|
|
* Performance event support for s390x
|
|
*
|
|
* Copyright IBM Corp. 2012, 2013
|
|
* Author(s): Hendrik Brueckner <brueckner@linux.vnet.ibm.com>
|
|
*
|
|
* This program is free software; you can redistribute it and/or modify
|
|
* it under the terms of the GNU General Public License (version 2 only)
|
|
* as published by the Free Software Foundation.
|
|
*/
|
|
#define KMSG_COMPONENT "perf"
|
|
#define pr_fmt(fmt) KMSG_COMPONENT ": " fmt
|
|
|
|
#include <linux/kernel.h>
|
|
#include <linux/perf_event.h>
|
|
#include <linux/kvm_host.h>
|
|
#include <linux/percpu.h>
|
|
#include <linux/export.h>
|
|
#include <linux/seq_file.h>
|
|
#include <linux/spinlock.h>
|
|
#include <linux/sysfs.h>
|
|
#include <asm/irq.h>
|
|
#include <asm/cpu_mf.h>
|
|
#include <asm/lowcore.h>
|
|
#include <asm/processor.h>
|
|
#include <asm/sysinfo.h>
|
|
|
|
/*
 * perf_pmu_name - return a descriptive name for the PMU
 *
 * Returns the CPU-MF description string when cpum_cf_avail() or
 * cpum_sf_avail() reports true, and the generic name "pmu" otherwise.
 */
const char *perf_pmu_name(void)
{
	const char *name = "pmu";

	if (cpum_cf_avail() || cpum_sf_avail())
		name = "CPU-Measurement Facilities (CPU-MF)";
	return name;
}
EXPORT_SYMBOL(perf_pmu_name);
|
|
|
|
int perf_num_counters(void)
|
|
{
|
|
int num = 0;
|
|
|
|
if (cpum_cf_avail())
|
|
num += PERF_CPUM_CF_MAX_CTR;
|
|
if (cpum_sf_avail())
|
|
num += PERF_CPUM_SF_MAX_CTR;
|
|
|
|
return num;
|
|
}
|
|
EXPORT_SYMBOL(perf_num_counters);
|
|
|
|
static struct kvm_s390_sie_block *sie_block(struct pt_regs *regs)
|
|
{
|
|
struct stack_frame *stack = (struct stack_frame *) regs->gprs[15];
|
|
|
|
if (!stack)
|
|
return NULL;
|
|
|
|
return (struct kvm_s390_sie_block *) stack->empty1[0];
|
|
}
|
|
|
|
static bool is_in_guest(struct pt_regs *regs)
|
|
{
|
|
if (user_mode(regs))
|
|
return false;
|
|
#if IS_ENABLED(CONFIG_KVM)
|
|
return instruction_pointer(regs) == (unsigned long) &sie_exit;
|
|
#else
|
|
return false;
|
|
#endif
|
|
}
|
|
|
|
static unsigned long guest_is_user_mode(struct pt_regs *regs)
|
|
{
|
|
return sie_block(regs)->gpsw.mask & PSW_MASK_PSTATE;
|
|
}
|
|
|
|
static unsigned long instruction_pointer_guest(struct pt_regs *regs)
|
|
{
|
|
return sie_block(regs)->gpsw.addr;
|
|
}
|
|
|
|
/*
 * perf_instruction_pointer - instruction pointer to report for a sample
 *
 * Returns the guest instruction pointer when is_in_guest() holds for @regs,
 * and the regular instruction pointer of @regs otherwise.
 */
unsigned long perf_instruction_pointer(struct pt_regs *regs)
{
	if (is_in_guest(regs))
		return instruction_pointer_guest(regs);

	return instruction_pointer(regs);
}
|
|
|
|
static unsigned long perf_misc_guest_flags(struct pt_regs *regs)
|
|
{
|
|
return guest_is_user_mode(regs) ? PERF_RECORD_MISC_GUEST_USER
|
|
: PERF_RECORD_MISC_GUEST_KERNEL;
|
|
}
|
|
|
|
static unsigned long perf_misc_flags_sf(struct pt_regs *regs)
|
|
{
|
|
struct perf_sf_sde_regs *sde_regs;
|
|
unsigned long flags;
|
|
|
|
sde_regs = (struct perf_sf_sde_regs *) ®s->int_parm_long;
|
|
if (sde_regs->in_guest)
|
|
flags = user_mode(regs) ? PERF_RECORD_MISC_GUEST_USER
|
|
: PERF_RECORD_MISC_GUEST_KERNEL;
|
|
else
|
|
flags = user_mode(regs) ? PERF_RECORD_MISC_USER
|
|
: PERF_RECORD_MISC_KERNEL;
|
|
return flags;
|
|
}
|
|
|
|
unsigned long perf_misc_flags(struct pt_regs *regs)
|
|
{
|
|
/* Check if the cpum_sf PMU has created the pt_regs structure.
|
|
* In this case, perf misc flags can be easily extracted. Otherwise,
|
|
* do regular checks on the pt_regs content.
|
|
*/
|
|
if (regs->int_code == 0x1407 && regs->int_parm == CPU_MF_INT_SF_PRA)
|
|
if (!regs->gprs[15])
|
|
return perf_misc_flags_sf(regs);
|
|
|
|
if (is_in_guest(regs))
|
|
return perf_misc_guest_flags(regs);
|
|
|
|
return user_mode(regs) ? PERF_RECORD_MISC_USER
|
|
: PERF_RECORD_MISC_KERNEL;
|
|
}
|
|
|
|
static void print_debug_cf(void)
|
|
{
|
|
struct cpumf_ctr_info cf_info;
|
|
int cpu = smp_processor_id();
|
|
|
|
memset(&cf_info, 0, sizeof(cf_info));
|
|
if (!qctri(&cf_info))
|
|
pr_info("CPU[%i] CPUM_CF: ver=%u.%u A=%04x E=%04x C=%04x\n",
|
|
cpu, cf_info.cfvn, cf_info.csvn,
|
|
cf_info.auth_ctl, cf_info.enable_ctl, cf_info.act_ctl);
|
|
}
|
|
|
|
static void print_debug_sf(void)
|
|
{
|
|
struct hws_qsi_info_block si;
|
|
int cpu = smp_processor_id();
|
|
|
|
memset(&si, 0, sizeof(si));
|
|
if (qsi(&si))
|
|
return;
|
|
|
|
pr_info("CPU[%i] CPUM_SF: basic=%i diag=%i min=%lu max=%lu cpu_speed=%u\n",
|
|
cpu, si.as, si.ad, si.min_sampl_rate, si.max_sampl_rate,
|
|
si.cpu_speed);
|
|
|
|
if (si.as)
|
|
pr_info("CPU[%i] CPUM_SF: Basic-sampling: a=%i e=%i c=%i"
|
|
" bsdes=%i tear=%016lx dear=%016lx\n", cpu,
|
|
si.as, si.es, si.cs, si.bsdes, si.tear, si.dear);
|
|
if (si.ad)
|
|
pr_info("CPU[%i] CPUM_SF: Diagnostic-sampling: a=%i e=%i c=%i"
|
|
" dsdes=%i tear=%016lx dear=%016lx\n", cpu,
|
|
si.ad, si.ed, si.cd, si.dsdes, si.tear, si.dear);
|
|
}
|
|
|
|
/*
 * perf_event_print_debug - log the state of the available CPU-MF facilities
 *
 * Runs with local interrupts disabled for the duration of the queries and
 * prints counter and/or sampling facility details, depending on which of
 * them is reported as available.
 */
void perf_event_print_debug(void)
{
	unsigned long irq_flags;

	local_irq_save(irq_flags);

	if (cpum_cf_avail())
		print_debug_cf();

	if (cpum_sf_avail())
		print_debug_sf();

	local_irq_restore(irq_flags);
}
|
|
|
|
/* Service level infrastructure */
|
|
static void sl_print_counter(struct seq_file *m)
|
|
{
|
|
struct cpumf_ctr_info ci;
|
|
|
|
memset(&ci, 0, sizeof(ci));
|
|
if (qctri(&ci))
|
|
return;
|
|
|
|
seq_printf(m, "CPU-MF: Counter facility: version=%u.%u "
|
|
"authorization=%04x\n", ci.cfvn, ci.csvn, ci.auth_ctl);
|
|
}
|
|
|
|
static void sl_print_sampling(struct seq_file *m)
|
|
{
|
|
struct hws_qsi_info_block si;
|
|
|
|
memset(&si, 0, sizeof(si));
|
|
if (qsi(&si))
|
|
return;
|
|
|
|
if (!si.as && !si.ad)
|
|
return;
|
|
|
|
seq_printf(m, "CPU-MF: Sampling facility: min_rate=%lu max_rate=%lu"
|
|
" cpu_speed=%u\n", si.min_sampl_rate, si.max_sampl_rate,
|
|
si.cpu_speed);
|
|
if (si.as)
|
|
seq_printf(m, "CPU-MF: Sampling facility: mode=basic"
|
|
" sample_size=%u\n", si.bsdes);
|
|
if (si.ad)
|
|
seq_printf(m, "CPU-MF: Sampling facility: mode=diagnostic"
|
|
" sample_size=%u\n", si.dsdes);
|
|
}
|
|
|
|
/*
 * seq_print hook of the perf service level: writes the counter facility
 * line and/or the sampling facility lines to @m, depending on which
 * facility is reported as available.  @sl is not used.
 */
static void service_level_perf_print(struct seq_file *m,
				     struct service_level *sl)
{
	if (cpum_cf_avail())
		sl_print_counter(m);

	if (cpum_sf_avail())
		sl_print_sampling(m);
}
|
|
|
|
static struct service_level service_level_perf = {
|
|
.seq_print = service_level_perf_print,
|
|
};
|
|
|
|
/*
 * Register the perf service level entry; run as an arch_initcall.
 * Returns whatever register_service_level() returns.
 */
static int __init service_level_perf_register(void)
{
	int rc = register_service_level(&service_level_perf);

	return rc;
}
arch_initcall(service_level_perf_register);
|
|
|
|
/* See also arch/s390/kernel/traps.c */
|
|
static unsigned long __store_trace(struct perf_callchain_entry *entry,
|
|
unsigned long sp,
|
|
unsigned long low, unsigned long high)
|
|
{
|
|
struct stack_frame *sf;
|
|
struct pt_regs *regs;
|
|
|
|
while (1) {
|
|
if (sp < low || sp > high - sizeof(*sf))
|
|
return sp;
|
|
sf = (struct stack_frame *) sp;
|
|
perf_callchain_store(entry, sf->gprs[8]);
|
|
/* Follow the backchain. */
|
|
while (1) {
|
|
low = sp;
|
|
sp = sf->back_chain;
|
|
if (!sp)
|
|
break;
|
|
if (sp <= low || sp > high - sizeof(*sf))
|
|
return sp;
|
|
sf = (struct stack_frame *) sp;
|
|
perf_callchain_store(entry, sf->gprs[8]);
|
|
}
|
|
/* Zero backchain detected, check for interrupt frame. */
|
|
sp = (unsigned long) (sf + 1);
|
|
if (sp <= low || sp > high - sizeof(*regs))
|
|
return sp;
|
|
regs = (struct pt_regs *) sp;
|
|
perf_callchain_store(entry, sf->gprs[8]);
|
|
low = sp;
|
|
sp = regs->gprs[15];
|
|
}
|
|
}
|
|
|
|
void perf_callchain_kernel(struct perf_callchain_entry *entry,
|
|
struct pt_regs *regs)
|
|
{
|
|
unsigned long head, frame_size;
|
|
struct stack_frame *head_sf;
|
|
|
|
if (user_mode(regs))
|
|
return;
|
|
|
|
frame_size = STACK_FRAME_OVERHEAD + sizeof(struct pt_regs);
|
|
head = regs->gprs[15];
|
|
head_sf = (struct stack_frame *) head;
|
|
|
|
if (!head_sf || !head_sf->back_chain)
|
|
return;
|
|
|
|
head = head_sf->back_chain;
|
|
head = __store_trace(entry, head,
|
|
S390_lowcore.async_stack + frame_size - ASYNC_SIZE,
|
|
S390_lowcore.async_stack + frame_size);
|
|
|
|
__store_trace(entry, head, S390_lowcore.thread_info,
|
|
S390_lowcore.thread_info + THREAD_SIZE);
|
|
}
|
|
|
|
/* Perf definitions for PMU event attributes in sysfs */
|
|
ssize_t cpumf_events_sysfs_show(struct device *dev,
|
|
struct device_attribute *attr, char *page)
|
|
{
|
|
struct perf_pmu_events_attr *pmu_attr;
|
|
|
|
pmu_attr = container_of(attr, struct perf_pmu_events_attr, attr);
|
|
return sprintf(page, "event=0x%04llx,name=%s\n",
|
|
pmu_attr->id, attr->attr.name);
|
|
}
|
|
|
|
/* Reserve/release functions for sharing perf hardware */
|
|
/* Protects perf_sampling_owner. */
static DEFINE_SPINLOCK(perf_hw_owner_lock);

/* Return address of the current reservation holder; NULL when unreserved. */
static void *perf_sampling_owner;
|
|
|
|
int perf_reserve_sampling(void)
|
|
{
|
|
int err;
|
|
|
|
err = 0;
|
|
spin_lock(&perf_hw_owner_lock);
|
|
if (perf_sampling_owner) {
|
|
pr_warn("The sampling facility is already reserved by %p\n",
|
|
perf_sampling_owner);
|
|
err = -EBUSY;
|
|
} else
|
|
perf_sampling_owner = __builtin_return_address(0);
|
|
spin_unlock(&perf_hw_owner_lock);
|
|
return err;
|
|
}
|
|
EXPORT_SYMBOL(perf_reserve_sampling);
|
|
|
|
void perf_release_sampling(void)
|
|
{
|
|
spin_lock(&perf_hw_owner_lock);
|
|
WARN_ON(!perf_sampling_owner);
|
|
perf_sampling_owner = NULL;
|
|
spin_unlock(&perf_hw_owner_lock);
|
|
}
|
|
EXPORT_SYMBOL(perf_release_sampling);
|