perf arm-spe: Set sample's data source field
The sample structure contains the field 'data_src' which is used to tell the data operation attributions, e.g. operation type is loading or storing, cache level, it's snooping or remote accessing, etc. At the end, the 'data_src' will be parsed by perf mem/c2c tools to display human readable strings. This patch is to fill the 'data_src' field in the synthesized samples base on different types. Currently perf tool can display statistics for L1/L2/L3 caches but it doesn't support the 'last level cache'. To fit to current implementation, 'data_src' field uses L3 cache for last level cache. Before this commit, perf mem report looks like this: # Samples: 75K of event 'l1d-miss' # Total weight : 75951 # Sort order : local_weight,mem,sym,dso,symbol_daddr,dso_daddr,snoop,tlb,locked # # Overhead Samples Local Weight Memory access Symbol Shared Object Data Symbol Data Object Snoop TLB access # ........ ....... ............ ............. ...................... ............. ...................... ........... ..... .......... # 81.56% 61945 0 N/A [.] 0x00000000000009d8 serial_c [.] 0000000000000000 [unknown] N/A N/A 18.44% 14003 0 N/A [.] 0x0000000000000828 serial_c [.] 0000000000000000 [unknown] N/A N/A Now on a system with Arm SPE, addresses and access types are displayed: # Samples: 75K of event 'l1d-miss' # Total weight : 75951 # Sort order : local_weight,mem,sym,dso,symbol_daddr,dso_daddr,snoop,tlb,locked # # Overhead Samples Local Weight Memory access Symbol Shared Object Data Symbol Data Object Snoop TLB access # ........ ....... ............ ............. ...................... ............. ...................... ........... ..... .......... # 0.43% 324 0 L1 miss [.] 0x00000000000009d8 serial_c [.] 0x0000ffff80794e00 anon N/A Walker hit 0.42% 322 0 L1 miss [.] 0x00000000000009d8 serial_c [.] 0x0000ffff80794580 anon N/A Walker hit Signed-off-by: Leo Yan <leo.yan@linaro.org> Reviewed-by: James Clark <james.clark@arm.com> Tested-by: James Clark <james.clark@arm.com> Cc: Adrian Hunter <adrian.hunter@intel.com> Cc: Alexander Shishkin <alexander.shishkin@linux.intel.com> Cc: Al Grant <al.grant@arm.com> Cc: Andre Przywara <andre.przywara@arm.com> Cc: Ingo Molnar <mingo@redhat.com> Cc: Jiri Olsa <jolsa@redhat.com> Cc: John Garry <john.garry@huawei.com> Cc: Mark Rutland <mark.rutland@arm.com> Cc: Mathieu Poirier <mathieu.poirier@linaro.org> Cc: Namhyung Kim <namhyung@kernel.org> Cc: Peter Zijlstra <peterz@infradead.org> Cc: Wei Li <liwei391@huawei.com> Cc: Will Deacon <will@kernel.org> Signed-off-by: James Clark <james.clark@arm.com> Link: https://lore.kernel.org/r/20210211133856.2137-6-james.clark@arm.com Signed-off-by: Arnaldo Carvalho de Melo <acme@redhat.com>
This commit is contained in:
parent
e55ed3423c
commit
a89dbc9b98
@ -261,7 +261,7 @@ arm_spe_deliver_synth_event(struct arm_spe *spe,
|
||||
}
|
||||
|
||||
static int arm_spe__synth_mem_sample(struct arm_spe_queue *speq,
|
||||
u64 spe_events_id)
|
||||
u64 spe_events_id, u64 data_src)
|
||||
{
|
||||
struct arm_spe *spe = speq->spe;
|
||||
struct arm_spe_record *record = &speq->decoder->record;
|
||||
@ -274,6 +274,7 @@ static int arm_spe__synth_mem_sample(struct arm_spe_queue *speq,
|
||||
sample.stream_id = spe_events_id;
|
||||
sample.addr = record->virt_addr;
|
||||
sample.phys_addr = record->phys_addr;
|
||||
sample.data_src = data_src;
|
||||
|
||||
return arm_spe_deliver_synth_event(spe, speq, event, &sample);
|
||||
}
|
||||
@ -307,21 +308,66 @@ static bool arm_spe__is_memory_event(enum arm_spe_sample_type type)
|
||||
return false;
|
||||
}
|
||||
|
||||
static u64 arm_spe__synth_data_source(const struct arm_spe_record *record)
|
||||
{
|
||||
union perf_mem_data_src data_src = { 0 };
|
||||
|
||||
if (record->op == ARM_SPE_LD)
|
||||
data_src.mem_op = PERF_MEM_OP_LOAD;
|
||||
else
|
||||
data_src.mem_op = PERF_MEM_OP_STORE;
|
||||
|
||||
if (record->type & (ARM_SPE_LLC_ACCESS | ARM_SPE_LLC_MISS)) {
|
||||
data_src.mem_lvl = PERF_MEM_LVL_L3;
|
||||
|
||||
if (record->type & ARM_SPE_LLC_MISS)
|
||||
data_src.mem_lvl |= PERF_MEM_LVL_MISS;
|
||||
else
|
||||
data_src.mem_lvl |= PERF_MEM_LVL_HIT;
|
||||
} else if (record->type & (ARM_SPE_L1D_ACCESS | ARM_SPE_L1D_MISS)) {
|
||||
data_src.mem_lvl = PERF_MEM_LVL_L1;
|
||||
|
||||
if (record->type & ARM_SPE_L1D_MISS)
|
||||
data_src.mem_lvl |= PERF_MEM_LVL_MISS;
|
||||
else
|
||||
data_src.mem_lvl |= PERF_MEM_LVL_HIT;
|
||||
}
|
||||
|
||||
if (record->type & ARM_SPE_REMOTE_ACCESS)
|
||||
data_src.mem_lvl |= PERF_MEM_LVL_REM_CCE1;
|
||||
|
||||
if (record->type & (ARM_SPE_TLB_ACCESS | ARM_SPE_TLB_MISS)) {
|
||||
data_src.mem_dtlb = PERF_MEM_TLB_WK;
|
||||
|
||||
if (record->type & ARM_SPE_TLB_MISS)
|
||||
data_src.mem_dtlb |= PERF_MEM_TLB_MISS;
|
||||
else
|
||||
data_src.mem_dtlb |= PERF_MEM_TLB_HIT;
|
||||
}
|
||||
|
||||
return data_src.val;
|
||||
}
|
||||
|
||||
static int arm_spe_sample(struct arm_spe_queue *speq)
|
||||
{
|
||||
const struct arm_spe_record *record = &speq->decoder->record;
|
||||
struct arm_spe *spe = speq->spe;
|
||||
u64 data_src;
|
||||
int err;
|
||||
|
||||
data_src = arm_spe__synth_data_source(record);
|
||||
|
||||
if (spe->sample_flc) {
|
||||
if (record->type & ARM_SPE_L1D_MISS) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->l1d_miss_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->l1d_miss_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
|
||||
if (record->type & ARM_SPE_L1D_ACCESS) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->l1d_access_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->l1d_access_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
@ -329,13 +375,15 @@ static int arm_spe_sample(struct arm_spe_queue *speq)
|
||||
|
||||
if (spe->sample_llc) {
|
||||
if (record->type & ARM_SPE_LLC_MISS) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->llc_miss_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->llc_miss_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
|
||||
if (record->type & ARM_SPE_LLC_ACCESS) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->llc_access_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->llc_access_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
@ -343,13 +391,15 @@ static int arm_spe_sample(struct arm_spe_queue *speq)
|
||||
|
||||
if (spe->sample_tlb) {
|
||||
if (record->type & ARM_SPE_TLB_MISS) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->tlb_miss_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->tlb_miss_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
|
||||
if (record->type & ARM_SPE_TLB_ACCESS) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->tlb_access_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->tlb_access_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
@ -363,13 +413,14 @@ static int arm_spe_sample(struct arm_spe_queue *speq)
|
||||
|
||||
if (spe->sample_remote_access &&
|
||||
(record->type & ARM_SPE_REMOTE_ACCESS)) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->remote_access_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->remote_access_id,
|
||||
data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
|
||||
if (spe->sample_memory && arm_spe__is_memory_event(record->type)) {
|
||||
err = arm_spe__synth_mem_sample(speq, spe->memory_id);
|
||||
err = arm_spe__synth_mem_sample(speq, spe->memory_id, data_src);
|
||||
if (err)
|
||||
return err;
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user