Tony Jones ad5999
From: Kan Liang <kan.liang@linux.intel.com>
Tony Jones ad5999
Date: Wed, 29 Jun 2022 08:08:40 -0700
Tony Jones ad5999
Subject: perf/x86/intel: Fix PEBS data source encoding for ADL
Tony Jones ad5999
Git-commit: ccf170e9d8fdacfe435bbe3749c897c7d86d32f8
Tony Jones ad5999
Patch-mainline: v6.0-rc1
Tony Jones 700454
References: jsc#PED-1063, jsc#PED-1752
Tony Jones ad5999
Tony Jones ad5999
The PEBS data source encoding for the e-core is different from the
Tony Jones ad5999
p-core.
Tony Jones ad5999
Tony Jones ad5999
Add pebs_data_source[] to struct x86_hybrid_pmu to store the
Tony Jones ad5999
data source encoding for each core type.
Tony Jones ad5999
Tony Jones ad5999
Add intel_pmu_pebs_data_source_grt() for the e-core.
Tony Jones ad5999
Nothing changes for the data source encoding of the p-core,
Tony Jones ad5999
which still reuses intel_pmu_pebs_data_source_skl().
Tony Jones ad5999
Tony Jones ad5999
Fixes: f83d2f91d259 ("perf/x86/intel: Add Alder Lake Hybrid support")
Tony Jones ad5999
Signed-off-by: Kan Liang <kan.liang@linux.intel.com>
Tony Jones ad5999
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Tony Jones ad5999
Reviewed-by: Andi Kleen <ak@linux.intel.com>
Tony Jones ad5999
Link: https://lkml.kernel.org/r/20220629150840.2235741-2-kan.liang@linux.intel.com
Tony Jones ad5999
Tony Jones ad5999
Signed-off-by: Tony Jones <tonyj@suse.de>
Tony Jones ad5999
---
Tony Jones ad5999
 arch/x86/events/intel/core.c |  2 +-
Tony Jones ad5999
 arch/x86/events/intel/ds.c   | 51 +++++++++++++++++++++++++++++++++-----------
Tony Jones ad5999
 arch/x86/events/perf_event.h |  6 ++++++
Tony Jones ad5999
 3 files changed, 45 insertions(+), 14 deletions(-)
Tony Jones ad5999
Tony Jones ad5999
diff --git a/arch/x86/events/intel/core.c b/arch/x86/events/intel/core.c
Tony Jones ad5999
index 07d4a5f20321..bd8b98857609 100644
Tony Jones ad5999
--- a/arch/x86/events/intel/core.c
Tony Jones ad5999
+++ b/arch/x86/events/intel/core.c
Tony Jones ad5999
@@ -6241,7 +6241,7 @@ __init int intel_pmu_init(void)
Tony Jones ad5999
 		x86_pmu.flags |= PMU_FL_INSTR_LATENCY;
Tony Jones ad5999
 		x86_pmu.flags |= PMU_FL_MEM_LOADS_AUX;
Tony Jones ad5999
 		x86_pmu.lbr_pt_coexist = true;
Tony Jones ad5999
-		intel_pmu_pebs_data_source_skl(false);
Tony Jones ad5999
+		intel_pmu_pebs_data_source_adl();
Tony Jones ad5999
 		x86_pmu.pebs_latency_data = adl_latency_data_small;
Tony Jones ad5999
 		x86_pmu.num_topdown_events = 8;
Tony Jones ad5999
 		x86_pmu.update_topdown_event = adl_update_topdown_event;
Tony Jones ad5999
diff --git a/arch/x86/events/intel/ds.c b/arch/x86/events/intel/ds.c
Tony Jones ad5999
index de84385de414..ba60427caa6d 100644
Tony Jones ad5999
--- a/arch/x86/events/intel/ds.c
Tony Jones ad5999
+++ b/arch/x86/events/intel/ds.c
Tony Jones ad5999
@@ -94,15 +94,40 @@ void __init intel_pmu_pebs_data_source_nhm(void)
Tony Jones ad5999
 	pebs_data_source[0x07] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HITM);
Tony Jones ad5999
 }
Tony Jones ad5999
 
Tony Jones ad5999
-void __init intel_pmu_pebs_data_source_skl(bool pmem)
Tony Jones ad5999
+static void __init __intel_pmu_pebs_data_source_skl(bool pmem, u64 *data_source)
Tony Jones ad5999
 {
Tony Jones ad5999
 	u64 pmem_or_l4 = pmem ? LEVEL(PMEM) : LEVEL(L4);
Tony Jones ad5999
 
Tony Jones ad5999
-	pebs_data_source[0x08] = OP_LH | pmem_or_l4 | P(SNOOP, HIT);
Tony Jones ad5999
-	pebs_data_source[0x09] = OP_LH | pmem_or_l4 | REM | P(SNOOP, HIT);
Tony Jones ad5999
-	pebs_data_source[0x0b] = OP_LH | LEVEL(RAM) | REM | P(SNOOP, NONE);
Tony Jones ad5999
-	pebs_data_source[0x0c] = OP_LH | LEVEL(ANY_CACHE) | REM | P(SNOOPX, FWD);
Tony Jones ad5999
-	pebs_data_source[0x0d] = OP_LH | LEVEL(ANY_CACHE) | REM | P(SNOOP, HITM);
Tony Jones ad5999
+	data_source[0x08] = OP_LH | pmem_or_l4 | P(SNOOP, HIT);
Tony Jones ad5999
+	data_source[0x09] = OP_LH | pmem_or_l4 | REM | P(SNOOP, HIT);
Tony Jones ad5999
+	data_source[0x0b] = OP_LH | LEVEL(RAM) | REM | P(SNOOP, NONE);
Tony Jones ad5999
+	data_source[0x0c] = OP_LH | LEVEL(ANY_CACHE) | REM | P(SNOOPX, FWD);
Tony Jones ad5999
+	data_source[0x0d] = OP_LH | LEVEL(ANY_CACHE) | REM | P(SNOOP, HITM);
Tony Jones ad5999
+}
Tony Jones ad5999
+
Tony Jones ad5999
+void __init intel_pmu_pebs_data_source_skl(bool pmem)
Tony Jones ad5999
+{
Tony Jones ad5999
+	__intel_pmu_pebs_data_source_skl(pmem, pebs_data_source);
Tony Jones ad5999
+}
Tony Jones ad5999
+
Tony Jones ad5999
+static void __init intel_pmu_pebs_data_source_grt(u64 *data_source)
Tony Jones ad5999
+{
Tony Jones ad5999
+	data_source[0x05] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HIT);
Tony Jones ad5999
+	data_source[0x06] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOP, HITM);
Tony Jones ad5999
+	data_source[0x08] = OP_LH | P(LVL, L3) | LEVEL(L3) | P(SNOOPX, FWD);
Tony Jones ad5999
+}
Tony Jones ad5999
+
Tony Jones ad5999
+void __init intel_pmu_pebs_data_source_adl(void)
Tony Jones ad5999
+{
Tony Jones ad5999
+	u64 *data_source;
Tony Jones ad5999
+
Tony Jones ad5999
+	data_source = x86_pmu.hybrid_pmu[X86_HYBRID_PMU_CORE_IDX].pebs_data_source;
Tony Jones ad5999
+	memcpy(data_source, pebs_data_source, sizeof(pebs_data_source));
Tony Jones ad5999
+	__intel_pmu_pebs_data_source_skl(false, data_source);
Tony Jones ad5999
+
Tony Jones ad5999
+	data_source = x86_pmu.hybrid_pmu[X86_HYBRID_PMU_ATOM_IDX].pebs_data_source;
Tony Jones ad5999
+	memcpy(data_source, pebs_data_source, sizeof(pebs_data_source));
Tony Jones ad5999
+	intel_pmu_pebs_data_source_grt(data_source);
Tony Jones ad5999
 }
Tony Jones ad5999
 
Tony Jones ad5999
 static u64 precise_store_data(u64 status)
Tony Jones ad5999
@@ -198,7 +223,7 @@ u64 adl_latency_data_small(struct perf_event *event, u64 status)
Tony Jones ad5999
 
Tony Jones ad5999
 	dse.val = status;
Tony Jones ad5999
 
Tony Jones ad5999
-	val = pebs_data_source[dse.ld_dse];
Tony Jones ad5999
+	val = hybrid_var(event->pmu, pebs_data_source)[dse.ld_dse];
Tony Jones ad5999
 
Tony Jones ad5999
 	/*
Tony Jones ad5999
 	 * For the atom core on ADL,
Tony Jones ad5999
@@ -214,7 +239,7 @@ u64 adl_latency_data_small(struct perf_event *event, u64 status)
Tony Jones ad5999
 	return val;
Tony Jones ad5999
 }
Tony Jones ad5999
 
Tony Jones ad5999
-static u64 load_latency_data(u64 status)
Tony Jones ad5999
+static u64 load_latency_data(struct perf_event *event, u64 status)
Tony Jones ad5999
 {
Tony Jones ad5999
 	union intel_x86_pebs_dse dse;
Tony Jones ad5999
 	u64 val;
Tony Jones ad5999
@@ -224,7 +249,7 @@ static u64 load_latency_data(u64 status)
Tony Jones ad5999
 	/*
Tony Jones ad5999
 	 * use the mapping table for bit 0-3
Tony Jones ad5999
 	 */
Tony Jones ad5999
-	val = pebs_data_source[dse.ld_dse];
Tony Jones ad5999
+	val = hybrid_var(event->pmu, pebs_data_source)[dse.ld_dse];
Tony Jones ad5999
 
Tony Jones ad5999
 	/*
Tony Jones ad5999
 	 * Nehalem models do not support TLB, Lock infos
Tony Jones ad5999
@@ -263,7 +288,7 @@ static u64 load_latency_data(u64 status)
Tony Jones ad5999
 	return val;
Tony Jones ad5999
 }
Tony Jones ad5999
 
Tony Jones ad5999
-static u64 store_latency_data(u64 status)
Tony Jones ad5999
+static u64 store_latency_data(struct perf_event *event, u64 status)
Tony Jones ad5999
 {
Tony Jones ad5999
 	union intel_x86_pebs_dse dse;
Tony Jones ad5999
 	u64 val;
Tony Jones ad5999
@@ -273,7 +298,7 @@ static u64 store_latency_data(u64 status)
Tony Jones ad5999
 	/*
Tony Jones ad5999
 	 * use the mapping table for bit 0-3
Tony Jones ad5999
 	 */
Tony Jones ad5999
-	val = pebs_data_source[dse.st_lat_dse];
Tony Jones ad5999
+	val = hybrid_var(event->pmu, pebs_data_source)[dse.st_lat_dse];
Tony Jones ad5999
 
Tony Jones ad5999
 	pebs_set_tlb_lock(&val, dse.st_lat_stlb_miss, dse.st_lat_locked);
Tony Jones ad5999
 
Tony Jones ad5999
@@ -1459,9 +1484,9 @@ static u64 get_data_src(struct perf_event *event, u64 aux)
Tony Jones ad5999
 	bool fst = fl & (PERF_X86_EVENT_PEBS_ST | PERF_X86_EVENT_PEBS_HSW_PREC);
Tony Jones ad5999
 
Tony Jones ad5999
 	if (fl & PERF_X86_EVENT_PEBS_LDLAT)
Tony Jones ad5999
-		val = load_latency_data(aux);
Tony Jones ad5999
+		val = load_latency_data(event, aux);
Tony Jones ad5999
 	else if (fl & PERF_X86_EVENT_PEBS_STLAT)
Tony Jones ad5999
-		val = store_latency_data(aux);
Tony Jones ad5999
+		val = store_latency_data(event, aux);
Tony Jones ad5999
 	else if (fl & PERF_X86_EVENT_PEBS_LAT_HYBRID)
Tony Jones ad5999
 		val = x86_pmu.pebs_latency_data(event, aux);
Tony Jones ad5999
 	else if (fst && (fl & PERF_X86_EVENT_PEBS_HSW_PREC))
Tony Jones ad5999
diff --git a/arch/x86/events/perf_event.h b/arch/x86/events/perf_event.h
Tony Jones ad5999
index 2d11445e158c..ca2f8bfe6ff1 100644
Tony Jones ad5999
--- a/arch/x86/events/perf_event.h
Tony Jones ad5999
+++ b/arch/x86/events/perf_event.h
Tony Jones ad5999
@@ -644,6 +644,8 @@ enum {
Tony Jones ad5999
 	x86_lbr_exclusive_max,
Tony Jones ad5999
 };
Tony Jones ad5999
 
Tony Jones ad5999
+#define PERF_PEBS_DATA_SOURCE_MAX	0x10
Tony Jones ad5999
+
Tony Jones ad5999
 struct x86_hybrid_pmu {
Tony Jones ad5999
 	struct pmu			pmu;
Tony Jones ad5999
 	const char			*name;
Tony Jones ad5999
@@ -671,6 +673,8 @@ struct x86_hybrid_pmu {
Tony Jones ad5999
 	unsigned int			late_ack	:1,
Tony Jones ad5999
 					mid_ack		:1,
Tony Jones ad5999
 					enabled_ack	:1;
Tony Jones ad5999
+
Tony Jones ad5999
+	u64				pebs_data_source[PERF_PEBS_DATA_SOURCE_MAX];
Tony Jones ad5999
 };
Tony Jones ad5999
 
Tony Jones ad5999
 static __always_inline struct x86_hybrid_pmu *hybrid_pmu(struct pmu *pmu)
Tony Jones ad5999
@@ -1508,6 +1512,8 @@ void intel_pmu_pebs_data_source_nhm(void);
Tony Jones ad5999
 
Tony Jones ad5999
 void intel_pmu_pebs_data_source_skl(bool pmem);
Tony Jones ad5999
 
Tony Jones ad5999
+void intel_pmu_pebs_data_source_adl(void);
Tony Jones ad5999
+
Tony Jones ad5999
 int intel_pmu_setup_lbr_filter(struct perf_event *event);
Tony Jones ad5999
 
Tony Jones ad5999
 void intel_pt_interrupt(void);
Tony Jones ad5999