]> www.infradead.org Git - nvme.git/commitdiff
perf/x86/intel: Add PMU support for ArrowLake-H
authorDapeng Mi <dapeng1.mi@linux.intel.com>
Tue, 20 Aug 2024 07:38:53 +0000 (07:38 +0000)
committerPeter Zijlstra <peterz@infradead.org>
Mon, 7 Oct 2024 07:28:43 +0000 (09:28 +0200)
ArrowLake-H contains 3 different uarchs, LionCove, Skymont and Crestmont.
It is different with previous hybrid processors which only contains two
kinds of uarchs.

This patch adds PMU support for ArrowLake-H processor, adds ARL-H
specific events which supports the 3 kinds of uarchs, such as
td_retiring_arl_h, and extends some existed format attributes like
offcore_rsp to make them be available to support ARL-H as well. Althrough
these format attributes like offcore_rsp have been extended to support
ARL-H, they can still support the regular hybrid platforms with 2 kinds
of uarchs since the helper hybrid_format_is_visible() would filter PMU
types and only show the format attribute for available PMUs.

Signed-off-by: Dapeng Mi <dapeng1.mi@linux.intel.com>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Reviewed-by: Kan Liang <kan.liang@linux.intel.com>
Tested-by: Yongwei Ma <yongwei.ma@intel.com>
Link: https://lkml.kernel.org/r/20240820073853.1974746-5-dapeng1.mi@linux.intel.com
arch/x86/events/intel/core.c
arch/x86/events/intel/ds.c
arch/x86/events/perf_event.h

index 6b9884ee96e993c12e81c05da096c7fad53dc211..7ca40002a19b81c70feb219c5604f033ce51aa0b 100644 (file)
@@ -4599,6 +4599,28 @@ static inline bool erratum_hsw11(struct perf_event *event)
                X86_CONFIG(.event=0xc0, .umask=0x01);
 }
 
+static struct event_constraint *
+arl_h_get_event_constraints(struct cpu_hw_events *cpuc, int idx,
+                         struct perf_event *event)
+{
+       struct x86_hybrid_pmu *pmu = hybrid_pmu(event->pmu);
+
+       if (pmu->pmu_type == hybrid_tiny)
+               return cmt_get_event_constraints(cpuc, idx, event);
+
+       return mtl_get_event_constraints(cpuc, idx, event);
+}
+
+static int arl_h_hw_config(struct perf_event *event)
+{
+       struct x86_hybrid_pmu *pmu = hybrid_pmu(event->pmu);
+
+       if (pmu->pmu_type == hybrid_tiny)
+               return intel_pmu_hw_config(event);
+
+       return adl_hw_config(event);
+}
+
 /*
  * The HSW11 requires a period larger than 100 which is the same as the BDM11.
  * A minimum period of 128 is enforced as well for the INST_RETIRED.ALL.
@@ -5974,6 +5996,37 @@ static struct attribute *lnl_hybrid_events_attrs[] = {
        NULL
 };
 
+/* The event string must be in PMU IDX order. */
+EVENT_ATTR_STR_HYBRID(topdown-retiring,
+                     td_retiring_arl_h,
+                     "event=0xc2,umask=0x02;event=0x00,umask=0x80;event=0xc2,umask=0x0",
+                     hybrid_big_small_tiny);
+EVENT_ATTR_STR_HYBRID(topdown-bad-spec,
+                     td_bad_spec_arl_h,
+                     "event=0x73,umask=0x0;event=0x00,umask=0x81;event=0x73,umask=0x0",
+                     hybrid_big_small_tiny);
+EVENT_ATTR_STR_HYBRID(topdown-fe-bound,
+                     td_fe_bound_arl_h,
+                     "event=0x9c,umask=0x01;event=0x00,umask=0x82;event=0x71,umask=0x0",
+                     hybrid_big_small_tiny);
+EVENT_ATTR_STR_HYBRID(topdown-be-bound,
+                     td_be_bound_arl_h,
+                     "event=0xa4,umask=0x02;event=0x00,umask=0x83;event=0x74,umask=0x0",
+                     hybrid_big_small_tiny);
+
+static struct attribute *arl_h_hybrid_events_attrs[] = {
+       EVENT_PTR(slots_adl),
+       EVENT_PTR(td_retiring_arl_h),
+       EVENT_PTR(td_bad_spec_arl_h),
+       EVENT_PTR(td_fe_bound_arl_h),
+       EVENT_PTR(td_be_bound_arl_h),
+       EVENT_PTR(td_heavy_ops_adl),
+       EVENT_PTR(td_br_mis_adl),
+       EVENT_PTR(td_fetch_lat_adl),
+       EVENT_PTR(td_mem_bound_adl),
+       NULL,
+};
+
 /* Must be in IDX order */
 EVENT_ATTR_STR_HYBRID(mem-loads,     mem_ld_adl,     "event=0xd0,umask=0x5,ldlat=3;event=0xcd,umask=0x1,ldlat=3", hybrid_big_small);
 EVENT_ATTR_STR_HYBRID(mem-stores,    mem_st_adl,     "event=0xd0,umask=0x6;event=0xcd,umask=0x2",                 hybrid_big_small);
@@ -5992,6 +6045,21 @@ static struct attribute *mtl_hybrid_mem_attrs[] = {
        NULL
 };
 
+EVENT_ATTR_STR_HYBRID(mem-loads,
+                     mem_ld_arl_h,
+                     "event=0xd0,umask=0x5,ldlat=3;event=0xcd,umask=0x1,ldlat=3;event=0xd0,umask=0x5,ldlat=3",
+                     hybrid_big_small_tiny);
+EVENT_ATTR_STR_HYBRID(mem-stores,
+                     mem_st_arl_h,
+                     "event=0xd0,umask=0x6;event=0xcd,umask=0x2;event=0xd0,umask=0x6",
+                     hybrid_big_small_tiny);
+
+static struct attribute *arl_h_hybrid_mem_attrs[] = {
+       EVENT_PTR(mem_ld_arl_h),
+       EVENT_PTR(mem_st_arl_h),
+       NULL,
+};
+
 EVENT_ATTR_STR_HYBRID(tx-start,          tx_start_adl,          "event=0xc9,umask=0x1",          hybrid_big);
 EVENT_ATTR_STR_HYBRID(tx-commit,         tx_commit_adl,         "event=0xc9,umask=0x2",          hybrid_big);
 EVENT_ATTR_STR_HYBRID(tx-abort,          tx_abort_adl,          "event=0xc9,umask=0x4",          hybrid_big);
@@ -6015,8 +6083,8 @@ static struct attribute *adl_hybrid_tsx_attrs[] = {
 
 FORMAT_ATTR_HYBRID(in_tx,       hybrid_big);
 FORMAT_ATTR_HYBRID(in_tx_cp,    hybrid_big);
-FORMAT_ATTR_HYBRID(offcore_rsp, hybrid_big_small);
-FORMAT_ATTR_HYBRID(ldlat,       hybrid_big_small);
+FORMAT_ATTR_HYBRID(offcore_rsp, hybrid_big_small_tiny);
+FORMAT_ATTR_HYBRID(ldlat,       hybrid_big_small_tiny);
 FORMAT_ATTR_HYBRID(frontend,    hybrid_big);
 
 #define ADL_HYBRID_RTM_FORMAT_ATTR     \
@@ -6039,7 +6107,7 @@ static struct attribute *adl_hybrid_extra_attr[] = {
        NULL
 };
 
-FORMAT_ATTR_HYBRID(snoop_rsp,  hybrid_small);
+FORMAT_ATTR_HYBRID(snoop_rsp,  hybrid_small_tiny);
 
 static struct attribute *mtl_hybrid_extra_attr_rtm[] = {
        ADL_HYBRID_RTM_FORMAT_ATTR,
@@ -7121,6 +7189,37 @@ __init int intel_pmu_init(void)
                name = "lunarlake_hybrid";
                break;
 
+       case INTEL_ARROWLAKE_H:
+               intel_pmu_init_hybrid(hybrid_big_small_tiny);
+
+               x86_pmu.pebs_latency_data = arl_h_latency_data;
+               x86_pmu.get_event_constraints = arl_h_get_event_constraints;
+               x86_pmu.hw_config = arl_h_hw_config;
+
+               td_attr = arl_h_hybrid_events_attrs;
+               mem_attr = arl_h_hybrid_mem_attrs;
+               tsx_attr = adl_hybrid_tsx_attrs;
+               extra_attr = boot_cpu_has(X86_FEATURE_RTM) ?
+                       mtl_hybrid_extra_attr_rtm : mtl_hybrid_extra_attr;
+
+               /* Initialize big core specific PerfMon capabilities. */
+               pmu = &x86_pmu.hybrid_pmu[X86_HYBRID_PMU_CORE_IDX];
+               intel_pmu_init_lnc(&pmu->pmu);
+
+               /* Initialize Atom core specific PerfMon capabilities. */
+               pmu = &x86_pmu.hybrid_pmu[X86_HYBRID_PMU_ATOM_IDX];
+               intel_pmu_init_skt(&pmu->pmu);
+
+               /* Initialize Lower Power Atom specific PerfMon capabilities. */
+               pmu = &x86_pmu.hybrid_pmu[X86_HYBRID_PMU_TINY_IDX];
+               intel_pmu_init_grt(&pmu->pmu);
+               pmu->extra_regs = intel_cmt_extra_regs;
+
+               intel_pmu_pebs_data_source_arl_h();
+               pr_cont("ArrowLake-H Hybrid events, ");
+               name = "arrowlake_h_hybrid";
+               break;
+
        default:
                switch (x86_pmu.version) {
                case 1:
index fa5ea65de0d0fa8b3974910a49c8526dc44de357..8afc4ad3cd16eb8039c75f89e5e44ead7db1fdb1 100644 (file)
@@ -177,6 +177,17 @@ void __init intel_pmu_pebs_data_source_mtl(void)
        __intel_pmu_pebs_data_source_cmt(data_source);
 }
 
+void __init intel_pmu_pebs_data_source_arl_h(void)
+{
+       u64 *data_source;
+
+       intel_pmu_pebs_data_source_lnl();
+
+       data_source = x86_pmu.hybrid_pmu[X86_HYBRID_PMU_TINY_IDX].pebs_data_source;
+       memcpy(data_source, pebs_data_source, sizeof(pebs_data_source));
+       __intel_pmu_pebs_data_source_cmt(data_source);
+}
+
 void __init intel_pmu_pebs_data_source_cmt(void)
 {
        __intel_pmu_pebs_data_source_cmt(pebs_data_source);
@@ -388,6 +399,16 @@ u64 lnl_latency_data(struct perf_event *event, u64 status)
        return lnc_latency_data(event, status);
 }
 
+u64 arl_h_latency_data(struct perf_event *event, u64 status)
+{
+       struct x86_hybrid_pmu *pmu = hybrid_pmu(event->pmu);
+
+       if (pmu->pmu_type == hybrid_tiny)
+               return cmt_latency_data(event, status);
+
+       return lnl_latency_data(event, status);
+}
+
 static u64 load_latency_data(struct perf_event *event, u64 status)
 {
        union intel_x86_pebs_dse dse;
index 909467d6d7edd4e7b1e4e0b6734f703e8137dfc1..82c6f45ce97552a175ab9ad047000fca0420dda8 100644 (file)
@@ -1592,6 +1592,8 @@ u64 cmt_latency_data(struct perf_event *event, u64 status);
 
 u64 lnl_latency_data(struct perf_event *event, u64 status);
 
+u64 arl_h_latency_data(struct perf_event *event, u64 status);
+
 extern struct event_constraint intel_core2_pebs_event_constraints[];
 
 extern struct event_constraint intel_atom_pebs_event_constraints[];
@@ -1711,6 +1713,8 @@ void intel_pmu_pebs_data_source_grt(void);
 
 void intel_pmu_pebs_data_source_mtl(void);
 
+void intel_pmu_pebs_data_source_arl_h(void);
+
 void intel_pmu_pebs_data_source_cmt(void);
 
 void intel_pmu_pebs_data_source_lnl(void);