acpi/hmat / cxl: Add extended linear cache support for CXL
author Dave Jiang <dave.jiang@intel.com>
Wed, 26 Feb 2025 16:21:19 +0000 (09:21 -0700)
committer Dave Jiang <dave.jiang@intel.com>
Wed, 26 Feb 2025 20:45:22 +0000 (13:45 -0700)
The current CXL region size only reflects the size of the CXL memory
region and does not account for the extended linear cache size. Retrieve
the cache size from the HMAT and add it to the CXL region size for the
CXL region range that matches the SRAT range with extended linear cache
enabled.
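
For illustration, with hypothetical numbers: a proximity domain with
128GB of DRAM acting as an extended linear cache in front of 128GB of
CXL memory yields a 256GB region. A minimal userspace sketch of the
address math (not kernel code):

  #include <inttypes.h>
  #include <stdio.h>

  int main(void)
  {
          uint64_t cxl_start = 0x2080000000ULL;  /* CXL HPA start (hypothetical) */
          uint64_t cxl_size = 0x2000000000ULL;   /* 128GB of CXL memory */
          uint64_t cache_size = cxl_size;        /* 1:1 DRAM cache fronting it */

          /* The region start moves down over the cache and the size
           * grows by cache_size, covering DRAM cache plus CXL memory. */
          uint64_t region_start = cxl_start - cache_size;
          uint64_t region_size = cxl_size + cache_size;

          printf("region: [%#" PRIx64 "-%#" PRIx64 "] size %#" PRIx64 "\n",
                 region_start, region_start + region_size - 1, region_size);
          return 0;
  }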

The SRAT defines the whole memory range, which includes both the
extended linear cache and the CXL memory region. The new HMAT ECN/ECR to
the Memory Side Cache Information Structure defines the size of the
extended linear cache and is matched to the SRAT Memory Affinity
Structure by memory proximity domain. Add a helper to match the CXL
range to the SRAT memory range in order to retrieve the cache size.
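
The intended call flow, as a minimal kernel-style sketch (the actual
consumer is cxl_extended_linear_cache_resize() in the region.c hunk
below; query_elc() here is a hypothetical illustration):

  #include <linux/acpi.h>
  #include <linux/ioport.h>
  #include <linux/numa.h>

  /* Sketch: is @res fronted by an extended linear cache? */
  static int query_elc(struct resource *res, resource_size_t *cache_size)
  {
          /* SRAT proximity domain -> NUMA node of the backing range */
          int nid = phys_to_target_node(res->start);

          /* Returns 0 with *cache_size == 0 when no such cache exists */
          return hmat_get_extended_linear_cache_size(res, nid, cache_size);
  }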

There are several places that check the CXL region range against the
decoder range. Use the new helper to compare the two ranges while
accounting for the new cache size.
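
For example, the attach-time size check becomes the invariant below
(sketch with hypothetical numbers: two 64GB endpoint decoders plus a
128GB cache must equal a 256GB region):

  #include <assert.h>
  #include <stdint.h>

  int main(void)
  {
          uint64_t dpa_size = 0x1000000000ULL;    /* 64GB per endpoint decoder */
          int interleave_ways = 2;
          uint64_t cache_size = 0x2000000000ULL;  /* 128GB extended linear cache */
          uint64_t region_size = 0x4000000000ULL; /* 256GB region resource */

          /* The region resource must cover the interleave set plus the cache */
          assert(dpa_size * interleave_ways + cache_size == region_size);
          return 0;
  }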

Reviewed-by: Jonathan Cameron <Jonathan.Cameron@huawei.com>
Reviewed-by: Li Ming <ming.li@zohomail.com>
Reviewed-by: Alison Schofield <alison.schofield@intel.com>
Link: https://patch.msgid.link/20250226162224.3633792-3-dave.jiang@intel.com
Signed-off-by: Dave Jiang <dave.jiang@intel.com>
drivers/acpi/numa/hmat.c
drivers/cxl/core/Makefile
drivers/cxl/core/acpi.c [new file with mode: 0644]
drivers/cxl/core/core.h
drivers/cxl/core/region.c
drivers/cxl/cxl.h
include/linux/acpi.h
tools/testing/cxl/Kbuild

index 2630511937f523f1cb37e96927020ddad0ae886b..9d9052258e924e0cc3c47b0bd4772b1df67f3ed1 100644 (file)
@@ -108,6 +108,45 @@ static struct memory_target *find_mem_target(unsigned int mem_pxm)
        return NULL;
 }
 
+/**
+ * hmat_get_extended_linear_cache_size - Retrieve the extended linear cache size
+ * @backing_res: resource from the backing media
+ * @nid: node id for the memory region
+ * @cache_size: (Output) size of extended linear cache.
+ *
+ * Return: 0 on success. Errno on failure.
+ */
+int hmat_get_extended_linear_cache_size(struct resource *backing_res, int nid,
+                                       resource_size_t *cache_size)
+{
+       unsigned int pxm = node_to_pxm(nid);
+       struct memory_target *target;
+       struct target_cache *tcache;
+       struct resource *res;
+
+       target = find_mem_target(pxm);
+       if (!target)
+               return -ENOENT;
+
+       list_for_each_entry(tcache, &target->caches, node) {
+               if (tcache->cache_attrs.address_mode !=
+                               NODE_CACHE_ADDR_MODE_EXTENDED_LINEAR)
+                       continue;
+
+               res = &target->memregions;
+               if (!resource_contains(res, backing_res))
+                       continue;
+
+               *cache_size = tcache->cache_attrs.size;
+               return 0;
+       }
+
+       *cache_size = 0;
+       return 0;
+}
+EXPORT_SYMBOL_NS_GPL(hmat_get_extended_linear_cache_size, "CXL");
+
 static struct memory_target *acpi_find_genport_target(u32 uid)
 {
        struct memory_target *target;
index 9259bcc6773c804ccace2478c9f6f09267b48c9d..1a0c9c6ca8182dfa5fa715d1b86b795126a453c8 100644 (file)
@@ -14,5 +14,6 @@ cxl_core-y += pci.o
 cxl_core-y += hdm.o
 cxl_core-y += pmu.o
 cxl_core-y += cdat.o
+cxl_core-y += acpi.o
 cxl_core-$(CONFIG_TRACING) += trace.o
 cxl_core-$(CONFIG_CXL_REGION) += region.o
diff --git a/drivers/cxl/core/acpi.c b/drivers/cxl/core/acpi.c
new file mode 100644 (file)
index 0000000..f13b4da
--- /dev/null
@@ -0,0 +1,11 @@
+// SPDX-License-Identifier: GPL-2.0-only
+/* Copyright(c) 2024 Intel Corporation. All rights reserved. */
+#include <linux/acpi.h>
+#include "cxl.h"
+#include "core.h"
+
+int cxl_acpi_get_extended_linear_cache_size(struct resource *backing_res,
+                                           int nid, resource_size_t *size)
+{
+       return hmat_get_extended_linear_cache_size(backing_res, nid, size);
+}
index 800466f96a68517f0c6930faa555b347cf0e156b..0fb779b612d14d42c4ed68cbda48a9a20c7922ac 100644 (file)
@@ -115,4 +115,7 @@ bool cxl_need_node_perf_attrs_update(int nid);
 int cxl_port_get_switch_dport_bandwidth(struct cxl_port *port,
                                        struct access_coordinate *c);
 
+int cxl_acpi_get_extended_linear_cache_size(struct resource *backing_res,
+                                           int nid, resource_size_t *size);
+
 #endif /* __CXL_CORE_H__ */
index e8d11a988fd926a81e9eae993c2fe42d8e625787..69af651a8f466c9ea3e7c6023ca52ae7df72545c 100644 (file)
@@ -824,6 +824,21 @@ static int match_free_decoder(struct device *dev, const void *data)
        return 1;
 }
 
+static bool region_res_match_cxl_range(const struct cxl_region_params *p,
+                                      struct range *range)
+{
+       if (!p->res)
+               return false;
+
+       /*
+        * In an extended linear cache region, the CXL range is assumed to be
+        * fronted by the DRAM range in the current known implementation.
+        * This assumption holds until a variant implementation exists.
+        */
+       return p->res->start + p->cache_size == range->start &&
+               p->res->end == range->end;
+}
+
 static int match_auto_decoder(struct device *dev, const void *data)
 {
        const struct cxl_region_params *p = data;
@@ -836,7 +851,7 @@ static int match_auto_decoder(struct device *dev, const void *data)
        cxld = to_cxl_decoder(dev);
        r = &cxld->hpa_range;
 
-       if (p->res && p->res->start == r->start && p->res->end == r->end)
+       if (region_res_match_cxl_range(p, r))
                return 1;
 
        return 0;
@@ -1424,8 +1439,7 @@ static int cxl_port_setup_targets(struct cxl_port *port,
        if (test_bit(CXL_REGION_F_AUTO, &cxlr->flags)) {
                if (cxld->interleave_ways != iw ||
                    cxld->interleave_granularity != ig ||
-                   cxld->hpa_range.start != p->res->start ||
-                   cxld->hpa_range.end != p->res->end ||
+                   !region_res_match_cxl_range(p, &cxld->hpa_range) ||
                    ((cxld->flags & CXL_DECODER_F_ENABLE) == 0)) {
                        dev_err(&cxlr->dev,
                                "%s:%s %s expected iw: %d ig: %d %pr\n",
@@ -1951,13 +1965,13 @@ static int cxl_region_attach(struct cxl_region *cxlr,
                return -ENXIO;
        }
 
-       if (resource_size(cxled->dpa_res) * p->interleave_ways !=
+       if (resource_size(cxled->dpa_res) * p->interleave_ways + p->cache_size !=
            resource_size(p->res)) {
                dev_dbg(&cxlr->dev,
-                       "%s:%s: decoder-size-%#llx * ways-%d != region-size-%#llx\n",
+                       "%s:%s-size-%#llx * ways-%d + cache-%#llx != region-size-%#llx\n",
                        dev_name(&cxlmd->dev), dev_name(&cxled->cxld.dev),
                        (u64)resource_size(cxled->dpa_res), p->interleave_ways,
-                       (u64)resource_size(p->res));
+                       (u64)p->cache_size, (u64)resource_size(p->res));
                return -EINVAL;
        }
 
@@ -2921,7 +2935,7 @@ u64 cxl_dpa_to_hpa(struct cxl_region *cxlr, const struct cxl_memdev *cxlmd,
        hpa_offset |= dpa_offset & GENMASK_ULL(eig + 7, 0);
 
        /* Apply the hpa_offset to the region base address */
-       hpa = hpa_offset + p->res->start;
+       hpa = hpa_offset + p->res->start + p->cache_size;
 
        /* Root decoder translation overrides typical modulo decode */
        if (cxlrd->hpa_to_spa)
@@ -3224,6 +3238,52 @@ static int match_region_by_range(struct device *dev, const void *data)
        return rc;
 }
 
+static int cxl_extended_linear_cache_resize(struct cxl_region *cxlr,
+                                           struct resource *res)
+{
+       struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(cxlr->dev.parent);
+       struct cxl_region_params *p = &cxlr->params;
+       int nid = phys_to_target_node(res->start);
+       resource_size_t size, cache_size, start;
+       int rc;
+
+       size = resource_size(res);
+       if (!size)
+               return -EINVAL;
+
+       rc = cxl_acpi_get_extended_linear_cache_size(res, nid, &cache_size);
+       if (rc)
+               return rc;
+
+       if (!cache_size)
+               return 0;
+
+       if (size != cache_size) {
+               dev_warn(&cxlr->dev,
+                        "Extended Linear Cache size %pa != CXL size %pa. No Support!",
+                        &cache_size, &size);
+               return -EOPNOTSUPP;
+       }
+       }
+
+       /*
+        * Move the start of the range to where the cache range starts. The
+        * implementation assumes that the cache range is in front of the
+        * CXL range. This is not dictated by the HMAT spec but is how the
+        * current known implementation is configured.
+        *
+        * The cache range is expected to be within the CFMWS. The adjusted
+        * res->start should not be less than cxlrd->res->start.
+        */
+       start = res->start - cache_size;
+       if (start < cxlrd->res->start)
+               return -ENXIO;
+
+       res->start = start;
+       p->cache_size = cache_size;
+
+       return 0;
+}
+
 /* Establish an empty region covering the given HPA range */
 static struct cxl_region *construct_region(struct cxl_root_decoder *cxlrd,
                                           struct cxl_endpoint_decoder *cxled)
@@ -3270,6 +3330,18 @@ static struct cxl_region *construct_region(struct cxl_root_decoder *cxlrd,
 
        *res = DEFINE_RES_MEM_NAMED(hpa->start, range_len(hpa),
                                    dev_name(&cxlr->dev));
+
+       rc = cxl_extended_linear_cache_resize(cxlr, res);
+       if (rc) {
+               /*
+                * Failing to support extended linear cache region resize does
+                * not prevent the region from functioning. It only causes the
+                * cxl list tool to show an incorrect region size.
+                */
+               dev_warn(cxlmd->dev.parent,
+                        "Extended linear cache calculation failed.\n");
+       }
+
        rc = insert_resource(cxlrd->res, res);
        if (rc) {
                /*
index bbbaa0d0a67036c997e5f970cb8741e67fbb644a..7ee96867ac73d7d64198d66b5d0b40b42d681ec8 100644 (file)
@@ -493,6 +493,7 @@ enum cxl_config_state {
  * @res: allocated iomem capacity for this region
  * @targets: active ordered targets in current decoder configuration
  * @nr_targets: number of targets
+ * @cache_size: extended linear cache size if one exists, otherwise zero.
  *
  * State transitions are protected by the cxl_region_rwsem
  */
@@ -504,6 +505,7 @@ struct cxl_region_params {
        struct resource *res;
        struct cxl_endpoint_decoder *targets[CXL_DECODER_MAX_INTERLEAVE];
        int nr_targets;
+       resource_size_t cache_size;
 };
 
 /*
index 4e495b29c640f05eecba77942ad1dc53f1b87c4b..cbd933504dbf36588f42cd35a7bf0781dc676dc8 100644 (file)
@@ -1095,6 +1095,17 @@ static inline acpi_handle acpi_get_processor_handle(int cpu)
 
 #endif /* !CONFIG_ACPI */
 
+#ifdef CONFIG_ACPI_HMAT
+int hmat_get_extended_linear_cache_size(struct resource *backing_res, int nid,
+                                       resource_size_t *size);
+#else
+static inline int hmat_get_extended_linear_cache_size(struct resource *backing_res,
+                                                     int nid, resource_size_t *size)
+{
+       return -EOPNOTSUPP;
+}
+#endif
+
 extern void arch_post_acpi_subsys_init(void);
 
 #ifdef CONFIG_ACPI_HOTPLUG_IOAPIC
index b1256fee3567fc7743812ee14bc46e09b7c8ba9b..1ae13987a8a230a4530e83e67de8b68488d67b25 100644 (file)
@@ -61,6 +61,7 @@ cxl_core-y += $(CXL_CORE_SRC)/pci.o
 cxl_core-y += $(CXL_CORE_SRC)/hdm.o
 cxl_core-y += $(CXL_CORE_SRC)/pmu.o
 cxl_core-y += $(CXL_CORE_SRC)/cdat.o
+cxl_core-y += $(CXL_CORE_SRC)/acpi.o
 cxl_core-$(CONFIG_TRACING) += $(CXL_CORE_SRC)/trace.o
 cxl_core-$(CONFIG_CXL_REGION) += $(CXL_CORE_SRC)/region.o
 cxl_core-y += config_check.o