On 7/15/25 11:04 AM, Smita Koralahalli wrote:
> Reworked from a patch by Alison Schofield <alison.schofi...@intel.com>
> 
> Previously, when CXL regions were created through autodiscovery and their
> resources overlapped with SOFT RESERVED ranges, the soft reserved resource
> remained in place after region teardown. This left the HPA range
> unavailable for reuse even after the region was destroyed.
> 
> Enhance the logic to reliably remove SOFT RESERVED resources associated
> with a region, regardless of alignment or hierarchy in the iomem tree.
> 
> Link: https://lore.kernel.org/linux-cxl/29312c0765224ae76862d59a17748c8188fb95f1.1692638817.git.alison.schofi...@intel.com/
> Co-developed-by: Alison Schofield <alison.schofi...@intel.com>
> Signed-off-by: Alison Schofield <alison.schofi...@intel.com>
> Co-developed-by: Terry Bowman <terry.bow...@amd.com>
> Signed-off-by: Terry Bowman <terry.bow...@amd.com>
> Signed-off-by: Smita Koralahalli <smita.koralahallichannabasa...@amd.com>
> ---
>  drivers/cxl/acpi.c        |   2 +
>  drivers/cxl/core/region.c | 124 ++++++++++++++++++++++++++++++++++++++
>  drivers/cxl/cxl.h         |   2 +
>  include/linux/ioport.h    |   1 +
>  kernel/resource.c         |  34 +++++++++++
>  5 files changed, 163 insertions(+)
> 
> diff --git a/drivers/cxl/acpi.c b/drivers/cxl/acpi.c
> index 3a27289e669b..9eb8a9587dee 100644
> --- a/drivers/cxl/acpi.c
> +++ b/drivers/cxl/acpi.c
> @@ -829,6 +829,8 @@ static void cxl_softreserv_mem_work_fn(struct work_struct 
> *work)
>               pr_debug("Timeout waiting for cxl_mem probing");
>  
>       wait_for_device_probe();
> +
> +     cxl_region_softreserv_update();
>  }
>  static DECLARE_WORK(cxl_sr_work, cxl_softreserv_mem_work_fn);
>  
> diff --git a/drivers/cxl/core/region.c b/drivers/cxl/core/region.c
> index 6e5e1460068d..95951a1f1cab 100644
> --- a/drivers/cxl/core/region.c
> +++ b/drivers/cxl/core/region.c
> @@ -3486,6 +3486,130 @@ int cxl_add_to_region(struct cxl_endpoint_decoder 
> *cxled)
>  }
>  EXPORT_SYMBOL_NS_GPL(cxl_add_to_region, "CXL");
>  
> +static int add_soft_reserved(resource_size_t start, resource_size_t len,
> +                          unsigned long flags)
> +{
> +     struct resource *res = kzalloc(sizeof(*res), GFP_KERNEL);
> +     int rc;
> +
> +     if (!res)
> +             return -ENOMEM;
> +
> +     *res = DEFINE_RES_NAMED_DESC(start, len, "Soft Reserved",
> +                                  flags | IORESOURCE_MEM,
> +                                  IORES_DESC_SOFT_RESERVED);
> +
> +     rc = insert_resource(&iomem_resource, res);
> +     if (rc) {
> +             kfree(res);
> +             return rc;
> +     }
> +
> +     return 0;
> +}
> +
> +static void remove_soft_reserved(struct cxl_region *cxlr, struct resource 
> *soft,
> +                              resource_size_t start, resource_size_t end)
> +{
> +     struct cxl_root_decoder *cxlrd = to_cxl_root_decoder(cxlr->dev.parent);
> +     resource_size_t new_start, new_end;
> +     int rc;
> +
> +     guard(mutex)(&cxlrd->range_lock);
> +
> +     if (soft->start == start && soft->end == end) {
> +             /*
> +              * Exact alignment at both start and end. The entire region is
> +              * removed below.
> +              */
> +
> +     } else if (soft->start == start || soft->end == end) {
> +             /* Aligns at either resource start or end */
> +             if (soft->start == start) {
> +                     new_start = end + 1;
> +                     new_end = soft->end;
> +             } else {
> +                     new_start = soft->start;
> +                     new_end = start - 1;
> +             }
> +
> +             /*
> +              * Reuse original flags as the trimmed portion retains the same
> +              * memory type and access characteristics.
> +              */
> +             rc = add_soft_reserved(new_start, new_end - new_start + 1,
> +                                    soft->flags);
> +             if (rc)
> +                     dev_warn(&cxlr->dev,
> +                              "cannot add new soft reserved resource at 
> %pa\n",
> +                              &new_start);
> +
> +     } else {
> +             /* No alignment - Split into two new soft reserved regions */
> +             new_start = soft->start;
> +             new_end = soft->end;
> +
> +             rc = add_soft_reserved(new_start, start - new_start,
> +                                    soft->flags);
> +             if (rc)
> +                     dev_warn(&cxlr->dev,
> +                              "cannot add new soft reserved resource at 
> %pa\n",
> +                              &new_start);
> +
> +             rc = add_soft_reserved(end + 1, new_end - end, soft->flags);
> +             if (rc)
> +                     dev_warn(&cxlr->dev,
> +                              "cannot add new soft reserved resource at %pa 
> + 1\n",
> +                              &end);
> +     }
> +
> +     rc = remove_resource(soft);
> +     if (rc)
> +             dev_warn(&cxlr->dev, "cannot remove soft reserved resource 
> %pr\n",
> +                      soft);
> +}
> +
> +static int __cxl_region_softreserv_update(struct resource *soft,
> +                                       void *_cxlr)
> +{
> +     struct cxl_region *cxlr = _cxlr;
> +     struct resource *res = cxlr->params.res;
> +
> +     /* Skip non-intersecting soft-reserved regions */
> +     if (soft->end < res->start || soft->start > res->end)
> +             return 0;
> +
> +     soft = normalize_resource(soft);
> +     if (!soft)
> +             return -EINVAL;
> +
> +     remove_soft_reserved(cxlr, soft, res->start, res->end);
> +
> +     return 0;
> +}
> +
> +static int cxl_region_softreserv_update_cb(struct device *dev, void *data)
> +{
> +     struct cxl_region *cxlr;
> +
> +     if (!is_cxl_region(dev))
> +             return 0;
> +
> +     cxlr = to_cxl_region(dev);
> +
> +     walk_iomem_res_desc(IORES_DESC_SOFT_RESERVED, IORESOURCE_MEM, 0, -1,
> +                         cxlr, __cxl_region_softreserv_update);

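Shouldn't the return value of walk_iomem_res_desc() be checked here? The
callback, __cxl_region_softreserv_update(), can return -EINVAL when
normalize_resource() fails, and that error is silently dropped.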

> +
> +     return 0;
> +}
> +
> +void cxl_region_softreserv_update(void)
> +{
> +     bus_for_each_dev(&cxl_bus_type, NULL, NULL,
> +                      cxl_region_softreserv_update_cb);

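The return value of bus_for_each_dev() is not checked here either. Is it OK
to ignore all errors? Note that cxl_region_softreserv_update_cb() always
returns 0, so as written no failure can propagate out of this walk.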

> +}
> +EXPORT_SYMBOL_NS_GPL(cxl_region_softreserv_update, "CXL");
> +
>  u64 cxl_port_get_spa_cache_alias(struct cxl_port *endpoint, u64 spa)
>  {
>       struct cxl_region_ref *iter;
> diff --git a/drivers/cxl/cxl.h b/drivers/cxl/cxl.h
> index 3117136f0208..9f173467e497 100644
> --- a/drivers/cxl/cxl.h
> +++ b/drivers/cxl/cxl.h
> @@ -862,6 +862,7 @@ struct cxl_pmem_region *to_cxl_pmem_region(struct device 
> *dev);
>  int cxl_add_to_region(struct cxl_endpoint_decoder *cxled);
>  struct cxl_dax_region *to_cxl_dax_region(struct device *dev);
>  u64 cxl_port_get_spa_cache_alias(struct cxl_port *endpoint, u64 spa);
> +void cxl_region_softreserv_update(void);
>  #else
>  static inline bool is_cxl_pmem_region(struct device *dev)
>  {
> @@ -884,6 +885,7 @@ static inline u64 cxl_port_get_spa_cache_alias(struct 
> cxl_port *endpoint,
>  {
>       return 0;
>  }
> +static inline void cxl_region_softreserv_update(void) { }
>  #endif
>  
>  void cxl_endpoint_parse_cdat(struct cxl_port *port);
> diff --git a/include/linux/ioport.h b/include/linux/ioport.h
> index e8b2d6aa4013..8693e095d32b 100644
> --- a/include/linux/ioport.h
> +++ b/include/linux/ioport.h
> @@ -233,6 +233,7 @@ struct resource_constraint {
>  extern struct resource ioport_resource;
>  extern struct resource iomem_resource;
>  
> +extern struct resource *normalize_resource(struct resource *res);
>  extern struct resource *request_resource_conflict(struct resource *root, 
> struct resource *new);
>  extern int request_resource(struct resource *root, struct resource *new);
>  extern int release_resource(struct resource *new);
> diff --git a/kernel/resource.c b/kernel/resource.c
> index 8d3e6ed0bdc1..3d8dc2a59cb2 100644
> --- a/kernel/resource.c
> +++ b/kernel/resource.c
> @@ -50,6 +50,40 @@ EXPORT_SYMBOL(iomem_resource);
>  
>  static DEFINE_RWLOCK(resource_lock);
>  
> +/*
> + * normalize_resource
> + *
> + * The walk_iomem_res_desc() returns a copy of a resource, not a reference
> + * to the actual resource in the iomem_resource tree. As a result,
> + * __release_resource() which relies on pointer equality will fail.
> + *
> + * This helper walks the children of the resource's parent to find and
> + * return the original resource pointer that matches the given resource's
> + * start and end addresses.
> + *
> + * Return: Pointer to the matching original resource in iomem_resource, or
> + *         NULL if not found or invalid input.
> + */
> +struct resource *normalize_resource(struct resource *res)
> +{
> +     if (!res || !res->parent)
> +             return NULL;
> +
> +     read_lock(&resource_lock);

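May as well use a scoped guard here, for consistency with the guard() usage
elsewhere in this patch (e.g. guard(mutex) in remove_soft_reserved()). It
also lets both explicit read_unlock() calls below be dropped:
guard(read_lock)(&resource_lock);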

DJ

> +     for (struct resource *res_iter = res->parent->child; res_iter != NULL;
> +          res_iter = res_iter->sibling) {
> +             if ((res_iter->start == res->start) &&
> +                 (res_iter->end == res->end)) {
> +                     read_unlock(&resource_lock);
> +                     return res_iter;
> +             }
> +     }
> +
> +     read_unlock(&resource_lock);
> +     return NULL;
> +}
> +EXPORT_SYMBOL_NS_GPL(normalize_resource, "CXL");
> +
>  /*
>   * Return the next node of @p in pre-order tree traversal.  If
>   * @skip_children is true, skip the descendant nodes of @p in


Reply via email to