Hi Miquel, On 2025-04-03 2:39 AM, Miquel Raynal wrote: > It is very surprising that such an uclass, specifically designed to > handle resources that may be shared by different devices, is not keeping > the count of the number of times a power domain has been > enabled/disabled to avoid shutting it down unexpectedly or disabling it > several times. > > Doing this causes troubles on eg. i.MX8MP because disabling power > domains can be done in recursive loops were the same power domain > disabled up to 4 times in a row. PGCs seem to have tight FSM internal > timings to respect and it is easy to produce a race condition that puts > the power domains in an unstable state, leading to ADB400 errors and > later crashes in Linux. > > CI tests using power domains are slightly updated to make sure the count > of on/off calls is even and the results match what we *now* expect. > > As we do not want to break existing users while stile getting > interesting error codes, the implementation is split between: > - a low-level helper reporting error codes if the requested transition > could not be operated, > - a higher-level helper ignoring the "non error" codes, like EALREADY and > EBUSY. > > Signed-off-by: Miquel Raynal <miquel.ray...@bootlin.com> > --- > drivers/firmware/scmi/sandbox-scmi_devices.c | 1 + > drivers/power/domain/power-domain-uclass.c | 40 ++++++++++++++-- > drivers/power/domain/sandbox-power-domain-test.c | 1 + > include/power-domain.h | 60 > ++++++++++++++++++++---- > test/dm/power-domain.c | 2 +- > 5 files changed, 91 insertions(+), 13 deletions(-) > > diff --git a/drivers/firmware/scmi/sandbox-scmi_devices.c > b/drivers/firmware/scmi/sandbox-scmi_devices.c > index > 96c2922b067e2886b3fa963bcd7e396f4569a569..9f253b0fd40f703a5ec11d34c197423d27ad8b01 > 100644 > --- a/drivers/firmware/scmi/sandbox-scmi_devices.c > +++ b/drivers/firmware/scmi/sandbox-scmi_devices.c > @@ -163,4 +163,5 @@ U_BOOT_DRIVER(sandbox_scmi_devices) = { > .priv_auto = sizeof(struct sandbox_scmi_device_priv), > .remove = sandbox_scmi_devices_remove, > .probe = sandbox_scmi_devices_probe, > + .flags = DM_FLAG_DEFAULT_PD_CTRL_OFF, > }; > diff --git a/drivers/power/domain/power-domain-uclass.c > b/drivers/power/domain/power-domain-uclass.c > index > 938bd8cbc9ffd1ba2109d702f886b6a99288d063..a6e5f9ed0369eb9d2dfa66edc9e938bac6720dab > 100644 > --- a/drivers/power/domain/power-domain-uclass.c > +++ b/drivers/power/domain/power-domain-uclass.c > @@ -12,6 +12,10 @@ > #include <power-domain-uclass.h> > #include <dm/device-internal.h> > > +struct power_domain_priv { > + int on_count; > +}; > + > static inline struct power_domain_ops *power_domain_dev_ops(struct udevice > *dev) > { > return (struct power_domain_ops *)dev->driver->ops; > @@ -107,22 +111,49 @@ int power_domain_free(struct power_domain *power_domain) > return ops->rfree ? ops->rfree(power_domain) : 0; > } > > -int power_domain_on(struct power_domain *power_domain) > +int power_domain_on_lowlevel(struct power_domain *power_domain) > { > + struct power_domain_priv *priv = dev_get_uclass_priv(power_domain->dev); > struct power_domain_ops *ops = power_domain_dev_ops(power_domain->dev); > + int ret; > > debug("%s(power_domain=%p)\n", __func__, power_domain); > > - return ops->on ? ops->on(power_domain) : 0; > + if (priv->on_count++ > 0) > + return -EALREADY;
This change is broken for power domain providers with #power-domain-cells = <1>, which can have multiple domains per provider device. There would need to be a separate reference count per domain, and currently the uclass doesn't know the range of valid domain IDs. Regards, Samuel > + > + ret = ops->on ? ops->on(power_domain) : 0; > + if (ret) { > + priv->on_count--; > + return ret; > + } > + > + return 0; > } > > -int power_domain_off(struct power_domain *power_domain) > +int power_domain_off_lowlevel(struct power_domain *power_domain) > { > + struct power_domain_priv *priv = dev_get_uclass_priv(power_domain->dev); > struct power_domain_ops *ops = power_domain_dev_ops(power_domain->dev); > + int ret; > > debug("%s(power_domain=%p)\n", __func__, power_domain); > > - return ops->off ? ops->off(power_domain) : 0; > + if (priv->on_count <= 0) { > + debug("Power domain %s already off.\n", > power_domain->dev->name); > + return -EALREADY; > + } > + > + if (priv->on_count-- > 1) > + return -EBUSY; > + > + ret = ops->off ? ops->off(power_domain) : 0; > + if (ret) { > + priv->on_count++; > + return ret; > + } > + > + return 0; > } > > #if CONFIG_IS_ENABLED(OF_REAL) > @@ -180,4 +211,5 @@ int dev_power_domain_off(struct udevice *dev) > UCLASS_DRIVER(power_domain) = { > .id = UCLASS_POWER_DOMAIN, > .name = "power_domain", > + .per_device_auto = sizeof(struct power_domain_priv), > }; > diff --git a/drivers/power/domain/sandbox-power-domain-test.c > b/drivers/power/domain/sandbox-power-domain-test.c > index > 08c15ef342b3dd3ce01807ee59b7e97337f7dde5..5b530974e942ffcba453e53be330baaf3a113a13 > 100644 > --- a/drivers/power/domain/sandbox-power-domain-test.c > +++ b/drivers/power/domain/sandbox-power-domain-test.c > @@ -51,4 +51,5 @@ U_BOOT_DRIVER(sandbox_power_domain_test) = { > .id = UCLASS_MISC, > .of_match = sandbox_power_domain_test_ids, > .priv_auto = sizeof(struct sandbox_power_domain_test), > + .flags = DM_FLAG_DEFAULT_PD_CTRL_OFF, > }; > diff --git a/include/power-domain.h b/include/power-domain.h > index > 18525073e5e3534fcbac6fae4e18462f29a4dc49..ad33dea76ce5808beaa4fbf4388438a504e36027 > 100644 > --- a/include/power-domain.h > +++ b/include/power-domain.h > @@ -147,37 +147,81 @@ static inline int power_domain_free(struct power_domain > *power_domain) > #endif > > /** > - * power_domain_on - Enable power to a power domain. > + * power_domain_on_lowlevel - Enable power to a power domain (with > refcounting) > * > * @power_domain: A power domain struct that was previously successfully > * requested by power_domain_get(). > - * Return: 0 if OK, or a negative error code. > + * Return: 0 if the transition has been performed correctly, > + * -EALREADY if the domain is already on, > + * a negative error code otherwise. > */ > #if CONFIG_IS_ENABLED(POWER_DOMAIN) > -int power_domain_on(struct power_domain *power_domain); > +int power_domain_on_lowlevel(struct power_domain *power_domain); > #else > -static inline int power_domain_on(struct power_domain *power_domain) > +static inline int power_domain_on_lowlevel(struct power_domain *power_domain) > { > return -ENOSYS; > } > #endif > > /** > - * power_domain_off - Disable power to a power domain. > + * power_domain_on - Enable power to a power domain (ignores the actual state > + * of the power domain) > * > * @power_domain: A power domain struct that was previously successfully > * requested by power_domain_get(). > - * Return: 0 if OK, or a negative error code. > + * Return: a negative error code upon error during the transition, 0 > otherwise. > + */ > +static inline int power_domain_on(struct power_domain *power_domain) > +{ > + int ret; > + > + ret = power_domain_on_lowlevel(power_domain); > + if (ret == -EALREADY) > + ret = 0; > + > + return ret; > +} > + > +/** > + * power_domain_off_lowlevel - Disable power to a power domain (with > refcounting) > + * > + * @power_domain: A power domain struct that was previously successfully > + * requested by power_domain_get(). > + * Return: 0 if the transition has been performed correctly, > + * -EALREADY if the domain is already off, > + * -EBUSY if another device is keeping the domain on (but the > refcounter > + * is decremented), > + * a negative error code otherwise. > */ > #if CONFIG_IS_ENABLED(POWER_DOMAIN) > -int power_domain_off(struct power_domain *power_domain); > +int power_domain_off_lowlevel(struct power_domain *power_domain); > #else > -static inline int power_domain_off(struct power_domain *power_domain) > +static inline int power_domain_off_lowlevel(struct power_domain > *power_domain) > { > return -ENOSYS; > } > #endif > > +/** > + * power_domain_off - Disable power to a power domain (ignores the actual > state > + * of the power domain) > + * > + * @power_domain: A power domain struct that was previously successfully > + * requested by power_domain_get(). > + * Return: a negative error code upon error during the transition, 0 > otherwise. > + */ > +static inline int power_domain_off(struct power_domain *power_domain) > +{ > + int ret; > + > + ret = power_domain_off_lowlevel(power_domain); > + if (ret == -EALREADY || ret == -EBUSY) > + ret = 0; > + > + return ret; > +} > + > /** > * dev_power_domain_on - Enable power domains for a device . > * > diff --git a/test/dm/power-domain.c b/test/dm/power-domain.c > index > 896cf5b2ae9d26701150fad70e888f8b135a22b0..8a95f6bdb903be9d1993528d87d5cae0075a83e4 > 100644 > --- a/test/dm/power-domain.c > +++ b/test/dm/power-domain.c > @@ -27,7 +27,7 @@ static int dm_test_power_domain(struct unit_test_state *uts) > > ut_assertok(uclass_get_device_by_name(UCLASS_MISC, "power-domain-test", > &dev_test)); > - ut_asserteq(1, sandbox_power_domain_query(dev_power_domain, > + ut_asserteq(0, sandbox_power_domain_query(dev_power_domain, > TEST_POWER_DOMAIN)); > ut_assertok(sandbox_power_domain_test_get(dev_test)); > >