Re: [PATCH v2 1/2] devfreq: qcom: Add L2 Krait Cache devfreq scaling driver

From: Ansuel Smith
Date: Thu May 19 2022 - 20:52:45 EST


On Fri, May 20, 2022 at 10:11:16AM +0900, Chanwoo Choi wrote:
> Hi Ansuel,
>
>
> The 5.19-rc1 will support the cpu based scaling support[2]
> as your needed. So that if you use passive governor with CPUFREQ_PARENT_DEV,
> you can scale the cache frequency according to cpu frequency change.
>
> [1] https://patchwork.kernel.org/project/linux-pm/patch/3acd6c32-6e78-dfc2-3e45-84f69a7d5f36@xxxxxxxxxxx/
> [2] PM / devfreq: Add cpu based scaling support to passive governor
>
>
> Best Regards,
> Chanwoo Choi
>

Oh wow thanks a lot for this. Wonder if this is finally the right time
for a correct handling of cache scaling for krait. Will rework this and
send a new version with the new implementation!
Again thanks.

> On 9/30/20 1:29 AM, Ansuel Smith wrote:
> > Qcom L2 Krait CPUs use the generic cpufreq-dt driver and doesn't actually
> > scale the Cache frequency when the CPU frequency is changed. This
> > devfreq driver register with the cpu notifier and scale the Cache
> > based on the max Freq across all core as the CPU cache is shared across
> > all of them. If provided this also scale the voltage of the regulator
> > attached to the CPU cache. The scaling logic is based on the CPU freq
> > and the 3 scaling interval are set by the device dts.
> >
> > Signed-off-by: Ansuel Smith <ansuelsmth@xxxxxxxxx>
> > ---
> > v2:
> > * Change cpu-freq to qcom,cpu-freq
> > * Skip freq change if prev is the same target freq
> >
> > drivers/devfreq/Kconfig | 10 +
> > drivers/devfreq/Makefile | 1 +
> > drivers/devfreq/krait-cache-devfreq.c | 301 ++++++++++++++++++++++++++
> > 3 files changed, 312 insertions(+)
> > create mode 100644 drivers/devfreq/krait-cache-devfreq.c
> >
> > diff --git a/drivers/devfreq/Kconfig b/drivers/devfreq/Kconfig
> > index 37dc40d1fcfb..99051aaf9c5e 100644
> > --- a/drivers/devfreq/Kconfig
> > +++ b/drivers/devfreq/Kconfig
> > @@ -143,6 +143,16 @@ config ARM_RK3399_DMC_DEVFREQ
> > It sets the frequency for the memory controller and reads the usage counts
> > from hardware.
> >
> > +config ARM_KRAIT_CACHE_DEVFREQ
> > + tristate "Scaling support for Krait CPU Cache Devfreq"
> > + depends on ARCH_QCOM || COMPILE_TEST
> > + help
> > + This adds the DEVFREQ driver for the Krait CPU L2 Cache shared by all cores.
> > +
> > + The driver register with the cpufreq notifier and find the right frequency
> > + based on the max frequency across all core and the range set in the device
> > + dts. If provided this scale also the regulator attached to the l2 cache.
> > +
> > source "drivers/devfreq/event/Kconfig"
> >
> > endif # PM_DEVFREQ
> > diff --git a/drivers/devfreq/Makefile b/drivers/devfreq/Makefile
> > index 3ca1ad0ecb97..bb87925a6a2d 100644
> > --- a/drivers/devfreq/Makefile
> > +++ b/drivers/devfreq/Makefile
> > @@ -14,6 +14,7 @@ obj-$(CONFIG_ARM_IMX8M_DDRC_DEVFREQ) += imx8m-ddrc.o
> > obj-$(CONFIG_ARM_RK3399_DMC_DEVFREQ) += rk3399_dmc.o
> > obj-$(CONFIG_ARM_TEGRA_DEVFREQ) += tegra30-devfreq.o
> > obj-$(CONFIG_ARM_TEGRA20_DEVFREQ) += tegra20-devfreq.o
> > +obj-$(CONFIG_ARM_KRAIT_CACHE_DEVFREQ) += krait-cache-devfreq.o
> >
> > # DEVFREQ Event Drivers
> > obj-$(CONFIG_PM_DEVFREQ_EVENT) += event/
> > diff --git a/drivers/devfreq/krait-cache-devfreq.c b/drivers/devfreq/krait-cache-devfreq.c
> > new file mode 100644
> > index 000000000000..101a13b6927a
> > --- /dev/null
> > +++ b/drivers/devfreq/krait-cache-devfreq.c
> > @@ -0,0 +1,301 @@
> > +// SPDX-License-Identifier: GPL-2.0
> > +
> > +#include <linux/kernel.h>
> > +#include <linux/init.h>
> > +#include <linux/module.h>
> > +#include <linux/cpufreq.h>
> > +#include <linux/devfreq.h>
> > +#include <linux/of.h>
> > +#include <linux/platform_device.h>
> > +#include <linux/clk.h>
> > +#include <linux/slab.h>
> > +#include <linux/regulator/consumer.h>
> > +#include <linux/pm_opp.h>
> > +
> > +#include "governor.h"
> > +
> > +struct krait_data {
> > + struct device *dev;
> > + struct devfreq *devfreq;
> > +
> > + struct clk *l2_clk;
> > +
> > + unsigned long *freq_table; /* L2 bus clock rate */
> > + unsigned int *l2_cpufreq; /* L2 target CPU frequency */
> > +
> > + struct notifier_block nb;
> > +};
> > +
> > +static int krait_cache_set_opp(struct dev_pm_set_opp_data *data)
> > +{
> > + unsigned long old_freq = data->old_opp.rate, freq = data->new_opp.rate;
> > + struct dev_pm_opp_supply *supply = &data->new_opp.supplies[0];
> > + struct regulator *reg = data->regulators[0];
> > + struct clk *clk = data->clk;
> > + struct krait_data *kdata;
> > + unsigned long idle_freq;
> > + int ret;
> > +
> > + kdata = (struct krait_data *)dev_get_drvdata(data->dev);
> > +
> > + idle_freq = kdata->freq_table[0];
> > +
> > + if (reg) {
> > + ret = regulator_set_voltage_triplet(reg, supply->u_volt_min,
> > + supply->u_volt,
> > + supply->u_volt_max);
> > + if (ret)
> > + goto exit;
> > + }
> > +
> > + /*
> > + * Set to idle bin if switching from normal to high bin
> > + * or vice versa. It has been notice that a bug is triggered
> > + * in cache scaling when more than one bin is scaled, to fix
> > + * this we first need to transition to the base rate and then
> > + * to target rate
> > + */
> > + if (likely(freq != idle_freq && old_freq != idle_freq)) {
> > + ret = clk_set_rate(clk, idle_freq);
> > + if (ret)
> > + goto exit;
> > + }
> > +
> > + ret = clk_set_rate(clk, freq);
> > + if (ret)
> > + goto exit;
> > +
> > +exit:
> > + return ret;
> > +};
> > +
> > +static int krait_cache_target(struct device *dev, unsigned long *freq,
> > + u32 flags)
> > +{
> > + return dev_pm_opp_set_rate(dev, *freq);
> > +};
> > +
> > +static int krait_cache_get_dev_status(struct device *dev,
> > + struct devfreq_dev_status *stat)
> > +{
> > + struct krait_data *data = dev_get_drvdata(dev);
> > +
> > + stat->busy_time = 0;
> > + stat->total_time = 0;
> > + stat->current_frequency = clk_get_rate(data->l2_clk);
> > +
> > + return 0;
> > +};
> > +
> > +static int krait_cache_get_cur_freq(struct device *dev, unsigned long *freq)
> > +{
> > + struct krait_data *data = dev_get_drvdata(dev);
> > +
> > + *freq = clk_get_rate(data->l2_clk);
> > +
> > + return 0;
> > +};
> > +
> > +static struct devfreq_dev_profile tegra_devfreq_profile = {
> > + .target = krait_cache_target,
> > + .get_dev_status = krait_cache_get_dev_status,
> > + .get_cur_freq = krait_cache_get_cur_freq
> > +};
> > +
> > +static int krait_cache_notifier(struct notifier_block *nb, unsigned long action,
> > + void *v)
> > +{
> > + struct cpufreq_freqs *freqs;
> > + unsigned int cpu, cur_cpu;
> > + struct krait_data *data;
> > + struct devfreq *devfreq;
> > + unsigned long freq;
> > + int ret = 0;
> > +
> > + if (action != CPUFREQ_POSTCHANGE)
> > + return NOTIFY_OK;
> > +
> > + data = container_of(nb, struct krait_data, nb);
> > + devfreq = data->devfreq;
> > +
> > + mutex_lock_nested(&devfreq->lock, SINGLE_DEPTH_NESTING);
> > +
> > + freqs = (struct cpufreq_freqs *)v;
> > + freq = freqs->new;
> > + cur_cpu = freqs->policy->cpu;
> > +
> > + /* find the max freq across all core */
> > + for_each_present_cpu(cpu)
> > + if (cpu != cur_cpu)
> > + freq = max(freq, (unsigned long)cpufreq_quick_get(cpu));
> > +
> > + devfreq->governor->get_target_freq(devfreq, &freq);
> > +
> > + if (devfreq->previous_freq == freq)
> > + goto out;
> > +
> > + ret = devfreq->profile->target(data->dev, &freq, 0);
> > + if (ret < 0)
> > + goto out;
> > +
> > + if (devfreq->profile->freq_table &&
> > + (devfreq_update_status(devfreq, freq)))
> > + dev_err(data->dev,
> > + "Couldn't update frequency transition information.\n");
> > +
> > + devfreq->previous_freq = freq;
> > +
> > +out:
> > + mutex_unlock(&devfreq->lock);
> > + return notifier_from_errno(ret);
> > +};
> > +
> > +static int krait_cache_governor_get_target(struct devfreq *devfreq,
> > + unsigned long *freq)
> > +{
> > + unsigned int *l2_cpufreq;
> > + unsigned long *freq_table;
> > + unsigned long target_freq = *freq;
> > + struct krait_data *data = dev_get_drvdata(devfreq->dev.parent);
> > +
> > + l2_cpufreq = data->l2_cpufreq;
> > + freq_table = data->freq_table;
> > +
> > + /*
> > + * Find the highest l2 freq interval based on the max cpufreq
> > + * across all core
> > + */
> > + while (*(l2_cpufreq = l2_cpufreq + 1) && target_freq >= *l2_cpufreq)
> > + freq_table = freq_table + 1;
> > +
> > + *freq = *freq_table;
> > +
> > + return 0;
> > +};
> > +
> > +static int krait_cache_governor_event_handler(struct devfreq *devfreq,
> > + unsigned int event, void *data)
> > +{
> > + struct krait_data *kdata = dev_get_drvdata(devfreq->dev.parent);
> > + int ret = 0;
> > +
> > + switch (event) {
> > + case DEVFREQ_GOV_START:
> > + kdata->nb.notifier_call = krait_cache_notifier;
> > + ret = cpufreq_register_notifier(&kdata->nb,
> > + CPUFREQ_TRANSITION_NOTIFIER);
> > + break;
> > +
> > + case DEVFREQ_GOV_STOP:
> > + cpufreq_unregister_notifier(&kdata->nb,
> > + CPUFREQ_TRANSITION_NOTIFIER);
> > + break;
> > + }
> > +
> > + return ret;
> > +};
> > +
> > +static struct devfreq_governor krait_devfreq_governor = {
> > + .name = "krait_governor",
> > + .get_target_freq = krait_cache_governor_get_target,
> > + .event_handler = krait_cache_governor_event_handler,
> > + .immutable = true,
> > +};
> > +
> > +static int krait_cache_probe(struct platform_device *pdev)
> > +{
> > + int ret, count;
> > + struct opp_table *table;
> > + struct krait_data *data;
> > + struct device *dev = &pdev->dev;
> > + struct device_node *node = dev->of_node;
> > +
> > + data = devm_kzalloc(dev, sizeof(*data), GFP_KERNEL);
> > + if (!data)
> > + return -ENOMEM;
> > +
> > + data->dev = dev;
> > +
> > + data->l2_clk = devm_clk_get(dev, "l2");
> > + if (IS_ERR(data->l2_clk))
> > + return PTR_ERR(data->l2_clk);
> > +
> > + table = dev_pm_opp_set_regulators(dev, (const char *[]){ "l2" }, 1);
> > + if (IS_ERR(table)) {
> > + ret = PTR_ERR(table);
> > + dev_err(dev, "failed to set regulators %d\n", ret);
> > + return ret;
> > + }
> > +
> > + ret = PTR_ERR_OR_ZERO(
> > + dev_pm_opp_register_set_opp_helper(dev, krait_cache_set_opp));
> > + if (ret)
> > + return ret;
> > +
> > + ret = dev_pm_opp_of_add_table(dev);
> > + if (ret) {
> > + dev_err(dev, "failed to parse L2 freq thresholds\n");
> > + return ret;
> > + }
> > +
> > + count = dev_pm_opp_get_opp_count(dev);
> > +
> > + data->l2_cpufreq =
> > + devm_kzalloc(dev, sizeof(unsigned int) * count, GFP_KERNEL);
> > + if (!data->l2_cpufreq)
> > + return -ENOMEM;
> > +
> > + ret = of_property_read_u32_array(node, "qcom,l2-cpufreq", data->l2_cpufreq,
> > + count);
> > + if (ret) {
> > + dev_err(dev, "failed to parse L2 cpufreq thresholds\n");
> > + return ret;
> > + }
> > +
> > + ret = devfreq_add_governor(&krait_devfreq_governor);
> > + if (ret) {
> > + dev_err(&pdev->dev, "Failed to add governor: %d\n", ret);
> > + return ret;
> > + }
> > +
> > + platform_set_drvdata(pdev, data);
> > +
> > + data->devfreq = devfreq_add_device(&pdev->dev, &tegra_devfreq_profile,
> > + "krait_governor", NULL);
> > +
> > + /* Cache freq_table to quickly get it when needed */
> > + data->freq_table = data->devfreq->profile->freq_table;
> > +
> > + if (IS_ERR(data->devfreq))
> > + return PTR_ERR(data->devfreq);
> > +
> > + return 0;
> > +};
> > +
> > +static int krait_cache_remove(struct platform_device *pdev)
> > +{
> > + struct krait_data *data = platform_get_drvdata(pdev);
> > +
> > + dev_pm_opp_remove_table(data->dev);
> > +
> > + return 0;
> > +};
> > +
> > +static const struct of_device_id krait_cache_match_table[] = {
> > + { .compatible = "qcom,krait-cache" },
> > + {}
> > +};
> > +
> > +static struct platform_driver krait_cache_driver = {
> > + .probe = krait_cache_probe,
> > + .remove = krait_cache_remove,
> > + .driver = {
> > + .name = "krait-cache-scaling",
> > + .of_match_table = krait_cache_match_table,
> > + },
> > +};
> > +module_platform_driver(krait_cache_driver);
> > +
> > +MODULE_DESCRIPTION("Krait CPU Cache Scaling driver");
> > +MODULE_AUTHOR("Ansuel Smith <ansuelsmth@xxxxxxxxx>");
> > +MODULE_LICENSE("GPL v2");
> >
>
>
> --
> Best Regards,
> Chanwoo Choi
> Samsung Electronics

--
Ansuel