Commit 4570ddda authored by Daniel Lezcano

powercap/drivers/dtpm: Encapsulate even more the code

In order to increase the self-encapsulation of the dtpm generic code,
the following changes add a power update op to the dtpm ops. That
allows the generic code to directly call the dtpm backend function to
update the power values.

The power update function computes the power characteristics when it
is invoked. In the case of the CPUs, the power consumption depends on
the number of online CPUs. The online CPUs mask is not up to date at
the CPUHP_AP_ONLINE_DYN state in the tear down callback. That is the
reason why the online and offline callbacks are registered at separate
states. As there is already an existing state for DTPM, it is simply
moved to the DEAD state, so no new state is added by these changes.
The dtpm node is not removed when the CPU is unplugged.

That simplifies the code for the next changes and results in more
self-encapsulated code.
Signed-off-by: Daniel Lezcano <daniel.lezcano@linaro.org>
Reviewed-by: Lukasz Luba <lukasz.luba@arm.com>
Link: https://lore.kernel.org/r/20210312130411.29833-1-daniel.lezcano@linaro.org
parent 6880fa6c
...@@ -116,8 +116,6 @@ static void __dtpm_sub_power(struct dtpm *dtpm) ...@@ -116,8 +116,6 @@ static void __dtpm_sub_power(struct dtpm *dtpm)
parent->power_limit -= dtpm->power_limit; parent->power_limit -= dtpm->power_limit;
parent = parent->parent; parent = parent->parent;
} }
__dtpm_rebalance_weight(root);
} }
static void __dtpm_add_power(struct dtpm *dtpm) static void __dtpm_add_power(struct dtpm *dtpm)
...@@ -130,45 +128,45 @@ static void __dtpm_add_power(struct dtpm *dtpm) ...@@ -130,45 +128,45 @@ static void __dtpm_add_power(struct dtpm *dtpm)
parent->power_limit += dtpm->power_limit; parent->power_limit += dtpm->power_limit;
parent = parent->parent; parent = parent->parent;
} }
}
static int __dtpm_update_power(struct dtpm *dtpm)
{
int ret;
__dtpm_sub_power(dtpm);
__dtpm_rebalance_weight(root); ret = dtpm->ops->update_power_uw(dtpm);
if (ret)
pr_err("Failed to update power for '%s': %d\n",
dtpm->zone.name, ret);
if (!test_bit(DTPM_POWER_LIMIT_FLAG, &dtpm->flags))
dtpm->power_limit = dtpm->power_max;
__dtpm_add_power(dtpm);
if (root)
__dtpm_rebalance_weight(root);
return ret;
} }
/** /**
* dtpm_update_power - Update the power on the dtpm * dtpm_update_power - Update the power on the dtpm
* @dtpm: a pointer to a dtpm structure to update * @dtpm: a pointer to a dtpm structure to update
* @power_min: a u64 representing the new power_min value
* @power_max: a u64 representing the new power_max value
* *
* Function to update the power values of the dtpm node specified in * Function to update the power values of the dtpm node specified in
* parameter. These new values will be propagated to the tree. * parameter. These new values will be propagated to the tree.
* *
* Return: zero on success, -EINVAL if the values are inconsistent * Return: zero on success, -EINVAL if the values are inconsistent
*/ */
int dtpm_update_power(struct dtpm *dtpm, u64 power_min, u64 power_max) int dtpm_update_power(struct dtpm *dtpm)
{ {
int ret = 0; int ret;
mutex_lock(&dtpm_lock); mutex_lock(&dtpm_lock);
ret = __dtpm_update_power(dtpm);
if (power_min == dtpm->power_min && power_max == dtpm->power_max)
goto unlock;
if (power_max < power_min) {
ret = -EINVAL;
goto unlock;
}
__dtpm_sub_power(dtpm);
dtpm->power_min = power_min;
dtpm->power_max = power_max;
if (!test_bit(DTPM_POWER_LIMIT_FLAG, &dtpm->flags))
dtpm->power_limit = power_max;
__dtpm_add_power(dtpm);
unlock:
mutex_unlock(&dtpm_lock); mutex_unlock(&dtpm_lock);
return ret; return ret;
...@@ -436,6 +434,7 @@ int dtpm_register(const char *name, struct dtpm *dtpm, struct dtpm *parent) ...@@ -436,6 +434,7 @@ int dtpm_register(const char *name, struct dtpm *dtpm, struct dtpm *parent)
if (dtpm->ops && !(dtpm->ops->set_power_uw && if (dtpm->ops && !(dtpm->ops->set_power_uw &&
dtpm->ops->get_power_uw && dtpm->ops->get_power_uw &&
dtpm->ops->update_power_uw &&
dtpm->ops->release)) dtpm->ops->release))
return -EINVAL; return -EINVAL;
...@@ -455,7 +454,8 @@ int dtpm_register(const char *name, struct dtpm *dtpm, struct dtpm *parent) ...@@ -455,7 +454,8 @@ int dtpm_register(const char *name, struct dtpm *dtpm, struct dtpm *parent)
root = dtpm; root = dtpm;
} }
__dtpm_add_power(dtpm); if (dtpm->ops && !dtpm->ops->update_power_uw(dtpm))
__dtpm_add_power(dtpm);
pr_info("Registered dtpm node '%s' / %llu-%llu uW, \n", pr_info("Registered dtpm node '%s' / %llu-%llu uW, \n",
dtpm->zone.name, dtpm->power_min, dtpm->power_max); dtpm->zone.name, dtpm->power_min, dtpm->power_max);
......
...@@ -14,6 +14,8 @@ ...@@ -14,6 +14,8 @@
* The CPU hotplug is supported and the power numbers will be updated * The CPU hotplug is supported and the power numbers will be updated
* if a CPU is hot plugged / unplugged. * if a CPU is hot plugged / unplugged.
*/ */
#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
#include <linux/cpumask.h> #include <linux/cpumask.h>
#include <linux/cpufreq.h> #include <linux/cpufreq.h>
#include <linux/cpuhotplug.h> #include <linux/cpuhotplug.h>
...@@ -23,8 +25,6 @@ ...@@ -23,8 +25,6 @@
#include <linux/slab.h> #include <linux/slab.h>
#include <linux/units.h> #include <linux/units.h>
static struct dtpm *__parent;
static DEFINE_PER_CPU(struct dtpm *, dtpm_per_cpu); static DEFINE_PER_CPU(struct dtpm *, dtpm_per_cpu);
struct dtpm_cpu { struct dtpm_cpu {
...@@ -32,57 +32,16 @@ struct dtpm_cpu { ...@@ -32,57 +32,16 @@ struct dtpm_cpu {
int cpu; int cpu;
}; };
/*
 * power_add - add one CPU's power contribution to a dtpm node
 * @dtpm: the dtpm node whose power range grows
 * @em: the energy model perf domain providing the per-state power values
 *
 * The power of the first and of the last performance state of @em is
 * scaled by MICROWATT_PER_MILLIWATT and added on top of the node's
 * current power_min / power_max. The resulting range is handed over to
 * dtpm_update_power().
 *
 * Return: the value returned by dtpm_update_power()
 */
static int power_add(struct dtpm *dtpm, struct em_perf_domain *em)
{
	u64 lowest = em->table[0].power;
	u64 highest = em->table[em->nr_perf_states - 1].power;

	lowest = lowest * MICROWATT_PER_MILLIWATT + dtpm->power_min;
	highest = highest * MICROWATT_PER_MILLIWATT + dtpm->power_max;

	return dtpm_update_power(dtpm, lowest, highest);
}
/*
 * power_sub - remove one CPU's power contribution from a dtpm node
 * @dtpm: the dtpm node whose power range shrinks
 * @em: the energy model perf domain providing the per-state power values
 *
 * The power of the first and of the last performance state of @em is
 * scaled by MICROWATT_PER_MILLIWATT and subtracted from the node's
 * current power_min / power_max. The resulting range is handed over to
 * dtpm_update_power().
 *
 * NOTE(review): the subtraction is done on unsigned values; this
 * presumably relies on the same contribution having been added before.
 *
 * Return: the value returned by dtpm_update_power()
 */
static int power_sub(struct dtpm *dtpm, struct em_perf_domain *em)
{
	u64 lowest = em->table[0].power;
	u64 highest = em->table[em->nr_perf_states - 1].power;

	lowest = dtpm->power_min - lowest * MICROWATT_PER_MILLIWATT;
	highest = dtpm->power_max - highest * MICROWATT_PER_MILLIWATT;

	return dtpm_update_power(dtpm, lowest, highest);
}
static u64 set_pd_power_limit(struct dtpm *dtpm, u64 power_limit) static u64 set_pd_power_limit(struct dtpm *dtpm, u64 power_limit)
{ {
struct dtpm_cpu *dtpm_cpu = dtpm->private; struct dtpm_cpu *dtpm_cpu = dtpm->private;
struct em_perf_domain *pd; struct em_perf_domain *pd = em_cpu_get(dtpm_cpu->cpu);
struct cpumask cpus; struct cpumask cpus;
unsigned long freq; unsigned long freq;
u64 power; u64 power;
int i, nr_cpus; int i, nr_cpus;
pd = em_cpu_get(dtpm_cpu->cpu);
cpumask_and(&cpus, cpu_online_mask, to_cpumask(pd->cpus)); cpumask_and(&cpus, cpu_online_mask, to_cpumask(pd->cpus));
nr_cpus = cpumask_weight(&cpus); nr_cpus = cpumask_weight(&cpus);
for (i = 0; i < pd->nr_perf_states; i++) { for (i = 0; i < pd->nr_perf_states; i++) {
...@@ -113,6 +72,7 @@ static u64 get_pd_power_uw(struct dtpm *dtpm) ...@@ -113,6 +72,7 @@ static u64 get_pd_power_uw(struct dtpm *dtpm)
pd = em_cpu_get(dtpm_cpu->cpu); pd = em_cpu_get(dtpm_cpu->cpu);
freq = cpufreq_quick_get(dtpm_cpu->cpu); freq = cpufreq_quick_get(dtpm_cpu->cpu);
cpumask_and(&cpus, cpu_online_mask, to_cpumask(pd->cpus)); cpumask_and(&cpus, cpu_online_mask, to_cpumask(pd->cpus));
nr_cpus = cpumask_weight(&cpus); nr_cpus = cpumask_weight(&cpus);
...@@ -128,6 +88,27 @@ static u64 get_pd_power_uw(struct dtpm *dtpm) ...@@ -128,6 +88,27 @@ static u64 get_pd_power_uw(struct dtpm *dtpm)
return 0; return 0;
} }
static int update_pd_power_uw(struct dtpm *dtpm)
{
struct dtpm_cpu *dtpm_cpu = dtpm->private;
struct em_perf_domain *em = em_cpu_get(dtpm_cpu->cpu);
struct cpumask cpus;
int nr_cpus;
cpumask_and(&cpus, cpu_online_mask, to_cpumask(em->cpus));
nr_cpus = cpumask_weight(&cpus);
dtpm->power_min = em->table[0].power;
dtpm->power_min *= MICROWATT_PER_MILLIWATT;
dtpm->power_min *= nr_cpus;
dtpm->power_max = em->table[em->nr_perf_states - 1].power;
dtpm->power_max *= MICROWATT_PER_MILLIWATT;
dtpm->power_max *= nr_cpus;
return 0;
}
static void pd_release(struct dtpm *dtpm) static void pd_release(struct dtpm *dtpm)
{ {
struct dtpm_cpu *dtpm_cpu = dtpm->private; struct dtpm_cpu *dtpm_cpu = dtpm->private;
...@@ -139,39 +120,24 @@ static void pd_release(struct dtpm *dtpm) ...@@ -139,39 +120,24 @@ static void pd_release(struct dtpm *dtpm)
} }
static struct dtpm_ops dtpm_ops = { static struct dtpm_ops dtpm_ops = {
.set_power_uw = set_pd_power_limit, .set_power_uw = set_pd_power_limit,
.get_power_uw = get_pd_power_uw, .get_power_uw = get_pd_power_uw,
.release = pd_release, .update_power_uw = update_pd_power_uw,
.release = pd_release,
}; };
static int cpuhp_dtpm_cpu_offline(unsigned int cpu) static int cpuhp_dtpm_cpu_offline(unsigned int cpu)
{ {
struct cpufreq_policy *policy;
struct em_perf_domain *pd; struct em_perf_domain *pd;
struct dtpm *dtpm; struct dtpm *dtpm;
policy = cpufreq_cpu_get(cpu);
if (!policy)
return 0;
pd = em_cpu_get(cpu); pd = em_cpu_get(cpu);
if (!pd) if (!pd)
return -EINVAL; return -EINVAL;
dtpm = per_cpu(dtpm_per_cpu, cpu); dtpm = per_cpu(dtpm_per_cpu, cpu);
power_sub(dtpm, pd); return dtpm_update_power(dtpm);
if (cpumask_weight(policy->cpus) != 1)
return 0;
for_each_cpu(cpu, policy->related_cpus)
per_cpu(dtpm_per_cpu, cpu) = NULL;
dtpm_unregister(dtpm);
return 0;
} }
static int cpuhp_dtpm_cpu_online(unsigned int cpu) static int cpuhp_dtpm_cpu_online(unsigned int cpu)
...@@ -184,7 +150,6 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu) ...@@ -184,7 +150,6 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu)
int ret = -ENOMEM; int ret = -ENOMEM;
policy = cpufreq_cpu_get(cpu); policy = cpufreq_cpu_get(cpu);
if (!policy) if (!policy)
return 0; return 0;
...@@ -194,7 +159,7 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu) ...@@ -194,7 +159,7 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu)
dtpm = per_cpu(dtpm_per_cpu, cpu); dtpm = per_cpu(dtpm_per_cpu, cpu);
if (dtpm) if (dtpm)
return power_add(dtpm, pd); return dtpm_update_power(dtpm);
dtpm = dtpm_alloc(&dtpm_ops); dtpm = dtpm_alloc(&dtpm_ops);
if (!dtpm) if (!dtpm)
...@@ -210,27 +175,20 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu) ...@@ -210,27 +175,20 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu)
for_each_cpu(cpu, policy->related_cpus) for_each_cpu(cpu, policy->related_cpus)
per_cpu(dtpm_per_cpu, cpu) = dtpm; per_cpu(dtpm_per_cpu, cpu) = dtpm;
sprintf(name, "cpu%d", dtpm_cpu->cpu); snprintf(name, sizeof(name), "cpu%d-cpufreq", dtpm_cpu->cpu);
ret = dtpm_register(name, dtpm, __parent); ret = dtpm_register(name, dtpm, NULL);
if (ret) if (ret)
goto out_kfree_dtpm_cpu; goto out_kfree_dtpm_cpu;
ret = power_add(dtpm, pd);
if (ret)
goto out_dtpm_unregister;
ret = freq_qos_add_request(&policy->constraints, ret = freq_qos_add_request(&policy->constraints,
&dtpm_cpu->qos_req, FREQ_QOS_MAX, &dtpm_cpu->qos_req, FREQ_QOS_MAX,
pd->table[pd->nr_perf_states - 1].frequency); pd->table[pd->nr_perf_states - 1].frequency);
if (ret) if (ret)
goto out_power_sub; goto out_dtpm_unregister;
return 0; return 0;
out_power_sub:
power_sub(dtpm, pd);
out_dtpm_unregister: out_dtpm_unregister:
dtpm_unregister(dtpm); dtpm_unregister(dtpm);
dtpm_cpu = NULL; dtpm_cpu = NULL;
...@@ -248,10 +206,38 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu) ...@@ -248,10 +206,38 @@ static int cpuhp_dtpm_cpu_online(unsigned int cpu)
int dtpm_register_cpu(struct dtpm *parent) int dtpm_register_cpu(struct dtpm *parent)
{ {
__parent = parent; int ret;
/*
* The callbacks at CPU hotplug time are calling
* dtpm_update_power() which in turn calls update_pd_power_uw().
*
* The function update_pd_power_uw() uses the online mask to
* figure out the power consumption limits.
*
* At CPUHP_AP_ONLINE_DYN, the CPU is present in the CPU
* online mask when the cpuhp_dtpm_cpu_online function is
* called, but the CPU is still in the online mask for the
* tear down callback. So the power can not be updated when
* the CPU is unplugged.
*
* At CPUHP_AP_DTPM_CPU_DEAD, the situation is the opposite as
* above. The CPU online mask is not up to date when the CPU
* is plugged in.
*
* For this reason, we need to call the online and offline
* callbacks at different moments when the CPU online mask is
* consistent with the power numbers we want to update.
*/
ret = cpuhp_setup_state(CPUHP_AP_DTPM_CPU_DEAD, "dtpm_cpu:offline",
NULL, cpuhp_dtpm_cpu_offline);
if (ret < 0)
return ret;
ret = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "dtpm_cpu:online",
cpuhp_dtpm_cpu_online, NULL);
if (ret < 0)
return ret;
return cpuhp_setup_state(CPUHP_AP_DTPM_CPU_ONLINE, return 0;
"dtpm_cpu:online",
cpuhp_dtpm_cpu_online,
cpuhp_dtpm_cpu_offline);
} }
...@@ -97,6 +97,7 @@ enum cpuhp_state { ...@@ -97,6 +97,7 @@ enum cpuhp_state {
CPUHP_LUSTRE_CFS_DEAD, CPUHP_LUSTRE_CFS_DEAD,
CPUHP_AP_ARM_CACHE_B15_RAC_DEAD, CPUHP_AP_ARM_CACHE_B15_RAC_DEAD,
CPUHP_PADATA_DEAD, CPUHP_PADATA_DEAD,
CPUHP_AP_DTPM_CPU_DEAD,
CPUHP_WORKQUEUE_PREP, CPUHP_WORKQUEUE_PREP,
CPUHP_POWER_NUMA_PREPARE, CPUHP_POWER_NUMA_PREPARE,
CPUHP_HRTIMERS_PREPARE, CPUHP_HRTIMERS_PREPARE,
...@@ -242,7 +243,6 @@ enum cpuhp_state { ...@@ -242,7 +243,6 @@ enum cpuhp_state {
CPUHP_AP_ONLINE_DYN_END = CPUHP_AP_ONLINE_DYN + 30, CPUHP_AP_ONLINE_DYN_END = CPUHP_AP_ONLINE_DYN + 30,
CPUHP_AP_X86_HPET_ONLINE, CPUHP_AP_X86_HPET_ONLINE,
CPUHP_AP_X86_KVM_CLK_ONLINE, CPUHP_AP_X86_KVM_CLK_ONLINE,
CPUHP_AP_DTPM_CPU_ONLINE,
CPUHP_AP_ACTIVE, CPUHP_AP_ACTIVE,
CPUHP_ONLINE, CPUHP_ONLINE,
}; };
......
...@@ -29,6 +29,7 @@ struct dtpm { ...@@ -29,6 +29,7 @@ struct dtpm {
struct dtpm_ops { struct dtpm_ops {
u64 (*set_power_uw)(struct dtpm *, u64); u64 (*set_power_uw)(struct dtpm *, u64);
u64 (*get_power_uw)(struct dtpm *); u64 (*get_power_uw)(struct dtpm *);
int (*update_power_uw)(struct dtpm *);
void (*release)(struct dtpm *); void (*release)(struct dtpm *);
}; };
...@@ -62,7 +63,7 @@ static inline struct dtpm *to_dtpm(struct powercap_zone *zone) ...@@ -62,7 +63,7 @@ static inline struct dtpm *to_dtpm(struct powercap_zone *zone)
return container_of(zone, struct dtpm, zone); return container_of(zone, struct dtpm, zone);
} }
int dtpm_update_power(struct dtpm *dtpm, u64 power_min, u64 power_max); int dtpm_update_power(struct dtpm *dtpm);
int dtpm_release_zone(struct powercap_zone *pcz); int dtpm_release_zone(struct powercap_zone *pcz);
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment