提交 521b512b 编写于 作者: L Lukasz Luba 提交者: Rafael J. Wysocki

PM / EM: change naming convention from 'capacity' to 'performance'

The Energy Model uses concept of performance domain and capacity states in
order to calculate power used by CPUs. Change naming convention from
capacity to performance state would enable wider usage in future, e.g.
upcoming support for other devices other than CPUs.
Acked-by: NDaniel Lezcano <daniel.lezcano@linaro.org>
Acked-by: NQuentin Perret <qperret@google.com>
Signed-off-by: NLukasz Luba <lukasz.luba@arm.com>
Signed-off-by: NRafael J. Wysocki <rafael.j.wysocki@intel.com>
上级 48778464
...@@ -333,18 +333,18 @@ static inline bool em_is_sane(struct cpufreq_cooling_device *cpufreq_cdev, ...@@ -333,18 +333,18 @@ static inline bool em_is_sane(struct cpufreq_cooling_device *cpufreq_cdev,
return false; return false;
policy = cpufreq_cdev->policy; policy = cpufreq_cdev->policy;
if (!cpumask_equal(policy->related_cpus, to_cpumask(em->cpus))) { if (!cpumask_equal(policy->related_cpus, em_span_cpus(em))) {
pr_err("The span of pd %*pbl is misaligned with cpufreq policy %*pbl\n", pr_err("The span of pd %*pbl is misaligned with cpufreq policy %*pbl\n",
cpumask_pr_args(to_cpumask(em->cpus)), cpumask_pr_args(em_span_cpus(em)),
cpumask_pr_args(policy->related_cpus)); cpumask_pr_args(policy->related_cpus));
return false; return false;
} }
nr_levels = cpufreq_cdev->max_level + 1; nr_levels = cpufreq_cdev->max_level + 1;
if (em->nr_cap_states != nr_levels) { if (em_pd_nr_perf_states(em) != nr_levels) {
pr_err("The number of cap states in pd %*pbl (%u) doesn't match the number of cooling levels (%u)\n", pr_err("The number of performance states in pd %*pbl (%u) doesn't match the number of cooling levels (%u)\n",
cpumask_pr_args(to_cpumask(em->cpus)), cpumask_pr_args(em_span_cpus(em)),
em->nr_cap_states, nr_levels); em_pd_nr_perf_states(em), nr_levels);
return false; return false;
} }
......
...@@ -10,13 +10,13 @@ ...@@ -10,13 +10,13 @@
#include <linux/types.h> #include <linux/types.h>
/** /**
* em_cap_state - Capacity state of a performance domain * em_perf_state - Performance state of a performance domain
* @frequency: The CPU frequency in KHz, for consistency with CPUFreq * @frequency: The CPU frequency in KHz, for consistency with CPUFreq
* @power: The power consumed by 1 CPU at this level, in milli-watts * @power: The power consumed by 1 CPU at this level, in milli-watts
* @cost: The cost coefficient associated with this level, used during * @cost: The cost coefficient associated with this level, used during
* energy calculation. Equal to: power * max_frequency / frequency * energy calculation. Equal to: power * max_frequency / frequency
*/ */
struct em_cap_state { struct em_perf_state {
unsigned long frequency; unsigned long frequency;
unsigned long power; unsigned long power;
unsigned long cost; unsigned long cost;
...@@ -24,8 +24,8 @@ struct em_cap_state { ...@@ -24,8 +24,8 @@ struct em_cap_state {
/** /**
* em_perf_domain - Performance domain * em_perf_domain - Performance domain
* @table: List of capacity states, in ascending order * @table: List of performance states, in ascending order
* @nr_cap_states: Number of capacity states * @nr_perf_states: Number of performance states
* @cpus: Cpumask covering the CPUs of the domain * @cpus: Cpumask covering the CPUs of the domain
* *
* A "performance domain" represents a group of CPUs whose performance is * A "performance domain" represents a group of CPUs whose performance is
...@@ -34,22 +34,27 @@ struct em_cap_state { ...@@ -34,22 +34,27 @@ struct em_cap_state {
* CPUFreq policies. * CPUFreq policies.
*/ */
struct em_perf_domain { struct em_perf_domain {
struct em_cap_state *table; struct em_perf_state *table;
int nr_cap_states; int nr_perf_states;
unsigned long cpus[]; unsigned long cpus[];
}; };
#define em_span_cpus(em) (to_cpumask((em)->cpus))
#ifdef CONFIG_ENERGY_MODEL #ifdef CONFIG_ENERGY_MODEL
#define EM_CPU_MAX_POWER 0xFFFF #define EM_CPU_MAX_POWER 0xFFFF
struct em_data_callback { struct em_data_callback {
/** /**
* active_power() - Provide power at the next capacity state of a CPU * active_power() - Provide power at the next performance state of
* @power : Active power at the capacity state in mW (modified) * a CPU
* @freq : Frequency at the capacity state in kHz (modified) * @power : Active power at the performance state in mW
* (modified)
* @freq : Frequency at the performance state in kHz
* (modified)
* @cpu : CPU for which we do this operation * @cpu : CPU for which we do this operation
* *
* active_power() must find the lowest capacity state of 'cpu' above * active_power() must find the lowest performance state of 'cpu' above
* 'freq' and update 'power' and 'freq' to the matching active power * 'freq' and update 'power' and 'freq' to the matching active power
* and frequency. * and frequency.
* *
...@@ -80,46 +85,46 @@ static inline unsigned long em_pd_energy(struct em_perf_domain *pd, ...@@ -80,46 +85,46 @@ static inline unsigned long em_pd_energy(struct em_perf_domain *pd,
unsigned long max_util, unsigned long sum_util) unsigned long max_util, unsigned long sum_util)
{ {
unsigned long freq, scale_cpu; unsigned long freq, scale_cpu;
struct em_cap_state *cs; struct em_perf_state *ps;
int i, cpu; int i, cpu;
/* /*
* In order to predict the capacity state, map the utilization of the * In order to predict the performance state, map the utilization of
* most utilized CPU of the performance domain to a requested frequency, * the most utilized CPU of the performance domain to a requested
* like schedutil. * frequency, like schedutil.
*/ */
cpu = cpumask_first(to_cpumask(pd->cpus)); cpu = cpumask_first(to_cpumask(pd->cpus));
scale_cpu = arch_scale_cpu_capacity(cpu); scale_cpu = arch_scale_cpu_capacity(cpu);
cs = &pd->table[pd->nr_cap_states - 1]; ps = &pd->table[pd->nr_perf_states - 1];
freq = map_util_freq(max_util, cs->frequency, scale_cpu); freq = map_util_freq(max_util, ps->frequency, scale_cpu);
/* /*
* Find the lowest capacity state of the Energy Model above the * Find the lowest performance state of the Energy Model above the
* requested frequency. * requested frequency.
*/ */
for (i = 0; i < pd->nr_cap_states; i++) { for (i = 0; i < pd->nr_perf_states; i++) {
cs = &pd->table[i]; ps = &pd->table[i];
if (cs->frequency >= freq) if (ps->frequency >= freq)
break; break;
} }
/* /*
* The capacity of a CPU in the domain at that capacity state (cs) * The capacity of a CPU in the domain at the performance state (ps)
* can be computed as: * can be computed as:
* *
* cs->freq * scale_cpu * ps->freq * scale_cpu
* cs->cap = -------------------- (1) * ps->cap = -------------------- (1)
* cpu_max_freq * cpu_max_freq
* *
* So, ignoring the costs of idle states (which are not available in * So, ignoring the costs of idle states (which are not available in
* the EM), the energy consumed by this CPU at that capacity state is * the EM), the energy consumed by this CPU at that performance state
* estimated as: * is estimated as:
* *
* cs->power * cpu_util * ps->power * cpu_util
* cpu_nrg = -------------------- (2) * cpu_nrg = -------------------- (2)
* cs->cap * ps->cap
* *
* since 'cpu_util / cs->cap' represents its percentage of busy time. * since 'cpu_util / ps->cap' represents its percentage of busy time.
* *
* NOTE: Although the result of this computation actually is in * NOTE: Although the result of this computation actually is in
* units of power, it can be manipulated as an energy value * units of power, it can be manipulated as an energy value
...@@ -129,34 +134,35 @@ static inline unsigned long em_pd_energy(struct em_perf_domain *pd, ...@@ -129,34 +134,35 @@ static inline unsigned long em_pd_energy(struct em_perf_domain *pd,
* By injecting (1) in (2), 'cpu_nrg' can be re-expressed as a product * By injecting (1) in (2), 'cpu_nrg' can be re-expressed as a product
* of two terms: * of two terms:
* *
* cs->power * cpu_max_freq cpu_util * ps->power * cpu_max_freq cpu_util
* cpu_nrg = ------------------------ * --------- (3) * cpu_nrg = ------------------------ * --------- (3)
* cs->freq scale_cpu * ps->freq scale_cpu
* *
* The first term is static, and is stored in the em_cap_state struct * The first term is static, and is stored in the em_perf_state struct
* as 'cs->cost'. * as 'ps->cost'.
* *
* Since all CPUs of the domain have the same micro-architecture, they * Since all CPUs of the domain have the same micro-architecture, they
* share the same 'cs->cost', and the same CPU capacity. Hence, the * share the same 'ps->cost', and the same CPU capacity. Hence, the
* total energy of the domain (which is the simple sum of the energy of * total energy of the domain (which is the simple sum of the energy of
* all of its CPUs) can be factorized as: * all of its CPUs) can be factorized as:
* *
* cs->cost * \Sum cpu_util * ps->cost * \Sum cpu_util
* pd_nrg = ------------------------ (4) * pd_nrg = ------------------------ (4)
* scale_cpu * scale_cpu
*/ */
return cs->cost * sum_util / scale_cpu; return ps->cost * sum_util / scale_cpu;
} }
/** /**
* em_pd_nr_cap_states() - Get the number of capacity states of a perf. domain * em_pd_nr_perf_states() - Get the number of performance states of a perf.
* domain
* @pd : performance domain for which this must be done * @pd : performance domain for which this must be done
* *
* Return: the number of capacity states in the performance domain table * Return: the number of performance states in the performance domain table
*/ */
static inline int em_pd_nr_cap_states(struct em_perf_domain *pd) static inline int em_pd_nr_perf_states(struct em_perf_domain *pd)
{ {
return pd->nr_cap_states; return pd->nr_perf_states;
} }
#else #else
...@@ -177,7 +183,7 @@ static inline unsigned long em_pd_energy(struct em_perf_domain *pd, ...@@ -177,7 +183,7 @@ static inline unsigned long em_pd_energy(struct em_perf_domain *pd,
{ {
return 0; return 0;
} }
static inline int em_pd_nr_cap_states(struct em_perf_domain *pd) static inline int em_pd_nr_perf_states(struct em_perf_domain *pd)
{ {
return 0; return 0;
} }
......
...@@ -27,18 +27,18 @@ static DEFINE_MUTEX(em_pd_mutex); ...@@ -27,18 +27,18 @@ static DEFINE_MUTEX(em_pd_mutex);
#ifdef CONFIG_DEBUG_FS #ifdef CONFIG_DEBUG_FS
static struct dentry *rootdir; static struct dentry *rootdir;
static void em_debug_create_cs(struct em_cap_state *cs, struct dentry *pd) static void em_debug_create_ps(struct em_perf_state *ps, struct dentry *pd)
{ {
struct dentry *d; struct dentry *d;
char name[24]; char name[24];
snprintf(name, sizeof(name), "cs:%lu", cs->frequency); snprintf(name, sizeof(name), "ps:%lu", ps->frequency);
/* Create per-cs directory */ /* Create per-ps directory */
d = debugfs_create_dir(name, pd); d = debugfs_create_dir(name, pd);
debugfs_create_ulong("frequency", 0444, d, &cs->frequency); debugfs_create_ulong("frequency", 0444, d, &ps->frequency);
debugfs_create_ulong("power", 0444, d, &cs->power); debugfs_create_ulong("power", 0444, d, &ps->power);
debugfs_create_ulong("cost", 0444, d, &cs->cost); debugfs_create_ulong("cost", 0444, d, &ps->cost);
} }
static int em_debug_cpus_show(struct seq_file *s, void *unused) static int em_debug_cpus_show(struct seq_file *s, void *unused)
...@@ -62,9 +62,9 @@ static void em_debug_create_pd(struct em_perf_domain *pd, int cpu) ...@@ -62,9 +62,9 @@ static void em_debug_create_pd(struct em_perf_domain *pd, int cpu)
debugfs_create_file("cpus", 0444, d, pd->cpus, &em_debug_cpus_fops); debugfs_create_file("cpus", 0444, d, pd->cpus, &em_debug_cpus_fops);
/* Create a sub-directory for each capacity state */ /* Create a sub-directory for each performance state */
for (i = 0; i < pd->nr_cap_states; i++) for (i = 0; i < pd->nr_perf_states; i++)
em_debug_create_cs(&pd->table[i], d); em_debug_create_ps(&pd->table[i], d);
} }
static int __init em_debug_init(void) static int __init em_debug_init(void)
...@@ -84,7 +84,7 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states, ...@@ -84,7 +84,7 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states,
unsigned long opp_eff, prev_opp_eff = ULONG_MAX; unsigned long opp_eff, prev_opp_eff = ULONG_MAX;
unsigned long power, freq, prev_freq = 0; unsigned long power, freq, prev_freq = 0;
int i, ret, cpu = cpumask_first(span); int i, ret, cpu = cpumask_first(span);
struct em_cap_state *table; struct em_perf_state *table;
struct em_perf_domain *pd; struct em_perf_domain *pd;
u64 fmax; u64 fmax;
...@@ -99,26 +99,26 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states, ...@@ -99,26 +99,26 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states,
if (!table) if (!table)
goto free_pd; goto free_pd;
/* Build the list of capacity states for this performance domain */ /* Build the list of performance states for this performance domain */
for (i = 0, freq = 0; i < nr_states; i++, freq++) { for (i = 0, freq = 0; i < nr_states; i++, freq++) {
/* /*
* active_power() is a driver callback which ceils 'freq' to * active_power() is a driver callback which ceils 'freq' to
* lowest capacity state of 'cpu' above 'freq' and updates * lowest performance state of 'cpu' above 'freq' and updates
* 'power' and 'freq' accordingly. * 'power' and 'freq' accordingly.
*/ */
ret = cb->active_power(&power, &freq, cpu); ret = cb->active_power(&power, &freq, cpu);
if (ret) { if (ret) {
pr_err("pd%d: invalid cap. state: %d\n", cpu, ret); pr_err("pd%d: invalid perf. state: %d\n", cpu, ret);
goto free_cs_table; goto free_ps_table;
} }
/* /*
* We expect the driver callback to increase the frequency for * We expect the driver callback to increase the frequency for
* higher capacity states. * higher performance states.
*/ */
if (freq <= prev_freq) { if (freq <= prev_freq) {
pr_err("pd%d: non-increasing freq: %lu\n", cpu, freq); pr_err("pd%d: non-increasing freq: %lu\n", cpu, freq);
goto free_cs_table; goto free_ps_table;
} }
/* /*
...@@ -127,7 +127,7 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states, ...@@ -127,7 +127,7 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states,
*/ */
if (!power || power > EM_CPU_MAX_POWER) { if (!power || power > EM_CPU_MAX_POWER) {
pr_err("pd%d: invalid power: %lu\n", cpu, power); pr_err("pd%d: invalid power: %lu\n", cpu, power);
goto free_cs_table; goto free_ps_table;
} }
table[i].power = power; table[i].power = power;
...@@ -141,12 +141,12 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states, ...@@ -141,12 +141,12 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states,
*/ */
opp_eff = freq / power; opp_eff = freq / power;
if (opp_eff >= prev_opp_eff) if (opp_eff >= prev_opp_eff)
pr_warn("pd%d: hertz/watts ratio non-monotonically decreasing: em_cap_state %d >= em_cap_state%d\n", pr_warn("pd%d: hertz/watts ratio non-monotonically decreasing: em_perf_state %d >= em_perf_state%d\n",
cpu, i, i - 1); cpu, i, i - 1);
prev_opp_eff = opp_eff; prev_opp_eff = opp_eff;
} }
/* Compute the cost of each capacity_state. */ /* Compute the cost of each performance state. */
fmax = (u64) table[nr_states - 1].frequency; fmax = (u64) table[nr_states - 1].frequency;
for (i = 0; i < nr_states; i++) { for (i = 0; i < nr_states; i++) {
table[i].cost = div64_u64(fmax * table[i].power, table[i].cost = div64_u64(fmax * table[i].power,
...@@ -154,14 +154,14 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states, ...@@ -154,14 +154,14 @@ static struct em_perf_domain *em_create_pd(cpumask_t *span, int nr_states,
} }
pd->table = table; pd->table = table;
pd->nr_cap_states = nr_states; pd->nr_perf_states = nr_states;
cpumask_copy(to_cpumask(pd->cpus), span); cpumask_copy(to_cpumask(pd->cpus), span);
em_debug_create_pd(pd, cpu); em_debug_create_pd(pd, cpu);
return pd; return pd;
free_cs_table: free_ps_table:
kfree(table); kfree(table);
free_pd: free_pd:
kfree(pd); kfree(pd);
...@@ -185,7 +185,7 @@ EXPORT_SYMBOL_GPL(em_cpu_get); ...@@ -185,7 +185,7 @@ EXPORT_SYMBOL_GPL(em_cpu_get);
/** /**
* em_register_perf_domain() - Register the Energy Model of a performance domain * em_register_perf_domain() - Register the Energy Model of a performance domain
* @span : Mask of CPUs in the performance domain * @span : Mask of CPUs in the performance domain
* @nr_states : Number of capacity states to register * @nr_states : Number of performance states to register
* @cb : Callback functions providing the data of the Energy Model * @cb : Callback functions providing the data of the Energy Model
* *
* Create Energy Model tables for a performance domain using the callbacks * Create Energy Model tables for a performance domain using the callbacks
......
...@@ -272,10 +272,10 @@ static void perf_domain_debug(const struct cpumask *cpu_map, ...@@ -272,10 +272,10 @@ static void perf_domain_debug(const struct cpumask *cpu_map,
printk(KERN_DEBUG "root_domain %*pbl:", cpumask_pr_args(cpu_map)); printk(KERN_DEBUG "root_domain %*pbl:", cpumask_pr_args(cpu_map));
while (pd) { while (pd) {
printk(KERN_CONT " pd%d:{ cpus=%*pbl nr_cstate=%d }", printk(KERN_CONT " pd%d:{ cpus=%*pbl nr_pstate=%d }",
cpumask_first(perf_domain_span(pd)), cpumask_first(perf_domain_span(pd)),
cpumask_pr_args(perf_domain_span(pd)), cpumask_pr_args(perf_domain_span(pd)),
em_pd_nr_cap_states(pd->em_pd)); em_pd_nr_perf_states(pd->em_pd));
pd = pd->next; pd = pd->next;
} }
...@@ -313,26 +313,26 @@ static void sched_energy_set(bool has_eas) ...@@ -313,26 +313,26 @@ static void sched_energy_set(bool has_eas)
* *
* The complexity of the Energy Model is defined as: * The complexity of the Energy Model is defined as:
* *
* C = nr_pd * (nr_cpus + nr_cs) * C = nr_pd * (nr_cpus + nr_ps)
* *
* with parameters defined as: * with parameters defined as:
* - nr_pd: the number of performance domains * - nr_pd: the number of performance domains
* - nr_cpus: the number of CPUs * - nr_cpus: the number of CPUs
* - nr_cs: the sum of the number of capacity states of all performance * - nr_ps: the sum of the number of performance states of all performance
* domains (for example, on a system with 2 performance domains, * domains (for example, on a system with 2 performance domains,
* with 10 capacity states each, nr_cs = 2 * 10 = 20). * with 10 performance states each, nr_ps = 2 * 10 = 20).
* *
* It is generally not a good idea to use such a model in the wake-up path on * It is generally not a good idea to use such a model in the wake-up path on
* very complex platforms because of the associated scheduling overheads. The * very complex platforms because of the associated scheduling overheads. The
* arbitrary constraint below prevents that. It makes EAS usable up to 16 CPUs * arbitrary constraint below prevents that. It makes EAS usable up to 16 CPUs
* with per-CPU DVFS and less than 8 capacity states each, for example. * with per-CPU DVFS and less than 8 performance states each, for example.
*/ */
#define EM_MAX_COMPLEXITY 2048 #define EM_MAX_COMPLEXITY 2048
extern struct cpufreq_governor schedutil_gov; extern struct cpufreq_governor schedutil_gov;
static bool build_perf_domains(const struct cpumask *cpu_map) static bool build_perf_domains(const struct cpumask *cpu_map)
{ {
int i, nr_pd = 0, nr_cs = 0, nr_cpus = cpumask_weight(cpu_map); int i, nr_pd = 0, nr_ps = 0, nr_cpus = cpumask_weight(cpu_map);
struct perf_domain *pd = NULL, *tmp; struct perf_domain *pd = NULL, *tmp;
int cpu = cpumask_first(cpu_map); int cpu = cpumask_first(cpu_map);
struct root_domain *rd = cpu_rq(cpu)->rd; struct root_domain *rd = cpu_rq(cpu)->rd;
...@@ -384,15 +384,15 @@ static bool build_perf_domains(const struct cpumask *cpu_map) ...@@ -384,15 +384,15 @@ static bool build_perf_domains(const struct cpumask *cpu_map)
pd = tmp; pd = tmp;
/* /*
* Count performance domains and capacity states for the * Count performance domains and performance states for the
* complexity check. * complexity check.
*/ */
nr_pd++; nr_pd++;
nr_cs += em_pd_nr_cap_states(pd->em_pd); nr_ps += em_pd_nr_perf_states(pd->em_pd);
} }
/* Bail out if the Energy Model complexity is too high. */ /* Bail out if the Energy Model complexity is too high. */
if (nr_pd * (nr_cs + nr_cpus) > EM_MAX_COMPLEXITY) { if (nr_pd * (nr_ps + nr_cpus) > EM_MAX_COMPLEXITY) {
WARN(1, "rd %*pbl: Failed to start EAS, EM complexity is too high\n", WARN(1, "rd %*pbl: Failed to start EAS, EM complexity is too high\n",
cpumask_pr_args(cpu_map)); cpumask_pr_args(cpu_map));
goto free; goto free;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册