1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
18
19#include <linux/export.h>
20#include <linux/kernel_stat.h>
21#include <linux/slab.h>
22
23#include "cpufreq_governor.h"
24
25#define CPUFREQ_DBS_MIN_SAMPLING_INTERVAL (2 * TICK_NSEC / NSEC_PER_USEC)
26
27static DEFINE_PER_CPU(struct cpu_dbs_info, cpu_dbs);
28
29static DEFINE_MUTEX(gov_dbs_data_mutex);
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47ssize_t store_sampling_rate(struct gov_attr_set *attr_set, const char *buf,
48 size_t count)
49{
50 struct dbs_data *dbs_data = to_dbs_data(attr_set);
51 struct policy_dbs_info *policy_dbs;
52 unsigned int sampling_interval;
53 int ret;
54
55 ret = sscanf(buf, "%u", &sampling_interval);
56 if (ret != 1 || sampling_interval < CPUFREQ_DBS_MIN_SAMPLING_INTERVAL)
57 return -EINVAL;
58
59 dbs_data->sampling_rate = sampling_interval;
60
61
62
63
64
65 list_for_each_entry(policy_dbs, &attr_set->policy_list, list) {
66 mutex_lock(&policy_dbs->update_mutex);
67
68
69
70
71
72
73
74
75
76
77
78
79
80 gov_update_sample_delay(policy_dbs, 0);
81 mutex_unlock(&policy_dbs->update_mutex);
82 }
83
84 return count;
85}
86EXPORT_SYMBOL_GPL(store_sampling_rate);
87
88
89
90
91
92
93
94
95
96
97
98void gov_update_cpu_data(struct dbs_data *dbs_data)
99{
100 struct policy_dbs_info *policy_dbs;
101
102 list_for_each_entry(policy_dbs, &dbs_data->attr_set.policy_list, list) {
103 unsigned int j;
104
105 for_each_cpu(j, policy_dbs->policy->cpus) {
106 struct cpu_dbs_info *j_cdbs = &per_cpu(cpu_dbs, j);
107
108 j_cdbs->prev_cpu_idle = get_cpu_idle_time(j, &j_cdbs->prev_update_time,
109 dbs_data->io_is_busy);
110 if (dbs_data->ignore_nice_load)
111 j_cdbs->prev_cpu_nice = kcpustat_cpu(j).cpustat[CPUTIME_NICE];
112 }
113 }
114}
115EXPORT_SYMBOL_GPL(gov_update_cpu_data);
116
117unsigned int dbs_update(struct cpufreq_policy *policy)
118{
119 struct policy_dbs_info *policy_dbs = policy->governor_data;
120 struct dbs_data *dbs_data = policy_dbs->dbs_data;
121 unsigned int ignore_nice = dbs_data->ignore_nice_load;
122 unsigned int max_load = 0, idle_periods = UINT_MAX;
123 unsigned int sampling_rate, io_busy, j;
124
125
126
127
128
129
130
131 sampling_rate = dbs_data->sampling_rate * policy_dbs->rate_mult;
132
133
134
135
136
137 io_busy = dbs_data->io_is_busy;
138
139
140 for_each_cpu(j, policy->cpus) {
141 struct cpu_dbs_info *j_cdbs = &per_cpu(cpu_dbs, j);
142 u64 update_time, cur_idle_time;
143 unsigned int idle_time, time_elapsed;
144 unsigned int load;
145
146 cur_idle_time = get_cpu_idle_time(j, &update_time, io_busy);
147
148 time_elapsed = update_time - j_cdbs->prev_update_time;
149 j_cdbs->prev_update_time = update_time;
150
151 idle_time = cur_idle_time - j_cdbs->prev_cpu_idle;
152 j_cdbs->prev_cpu_idle = cur_idle_time;
153
154 if (ignore_nice) {
155 u64 cur_nice = kcpustat_cpu(j).cpustat[CPUTIME_NICE];
156
157 idle_time += div_u64(cur_nice - j_cdbs->prev_cpu_nice, NSEC_PER_USEC);
158 j_cdbs->prev_cpu_nice = cur_nice;
159 }
160
161 if (unlikely(!time_elapsed)) {
162
163
164
165
166
167 load = j_cdbs->prev_load;
168 } else if (unlikely((int)idle_time > 2 * sampling_rate &&
169 j_cdbs->prev_load)) {
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192 load = j_cdbs->prev_load;
193 j_cdbs->prev_load = 0;
194 } else {
195 if (time_elapsed >= idle_time) {
196 load = 100 * (time_elapsed - idle_time) / time_elapsed;
197 } else {
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213 load = (int)idle_time < 0 ? 100 : 0;
214 }
215 j_cdbs->prev_load = load;
216 }
217
218 if (unlikely((int)idle_time > 2 * sampling_rate)) {
219 unsigned int periods = idle_time / sampling_rate;
220
221 if (periods < idle_periods)
222 idle_periods = periods;
223 }
224
225 if (load > max_load)
226 max_load = load;
227 }
228
229 policy_dbs->idle_periods = idle_periods;
230
231 return max_load;
232}
233EXPORT_SYMBOL_GPL(dbs_update);
234
235static void dbs_work_handler(struct work_struct *work)
236{
237 struct policy_dbs_info *policy_dbs;
238 struct cpufreq_policy *policy;
239 struct dbs_governor *gov;
240
241 policy_dbs = container_of(work, struct policy_dbs_info, work);
242 policy = policy_dbs->policy;
243 gov = dbs_governor_of(policy);
244
245
246
247
248
249 mutex_lock(&policy_dbs->update_mutex);
250 gov_update_sample_delay(policy_dbs, gov->gov_dbs_update(policy));
251 mutex_unlock(&policy_dbs->update_mutex);
252
253
254 atomic_set(&policy_dbs->work_count, 0);
255
256
257
258
259
260 smp_wmb();
261 policy_dbs->work_in_progress = false;
262}
263
264static void dbs_irq_work(struct irq_work *irq_work)
265{
266 struct policy_dbs_info *policy_dbs;
267
268 policy_dbs = container_of(irq_work, struct policy_dbs_info, irq_work);
269 schedule_work_on(smp_processor_id(), &policy_dbs->work);
270}
271
272static void dbs_update_util_handler(struct update_util_data *data, u64 time,
273 unsigned int flags)
274{
275 struct cpu_dbs_info *cdbs = container_of(data, struct cpu_dbs_info, update_util);
276 struct policy_dbs_info *policy_dbs = cdbs->policy_dbs;
277 u64 delta_ns, lst;
278
279 if (!cpufreq_this_cpu_can_update(policy_dbs->policy))
280 return;
281
282
283
284
285
286
287
288 if (policy_dbs->work_in_progress)
289 return;
290
291
292
293
294
295 smp_rmb();
296 lst = READ_ONCE(policy_dbs->last_sample_time);
297 delta_ns = time - lst;
298 if ((s64)delta_ns < policy_dbs->sample_delay_ns)
299 return;
300
301
302
303
304
305
306 if (policy_dbs->is_shared) {
307 if (!atomic_add_unless(&policy_dbs->work_count, 1, 1))
308 return;
309
310
311
312
313
314 if (unlikely(lst != READ_ONCE(policy_dbs->last_sample_time))) {
315 atomic_set(&policy_dbs->work_count, 0);
316 return;
317 }
318 }
319
320 policy_dbs->last_sample_time = time;
321 policy_dbs->work_in_progress = true;
322 irq_work_queue(&policy_dbs->irq_work);
323}
324
325static void gov_set_update_util(struct policy_dbs_info *policy_dbs,
326 unsigned int delay_us)
327{
328 struct cpufreq_policy *policy = policy_dbs->policy;
329 int cpu;
330
331 gov_update_sample_delay(policy_dbs, delay_us);
332 policy_dbs->last_sample_time = 0;
333
334 for_each_cpu(cpu, policy->cpus) {
335 struct cpu_dbs_info *cdbs = &per_cpu(cpu_dbs, cpu);
336
337 cpufreq_add_update_util_hook(cpu, &cdbs->update_util,
338 dbs_update_util_handler);
339 }
340}
341
342static inline void gov_clear_update_util(struct cpufreq_policy *policy)
343{
344 int i;
345
346 for_each_cpu(i, policy->cpus)
347 cpufreq_remove_update_util_hook(i);
348
349 synchronize_rcu();
350}
351
352static struct policy_dbs_info *alloc_policy_dbs_info(struct cpufreq_policy *policy,
353 struct dbs_governor *gov)
354{
355 struct policy_dbs_info *policy_dbs;
356 int j;
357
358
359 policy_dbs = gov->alloc();
360 if (!policy_dbs)
361 return NULL;
362
363 policy_dbs->policy = policy;
364 mutex_init(&policy_dbs->update_mutex);
365 atomic_set(&policy_dbs->work_count, 0);
366 init_irq_work(&policy_dbs->irq_work, dbs_irq_work);
367 INIT_WORK(&policy_dbs->work, dbs_work_handler);
368
369
370 for_each_cpu(j, policy->related_cpus) {
371 struct cpu_dbs_info *j_cdbs = &per_cpu(cpu_dbs, j);
372
373 j_cdbs->policy_dbs = policy_dbs;
374 }
375 return policy_dbs;
376}
377
378static void free_policy_dbs_info(struct policy_dbs_info *policy_dbs,
379 struct dbs_governor *gov)
380{
381 int j;
382
383 mutex_destroy(&policy_dbs->update_mutex);
384
385 for_each_cpu(j, policy_dbs->policy->related_cpus) {
386 struct cpu_dbs_info *j_cdbs = &per_cpu(cpu_dbs, j);
387
388 j_cdbs->policy_dbs = NULL;
389 j_cdbs->update_util.func = NULL;
390 }
391 gov->free(policy_dbs);
392}
393
394int cpufreq_dbs_governor_init(struct cpufreq_policy *policy)
395{
396 struct dbs_governor *gov = dbs_governor_of(policy);
397 struct dbs_data *dbs_data;
398 struct policy_dbs_info *policy_dbs;
399 int ret = 0;
400
401
402 if (policy->governor_data)
403 return -EBUSY;
404
405 policy_dbs = alloc_policy_dbs_info(policy, gov);
406 if (!policy_dbs)
407 return -ENOMEM;
408
409
410 mutex_lock(&gov_dbs_data_mutex);
411
412 dbs_data = gov->gdbs_data;
413 if (dbs_data) {
414 if (WARN_ON(have_governor_per_policy())) {
415 ret = -EINVAL;
416 goto free_policy_dbs_info;
417 }
418 policy_dbs->dbs_data = dbs_data;
419 policy->governor_data = policy_dbs;
420
421 gov_attr_set_get(&dbs_data->attr_set, &policy_dbs->list);
422 goto out;
423 }
424
425 dbs_data = kzalloc(sizeof(*dbs_data), GFP_KERNEL);
426 if (!dbs_data) {
427 ret = -ENOMEM;
428 goto free_policy_dbs_info;
429 }
430
431 gov_attr_set_init(&dbs_data->attr_set, &policy_dbs->list);
432
433 ret = gov->init(dbs_data);
434 if (ret)
435 goto free_policy_dbs_info;
436
437
438
439
440
441
442 dbs_data->sampling_rate = max_t(unsigned int,
443 CPUFREQ_DBS_MIN_SAMPLING_INTERVAL,
444 cpufreq_policy_transition_delay_us(policy));
445
446 if (!have_governor_per_policy())
447 gov->gdbs_data = dbs_data;
448
449 policy_dbs->dbs_data = dbs_data;
450 policy->governor_data = policy_dbs;
451
452 gov->kobj_type.sysfs_ops = &governor_sysfs_ops;
453 ret = kobject_init_and_add(&dbs_data->attr_set.kobj, &gov->kobj_type,
454 get_governor_parent_kobj(policy),
455 "%s", gov->gov.name);
456 if (!ret)
457 goto out;
458
459
460 pr_err("initialization failed (dbs_data kobject init error %d)\n", ret);
461
462 policy->governor_data = NULL;
463
464 if (!have_governor_per_policy())
465 gov->gdbs_data = NULL;
466 gov->exit(dbs_data);
467 kfree(dbs_data);
468
469free_policy_dbs_info:
470 free_policy_dbs_info(policy_dbs, gov);
471
472out:
473 mutex_unlock(&gov_dbs_data_mutex);
474 return ret;
475}
476EXPORT_SYMBOL_GPL(cpufreq_dbs_governor_init);
477
478void cpufreq_dbs_governor_exit(struct cpufreq_policy *policy)
479{
480 struct dbs_governor *gov = dbs_governor_of(policy);
481 struct policy_dbs_info *policy_dbs = policy->governor_data;
482 struct dbs_data *dbs_data = policy_dbs->dbs_data;
483 unsigned int count;
484
485
486 mutex_lock(&gov_dbs_data_mutex);
487
488 count = gov_attr_set_put(&dbs_data->attr_set, &policy_dbs->list);
489
490 policy->governor_data = NULL;
491
492 if (!count) {
493 if (!have_governor_per_policy())
494 gov->gdbs_data = NULL;
495
496 gov->exit(dbs_data);
497 kfree(dbs_data);
498 }
499
500 free_policy_dbs_info(policy_dbs, gov);
501
502 mutex_unlock(&gov_dbs_data_mutex);
503}
504EXPORT_SYMBOL_GPL(cpufreq_dbs_governor_exit);
505
506int cpufreq_dbs_governor_start(struct cpufreq_policy *policy)
507{
508 struct dbs_governor *gov = dbs_governor_of(policy);
509 struct policy_dbs_info *policy_dbs = policy->governor_data;
510 struct dbs_data *dbs_data = policy_dbs->dbs_data;
511 unsigned int sampling_rate, ignore_nice, j;
512 unsigned int io_busy;
513
514 if (!policy->cur)
515 return -EINVAL;
516
517 policy_dbs->is_shared = policy_is_shared(policy);
518 policy_dbs->rate_mult = 1;
519
520 sampling_rate = dbs_data->sampling_rate;
521 ignore_nice = dbs_data->ignore_nice_load;
522 io_busy = dbs_data->io_is_busy;
523
524 for_each_cpu(j, policy->cpus) {
525 struct cpu_dbs_info *j_cdbs = &per_cpu(cpu_dbs, j);
526
527 j_cdbs->prev_cpu_idle = get_cpu_idle_time(j, &j_cdbs->prev_update_time, io_busy);
528
529
530
531 j_cdbs->prev_load = 0;
532
533 if (ignore_nice)
534 j_cdbs->prev_cpu_nice = kcpustat_cpu(j).cpustat[CPUTIME_NICE];
535 }
536
537 gov->start(policy);
538
539 gov_set_update_util(policy_dbs, sampling_rate);
540 return 0;
541}
542EXPORT_SYMBOL_GPL(cpufreq_dbs_governor_start);
543
544void cpufreq_dbs_governor_stop(struct cpufreq_policy *policy)
545{
546 struct policy_dbs_info *policy_dbs = policy->governor_data;
547
548 gov_clear_update_util(policy_dbs->policy);
549 irq_work_sync(&policy_dbs->irq_work);
550 cancel_work_sync(&policy_dbs->work);
551 atomic_set(&policy_dbs->work_count, 0);
552 policy_dbs->work_in_progress = false;
553}
554EXPORT_SYMBOL_GPL(cpufreq_dbs_governor_stop);
555
556void cpufreq_dbs_governor_limits(struct cpufreq_policy *policy)
557{
558 struct policy_dbs_info *policy_dbs;
559
560
561 mutex_lock(&gov_dbs_data_mutex);
562 policy_dbs = policy->governor_data;
563 if (!policy_dbs)
564 goto out;
565
566 mutex_lock(&policy_dbs->update_mutex);
567 cpufreq_policy_apply_limits(policy);
568 gov_update_sample_delay(policy_dbs, 0);
569 mutex_unlock(&policy_dbs->update_mutex);
570
571out:
572 mutex_unlock(&gov_dbs_data_mutex);
573}
574EXPORT_SYMBOL_GPL(cpufreq_dbs_governor_limits);
575