]> git.proxmox.com Git - mirror_ubuntu-bionic-kernel.git/blob - drivers/cpufreq/cpufreq.c
Fix common misspellings
[mirror_ubuntu-bionic-kernel.git] / drivers / cpufreq / cpufreq.c
1 /*
2 * linux/drivers/cpufreq/cpufreq.c
3 *
4 * Copyright (C) 2001 Russell King
5 * (C) 2002 - 2003 Dominik Brodowski <linux@brodo.de>
6 *
7 * Oct 2005 - Ashok Raj <ashok.raj@intel.com>
8 * Added handling for CPU hotplug
9 * Feb 2006 - Jacob Shin <jacob.shin@amd.com>
10 * Fix handling for CPU hotplug -- affected CPUs
11 *
12 * This program is free software; you can redistribute it and/or modify
13 * it under the terms of the GNU General Public License version 2 as
14 * published by the Free Software Foundation.
15 *
16 */
17
18 #include <linux/kernel.h>
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/notifier.h>
22 #include <linux/cpufreq.h>
23 #include <linux/delay.h>
24 #include <linux/interrupt.h>
25 #include <linux/spinlock.h>
26 #include <linux/device.h>
27 #include <linux/slab.h>
28 #include <linux/cpu.h>
29 #include <linux/completion.h>
30 #include <linux/mutex.h>
31 #include <linux/syscore_ops.h>
32
33 #include <trace/events/power.h>
34
35 #define dprintk(msg...) cpufreq_debug_printk(CPUFREQ_DEBUG_CORE, \
36 "cpufreq-core", msg)
37
38 /**
39 * The "cpufreq driver" - the arch- or hardware-dependent low
40 * level driver of CPUFreq support, and its spinlock. This lock
41 * also protects the cpufreq_cpu_data array.
42 */
43 static struct cpufreq_driver *cpufreq_driver;
44 static DEFINE_PER_CPU(struct cpufreq_policy *, cpufreq_cpu_data);
45 #ifdef CONFIG_HOTPLUG_CPU
46 /* This one keeps track of the previously set governor of a removed CPU */
47 static DEFINE_PER_CPU(char[CPUFREQ_NAME_LEN], cpufreq_cpu_governor);
48 #endif
49 static DEFINE_SPINLOCK(cpufreq_driver_lock);
50
51 /*
52 * cpu_policy_rwsem is a per CPU reader-writer semaphore designed to cure
53 * all cpufreq/hotplug/workqueue/etc related lock issues.
54 *
55 * The rules for this semaphore:
56 * - Any routine that wants to read from the policy structure will
57 * do a down_read on this semaphore.
58 * - Any routine that will write to the policy structure and/or may take away
59 * the policy altogether (eg. CPU hotplug), will hold this lock in write
60 * mode before doing so.
61 *
62 * Additional rules:
63 * - All holders of the lock should check to make sure that the CPU they
64 * are concerned with are online after they get the lock.
65 * - Governor routines that can be called in cpufreq hotplug path should not
66 * take this sem as top level hotplug notifier handler takes this.
67 * - Lock should not be held across
68 * __cpufreq_governor(data, CPUFREQ_GOV_STOP);
69 */
70 static DEFINE_PER_CPU(int, cpufreq_policy_cpu);
71 static DEFINE_PER_CPU(struct rw_semaphore, cpu_policy_rwsem);
72
73 #define lock_policy_rwsem(mode, cpu) \
74 static int lock_policy_rwsem_##mode \
75 (int cpu) \
76 { \
77 int policy_cpu = per_cpu(cpufreq_policy_cpu, cpu); \
78 BUG_ON(policy_cpu == -1); \
79 down_##mode(&per_cpu(cpu_policy_rwsem, policy_cpu)); \
80 if (unlikely(!cpu_online(cpu))) { \
81 up_##mode(&per_cpu(cpu_policy_rwsem, policy_cpu)); \
82 return -1; \
83 } \
84 \
85 return 0; \
86 }
87
88 lock_policy_rwsem(read, cpu);
89
90 lock_policy_rwsem(write, cpu);
91
92 static void unlock_policy_rwsem_read(int cpu)
93 {
94 int policy_cpu = per_cpu(cpufreq_policy_cpu, cpu);
95 BUG_ON(policy_cpu == -1);
96 up_read(&per_cpu(cpu_policy_rwsem, policy_cpu));
97 }
98
99 static void unlock_policy_rwsem_write(int cpu)
100 {
101 int policy_cpu = per_cpu(cpufreq_policy_cpu, cpu);
102 BUG_ON(policy_cpu == -1);
103 up_write(&per_cpu(cpu_policy_rwsem, policy_cpu));
104 }
105
106
107 /* internal prototypes */
108 static int __cpufreq_governor(struct cpufreq_policy *policy,
109 unsigned int event);
110 static unsigned int __cpufreq_get(unsigned int cpu);
111 static void handle_update(struct work_struct *work);
112
113 /**
114 * Two notifier lists: the "policy" list is involved in the
115 * validation process for a new CPU frequency policy; the
116 * "transition" list for kernel code that needs to handle
117 * changes to devices when the CPU clock speed changes.
118 * The mutex locks both lists.
119 */
120 static BLOCKING_NOTIFIER_HEAD(cpufreq_policy_notifier_list);
121 static struct srcu_notifier_head cpufreq_transition_notifier_list;
122
123 static bool init_cpufreq_transition_notifier_list_called;
124 static int __init init_cpufreq_transition_notifier_list(void)
125 {
126 srcu_init_notifier_head(&cpufreq_transition_notifier_list);
127 init_cpufreq_transition_notifier_list_called = true;
128 return 0;
129 }
130 pure_initcall(init_cpufreq_transition_notifier_list);
131
132 static LIST_HEAD(cpufreq_governor_list);
133 static DEFINE_MUTEX(cpufreq_governor_mutex);
134
135 struct cpufreq_policy *cpufreq_cpu_get(unsigned int cpu)
136 {
137 struct cpufreq_policy *data;
138 unsigned long flags;
139
140 if (cpu >= nr_cpu_ids)
141 goto err_out;
142
143 /* get the cpufreq driver */
144 spin_lock_irqsave(&cpufreq_driver_lock, flags);
145
146 if (!cpufreq_driver)
147 goto err_out_unlock;
148
149 if (!try_module_get(cpufreq_driver->owner))
150 goto err_out_unlock;
151
152
153 /* get the CPU */
154 data = per_cpu(cpufreq_cpu_data, cpu);
155
156 if (!data)
157 goto err_out_put_module;
158
159 if (!kobject_get(&data->kobj))
160 goto err_out_put_module;
161
162 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
163 return data;
164
165 err_out_put_module:
166 module_put(cpufreq_driver->owner);
167 err_out_unlock:
168 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
169 err_out:
170 return NULL;
171 }
172 EXPORT_SYMBOL_GPL(cpufreq_cpu_get);
173
174
175 void cpufreq_cpu_put(struct cpufreq_policy *data)
176 {
177 kobject_put(&data->kobj);
178 module_put(cpufreq_driver->owner);
179 }
180 EXPORT_SYMBOL_GPL(cpufreq_cpu_put);
181
182
183 /*********************************************************************
184 * UNIFIED DEBUG HELPERS *
185 *********************************************************************/
186 #ifdef CONFIG_CPU_FREQ_DEBUG
187
188 /* what part(s) of the CPUfreq subsystem are debugged? */
189 static unsigned int debug;
190
191 /* is the debug output ratelimit'ed using printk_ratelimit? User can
192 * set or modify this value.
193 */
194 static unsigned int debug_ratelimit = 1;
195
196 /* is the printk_ratelimit'ing enabled? It's enabled after a successful
197 * loading of a cpufreq driver, temporarily disabled when a new policy
198 * is set, and disabled upon cpufreq driver removal
199 */
200 static unsigned int disable_ratelimit = 1;
201 static DEFINE_SPINLOCK(disable_ratelimit_lock);
202
203 static void cpufreq_debug_enable_ratelimit(void)
204 {
205 unsigned long flags;
206
207 spin_lock_irqsave(&disable_ratelimit_lock, flags);
208 if (disable_ratelimit)
209 disable_ratelimit--;
210 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
211 }
212
213 static void cpufreq_debug_disable_ratelimit(void)
214 {
215 unsigned long flags;
216
217 spin_lock_irqsave(&disable_ratelimit_lock, flags);
218 disable_ratelimit++;
219 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
220 }
221
222 void cpufreq_debug_printk(unsigned int type, const char *prefix,
223 const char *fmt, ...)
224 {
225 char s[256];
226 va_list args;
227 unsigned int len;
228 unsigned long flags;
229
230 WARN_ON(!prefix);
231 if (type & debug) {
232 spin_lock_irqsave(&disable_ratelimit_lock, flags);
233 if (!disable_ratelimit && debug_ratelimit
234 && !printk_ratelimit()) {
235 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
236 return;
237 }
238 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
239
240 len = snprintf(s, 256, KERN_DEBUG "%s: ", prefix);
241
242 va_start(args, fmt);
243 len += vsnprintf(&s[len], (256 - len), fmt, args);
244 va_end(args);
245
246 printk(s);
247
248 WARN_ON(len < 5);
249 }
250 }
251 EXPORT_SYMBOL(cpufreq_debug_printk);
252
253
254 module_param(debug, uint, 0644);
255 MODULE_PARM_DESC(debug, "CPUfreq debugging: add 1 to debug core,"
256 " 2 to debug drivers, and 4 to debug governors.");
257
258 module_param(debug_ratelimit, uint, 0644);
259 MODULE_PARM_DESC(debug_ratelimit, "CPUfreq debugging:"
260 " set to 0 to disable ratelimiting.");
261
262 #else /* !CONFIG_CPU_FREQ_DEBUG */
263
264 static inline void cpufreq_debug_enable_ratelimit(void) { return; }
265 static inline void cpufreq_debug_disable_ratelimit(void) { return; }
266
267 #endif /* CONFIG_CPU_FREQ_DEBUG */
268
269
270 /*********************************************************************
271 * EXTERNALLY AFFECTING FREQUENCY CHANGES *
272 *********************************************************************/
273
274 /**
275 * adjust_jiffies - adjust the system "loops_per_jiffy"
276 *
277 * This function alters the system "loops_per_jiffy" for the clock
278 * speed change. Note that loops_per_jiffy cannot be updated on SMP
279 * systems as each CPU might be scaled differently. So, use the arch
280 * per-CPU loops_per_jiffy value wherever possible.
281 */
282 #ifndef CONFIG_SMP
283 static unsigned long l_p_j_ref;
284 static unsigned int l_p_j_ref_freq;
285
286 static void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
287 {
288 if (ci->flags & CPUFREQ_CONST_LOOPS)
289 return;
290
291 if (!l_p_j_ref_freq) {
292 l_p_j_ref = loops_per_jiffy;
293 l_p_j_ref_freq = ci->old;
294 dprintk("saving %lu as reference value for loops_per_jiffy; "
295 "freq is %u kHz\n", l_p_j_ref, l_p_j_ref_freq);
296 }
297 if ((val == CPUFREQ_PRECHANGE && ci->old < ci->new) ||
298 (val == CPUFREQ_POSTCHANGE && ci->old > ci->new) ||
299 (val == CPUFREQ_RESUMECHANGE || val == CPUFREQ_SUSPENDCHANGE)) {
300 loops_per_jiffy = cpufreq_scale(l_p_j_ref, l_p_j_ref_freq,
301 ci->new);
302 dprintk("scaling loops_per_jiffy to %lu "
303 "for frequency %u kHz\n", loops_per_jiffy, ci->new);
304 }
305 }
306 #else
307 static inline void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
308 {
309 return;
310 }
311 #endif
312
313
314 /**
315 * cpufreq_notify_transition - call notifier chain and adjust_jiffies
316 * on frequency transition.
317 *
318 * This function calls the transition notifiers and the "adjust_jiffies"
319 * function. It is called twice on all CPU frequency changes that have
320 * external effects.
321 */
322 void cpufreq_notify_transition(struct cpufreq_freqs *freqs, unsigned int state)
323 {
324 struct cpufreq_policy *policy;
325
326 BUG_ON(irqs_disabled());
327
328 freqs->flags = cpufreq_driver->flags;
329 dprintk("notification %u of frequency transition to %u kHz\n",
330 state, freqs->new);
331
332 policy = per_cpu(cpufreq_cpu_data, freqs->cpu);
333 switch (state) {
334
335 case CPUFREQ_PRECHANGE:
336 /* detect if the driver reported a value as "old frequency"
337 * which is not equal to what the cpufreq core thinks is
338 * "old frequency".
339 */
340 if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
341 if ((policy) && (policy->cpu == freqs->cpu) &&
342 (policy->cur) && (policy->cur != freqs->old)) {
343 dprintk("Warning: CPU frequency is"
344 " %u, cpufreq assumed %u kHz.\n",
345 freqs->old, policy->cur);
346 freqs->old = policy->cur;
347 }
348 }
349 srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
350 CPUFREQ_PRECHANGE, freqs);
351 adjust_jiffies(CPUFREQ_PRECHANGE, freqs);
352 break;
353
354 case CPUFREQ_POSTCHANGE:
355 adjust_jiffies(CPUFREQ_POSTCHANGE, freqs);
356 dprintk("FREQ: %lu - CPU: %lu", (unsigned long)freqs->new,
357 (unsigned long)freqs->cpu);
358 trace_power_frequency(POWER_PSTATE, freqs->new, freqs->cpu);
359 trace_cpu_frequency(freqs->new, freqs->cpu);
360 srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
361 CPUFREQ_POSTCHANGE, freqs);
362 if (likely(policy) && likely(policy->cpu == freqs->cpu))
363 policy->cur = freqs->new;
364 break;
365 }
366 }
367 EXPORT_SYMBOL_GPL(cpufreq_notify_transition);
368
369
370
371 /*********************************************************************
372 * SYSFS INTERFACE *
373 *********************************************************************/
374
375 static struct cpufreq_governor *__find_governor(const char *str_governor)
376 {
377 struct cpufreq_governor *t;
378
379 list_for_each_entry(t, &cpufreq_governor_list, governor_list)
380 if (!strnicmp(str_governor, t->name, CPUFREQ_NAME_LEN))
381 return t;
382
383 return NULL;
384 }
385
386 /**
387 * cpufreq_parse_governor - parse a governor string
388 */
389 static int cpufreq_parse_governor(char *str_governor, unsigned int *policy,
390 struct cpufreq_governor **governor)
391 {
392 int err = -EINVAL;
393
394 if (!cpufreq_driver)
395 goto out;
396
397 if (cpufreq_driver->setpolicy) {
398 if (!strnicmp(str_governor, "performance", CPUFREQ_NAME_LEN)) {
399 *policy = CPUFREQ_POLICY_PERFORMANCE;
400 err = 0;
401 } else if (!strnicmp(str_governor, "powersave",
402 CPUFREQ_NAME_LEN)) {
403 *policy = CPUFREQ_POLICY_POWERSAVE;
404 err = 0;
405 }
406 } else if (cpufreq_driver->target) {
407 struct cpufreq_governor *t;
408
409 mutex_lock(&cpufreq_governor_mutex);
410
411 t = __find_governor(str_governor);
412
413 if (t == NULL) {
414 char *name = kasprintf(GFP_KERNEL, "cpufreq_%s",
415 str_governor);
416
417 if (name) {
418 int ret;
419
420 mutex_unlock(&cpufreq_governor_mutex);
421 ret = request_module("%s", name);
422 mutex_lock(&cpufreq_governor_mutex);
423
424 if (ret == 0)
425 t = __find_governor(str_governor);
426 }
427
428 kfree(name);
429 }
430
431 if (t != NULL) {
432 *governor = t;
433 err = 0;
434 }
435
436 mutex_unlock(&cpufreq_governor_mutex);
437 }
438 out:
439 return err;
440 }
441
442
443 /**
444 * cpufreq_per_cpu_attr_read() / show_##file_name() -
445 * print out cpufreq information
446 *
447 * Write out information from cpufreq_driver->policy[cpu]; object must be
448 * "unsigned int".
449 */
450
451 #define show_one(file_name, object) \
452 static ssize_t show_##file_name \
453 (struct cpufreq_policy *policy, char *buf) \
454 { \
455 return sprintf(buf, "%u\n", policy->object); \
456 }
457
458 show_one(cpuinfo_min_freq, cpuinfo.min_freq);
459 show_one(cpuinfo_max_freq, cpuinfo.max_freq);
460 show_one(cpuinfo_transition_latency, cpuinfo.transition_latency);
461 show_one(scaling_min_freq, min);
462 show_one(scaling_max_freq, max);
463 show_one(scaling_cur_freq, cur);
464
465 static int __cpufreq_set_policy(struct cpufreq_policy *data,
466 struct cpufreq_policy *policy);
467
468 /**
469 * cpufreq_per_cpu_attr_write() / store_##file_name() - sysfs write access
470 */
471 #define store_one(file_name, object) \
472 static ssize_t store_##file_name \
473 (struct cpufreq_policy *policy, const char *buf, size_t count) \
474 { \
475 unsigned int ret = -EINVAL; \
476 struct cpufreq_policy new_policy; \
477 \
478 ret = cpufreq_get_policy(&new_policy, policy->cpu); \
479 if (ret) \
480 return -EINVAL; \
481 \
482 ret = sscanf(buf, "%u", &new_policy.object); \
483 if (ret != 1) \
484 return -EINVAL; \
485 \
486 ret = __cpufreq_set_policy(policy, &new_policy); \
487 policy->user_policy.object = policy->object; \
488 \
489 return ret ? ret : count; \
490 }
491
492 store_one(scaling_min_freq, min);
493 store_one(scaling_max_freq, max);
494
495 /**
496 * show_cpuinfo_cur_freq - current CPU frequency as detected by hardware
497 */
498 static ssize_t show_cpuinfo_cur_freq(struct cpufreq_policy *policy,
499 char *buf)
500 {
501 unsigned int cur_freq = __cpufreq_get(policy->cpu);
502 if (!cur_freq)
503 return sprintf(buf, "<unknown>");
504 return sprintf(buf, "%u\n", cur_freq);
505 }
506
507
508 /**
509 * show_scaling_governor - show the current policy for the specified CPU
510 */
511 static ssize_t show_scaling_governor(struct cpufreq_policy *policy, char *buf)
512 {
513 if (policy->policy == CPUFREQ_POLICY_POWERSAVE)
514 return sprintf(buf, "powersave\n");
515 else if (policy->policy == CPUFREQ_POLICY_PERFORMANCE)
516 return sprintf(buf, "performance\n");
517 else if (policy->governor)
518 return scnprintf(buf, CPUFREQ_NAME_LEN, "%s\n",
519 policy->governor->name);
520 return -EINVAL;
521 }
522
523
524 /**
525 * store_scaling_governor - store policy for the specified CPU
526 */
527 static ssize_t store_scaling_governor(struct cpufreq_policy *policy,
528 const char *buf, size_t count)
529 {
530 unsigned int ret = -EINVAL;
531 char str_governor[16];
532 struct cpufreq_policy new_policy;
533
534 ret = cpufreq_get_policy(&new_policy, policy->cpu);
535 if (ret)
536 return ret;
537
538 ret = sscanf(buf, "%15s", str_governor);
539 if (ret != 1)
540 return -EINVAL;
541
542 if (cpufreq_parse_governor(str_governor, &new_policy.policy,
543 &new_policy.governor))
544 return -EINVAL;
545
546 /* Do not use cpufreq_set_policy here or the user_policy.max
547 will be wrongly overridden */
548 ret = __cpufreq_set_policy(policy, &new_policy);
549
550 policy->user_policy.policy = policy->policy;
551 policy->user_policy.governor = policy->governor;
552
553 if (ret)
554 return ret;
555 else
556 return count;
557 }
558
559 /**
560 * show_scaling_driver - show the cpufreq driver currently loaded
561 */
562 static ssize_t show_scaling_driver(struct cpufreq_policy *policy, char *buf)
563 {
564 return scnprintf(buf, CPUFREQ_NAME_LEN, "%s\n", cpufreq_driver->name);
565 }
566
567 /**
568 * show_scaling_available_governors - show the available CPUfreq governors
569 */
570 static ssize_t show_scaling_available_governors(struct cpufreq_policy *policy,
571 char *buf)
572 {
573 ssize_t i = 0;
574 struct cpufreq_governor *t;
575
576 if (!cpufreq_driver->target) {
577 i += sprintf(buf, "performance powersave");
578 goto out;
579 }
580
581 list_for_each_entry(t, &cpufreq_governor_list, governor_list) {
582 if (i >= (ssize_t) ((PAGE_SIZE / sizeof(char))
583 - (CPUFREQ_NAME_LEN + 2)))
584 goto out;
585 i += scnprintf(&buf[i], CPUFREQ_NAME_LEN, "%s ", t->name);
586 }
587 out:
588 i += sprintf(&buf[i], "\n");
589 return i;
590 }
591
592 static ssize_t show_cpus(const struct cpumask *mask, char *buf)
593 {
594 ssize_t i = 0;
595 unsigned int cpu;
596
597 for_each_cpu(cpu, mask) {
598 if (i)
599 i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), " ");
600 i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), "%u", cpu);
601 if (i >= (PAGE_SIZE - 5))
602 break;
603 }
604 i += sprintf(&buf[i], "\n");
605 return i;
606 }
607
608 /**
609 * show_related_cpus - show the CPUs affected by each transition even if
610 * hw coordination is in use
611 */
612 static ssize_t show_related_cpus(struct cpufreq_policy *policy, char *buf)
613 {
614 if (cpumask_empty(policy->related_cpus))
615 return show_cpus(policy->cpus, buf);
616 return show_cpus(policy->related_cpus, buf);
617 }
618
619 /**
620 * show_affected_cpus - show the CPUs affected by each transition
621 */
622 static ssize_t show_affected_cpus(struct cpufreq_policy *policy, char *buf)
623 {
624 return show_cpus(policy->cpus, buf);
625 }
626
627 static ssize_t store_scaling_setspeed(struct cpufreq_policy *policy,
628 const char *buf, size_t count)
629 {
630 unsigned int freq = 0;
631 unsigned int ret;
632
633 if (!policy->governor || !policy->governor->store_setspeed)
634 return -EINVAL;
635
636 ret = sscanf(buf, "%u", &freq);
637 if (ret != 1)
638 return -EINVAL;
639
640 policy->governor->store_setspeed(policy, freq);
641
642 return count;
643 }
644
645 static ssize_t show_scaling_setspeed(struct cpufreq_policy *policy, char *buf)
646 {
647 if (!policy->governor || !policy->governor->show_setspeed)
648 return sprintf(buf, "<unsupported>\n");
649
650 return policy->governor->show_setspeed(policy, buf);
651 }
652
653 /**
654 * show_scaling_driver - show the current cpufreq HW/BIOS limitation
655 */
656 static ssize_t show_bios_limit(struct cpufreq_policy *policy, char *buf)
657 {
658 unsigned int limit;
659 int ret;
660 if (cpufreq_driver->bios_limit) {
661 ret = cpufreq_driver->bios_limit(policy->cpu, &limit);
662 if (!ret)
663 return sprintf(buf, "%u\n", limit);
664 }
665 return sprintf(buf, "%u\n", policy->cpuinfo.max_freq);
666 }
667
668 cpufreq_freq_attr_ro_perm(cpuinfo_cur_freq, 0400);
669 cpufreq_freq_attr_ro(cpuinfo_min_freq);
670 cpufreq_freq_attr_ro(cpuinfo_max_freq);
671 cpufreq_freq_attr_ro(cpuinfo_transition_latency);
672 cpufreq_freq_attr_ro(scaling_available_governors);
673 cpufreq_freq_attr_ro(scaling_driver);
674 cpufreq_freq_attr_ro(scaling_cur_freq);
675 cpufreq_freq_attr_ro(bios_limit);
676 cpufreq_freq_attr_ro(related_cpus);
677 cpufreq_freq_attr_ro(affected_cpus);
678 cpufreq_freq_attr_rw(scaling_min_freq);
679 cpufreq_freq_attr_rw(scaling_max_freq);
680 cpufreq_freq_attr_rw(scaling_governor);
681 cpufreq_freq_attr_rw(scaling_setspeed);
682
683 static struct attribute *default_attrs[] = {
684 &cpuinfo_min_freq.attr,
685 &cpuinfo_max_freq.attr,
686 &cpuinfo_transition_latency.attr,
687 &scaling_min_freq.attr,
688 &scaling_max_freq.attr,
689 &affected_cpus.attr,
690 &related_cpus.attr,
691 &scaling_governor.attr,
692 &scaling_driver.attr,
693 &scaling_available_governors.attr,
694 &scaling_setspeed.attr,
695 NULL
696 };
697
698 struct kobject *cpufreq_global_kobject;
699 EXPORT_SYMBOL(cpufreq_global_kobject);
700
701 #define to_policy(k) container_of(k, struct cpufreq_policy, kobj)
702 #define to_attr(a) container_of(a, struct freq_attr, attr)
703
704 static ssize_t show(struct kobject *kobj, struct attribute *attr, char *buf)
705 {
706 struct cpufreq_policy *policy = to_policy(kobj);
707 struct freq_attr *fattr = to_attr(attr);
708 ssize_t ret = -EINVAL;
709 policy = cpufreq_cpu_get(policy->cpu);
710 if (!policy)
711 goto no_policy;
712
713 if (lock_policy_rwsem_read(policy->cpu) < 0)
714 goto fail;
715
716 if (fattr->show)
717 ret = fattr->show(policy, buf);
718 else
719 ret = -EIO;
720
721 unlock_policy_rwsem_read(policy->cpu);
722 fail:
723 cpufreq_cpu_put(policy);
724 no_policy:
725 return ret;
726 }
727
728 static ssize_t store(struct kobject *kobj, struct attribute *attr,
729 const char *buf, size_t count)
730 {
731 struct cpufreq_policy *policy = to_policy(kobj);
732 struct freq_attr *fattr = to_attr(attr);
733 ssize_t ret = -EINVAL;
734 policy = cpufreq_cpu_get(policy->cpu);
735 if (!policy)
736 goto no_policy;
737
738 if (lock_policy_rwsem_write(policy->cpu) < 0)
739 goto fail;
740
741 if (fattr->store)
742 ret = fattr->store(policy, buf, count);
743 else
744 ret = -EIO;
745
746 unlock_policy_rwsem_write(policy->cpu);
747 fail:
748 cpufreq_cpu_put(policy);
749 no_policy:
750 return ret;
751 }
752
753 static void cpufreq_sysfs_release(struct kobject *kobj)
754 {
755 struct cpufreq_policy *policy = to_policy(kobj);
756 dprintk("last reference is dropped\n");
757 complete(&policy->kobj_unregister);
758 }
759
760 static const struct sysfs_ops sysfs_ops = {
761 .show = show,
762 .store = store,
763 };
764
765 static struct kobj_type ktype_cpufreq = {
766 .sysfs_ops = &sysfs_ops,
767 .default_attrs = default_attrs,
768 .release = cpufreq_sysfs_release,
769 };
770
771 /*
772 * Returns:
773 * Negative: Failure
774 * 0: Success
775 * Positive: When we have a managed CPU and the sysfs got symlinked
776 */
777 static int cpufreq_add_dev_policy(unsigned int cpu,
778 struct cpufreq_policy *policy,
779 struct sys_device *sys_dev)
780 {
781 int ret = 0;
782 #ifdef CONFIG_SMP
783 unsigned long flags;
784 unsigned int j;
785 #ifdef CONFIG_HOTPLUG_CPU
786 struct cpufreq_governor *gov;
787
788 gov = __find_governor(per_cpu(cpufreq_cpu_governor, cpu));
789 if (gov) {
790 policy->governor = gov;
791 dprintk("Restoring governor %s for cpu %d\n",
792 policy->governor->name, cpu);
793 }
794 #endif
795
796 for_each_cpu(j, policy->cpus) {
797 struct cpufreq_policy *managed_policy;
798
799 if (cpu == j)
800 continue;
801
802 /* Check for existing affected CPUs.
803 * They may not be aware of it due to CPU Hotplug.
804 * cpufreq_cpu_put is called when the device is removed
805 * in __cpufreq_remove_dev()
806 */
807 managed_policy = cpufreq_cpu_get(j);
808 if (unlikely(managed_policy)) {
809
810 /* Set proper policy_cpu */
811 unlock_policy_rwsem_write(cpu);
812 per_cpu(cpufreq_policy_cpu, cpu) = managed_policy->cpu;
813
814 if (lock_policy_rwsem_write(cpu) < 0) {
815 /* Should not go through policy unlock path */
816 if (cpufreq_driver->exit)
817 cpufreq_driver->exit(policy);
818 cpufreq_cpu_put(managed_policy);
819 return -EBUSY;
820 }
821
822 spin_lock_irqsave(&cpufreq_driver_lock, flags);
823 cpumask_copy(managed_policy->cpus, policy->cpus);
824 per_cpu(cpufreq_cpu_data, cpu) = managed_policy;
825 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
826
827 dprintk("CPU already managed, adding link\n");
828 ret = sysfs_create_link(&sys_dev->kobj,
829 &managed_policy->kobj,
830 "cpufreq");
831 if (ret)
832 cpufreq_cpu_put(managed_policy);
833 /*
834 * Success. We only needed to be added to the mask.
835 * Call driver->exit() because only the cpu parent of
836 * the kobj needed to call init().
837 */
838 if (cpufreq_driver->exit)
839 cpufreq_driver->exit(policy);
840
841 if (!ret)
842 return 1;
843 else
844 return ret;
845 }
846 }
847 #endif
848 return ret;
849 }
850
851
852 /* symlink affected CPUs */
853 static int cpufreq_add_dev_symlink(unsigned int cpu,
854 struct cpufreq_policy *policy)
855 {
856 unsigned int j;
857 int ret = 0;
858
859 for_each_cpu(j, policy->cpus) {
860 struct cpufreq_policy *managed_policy;
861 struct sys_device *cpu_sys_dev;
862
863 if (j == cpu)
864 continue;
865 if (!cpu_online(j))
866 continue;
867
868 dprintk("CPU %u already managed, adding link\n", j);
869 managed_policy = cpufreq_cpu_get(cpu);
870 cpu_sys_dev = get_cpu_sysdev(j);
871 ret = sysfs_create_link(&cpu_sys_dev->kobj, &policy->kobj,
872 "cpufreq");
873 if (ret) {
874 cpufreq_cpu_put(managed_policy);
875 return ret;
876 }
877 }
878 return ret;
879 }
880
881 static int cpufreq_add_dev_interface(unsigned int cpu,
882 struct cpufreq_policy *policy,
883 struct sys_device *sys_dev)
884 {
885 struct cpufreq_policy new_policy;
886 struct freq_attr **drv_attr;
887 unsigned long flags;
888 int ret = 0;
889 unsigned int j;
890
891 /* prepare interface data */
892 ret = kobject_init_and_add(&policy->kobj, &ktype_cpufreq,
893 &sys_dev->kobj, "cpufreq");
894 if (ret)
895 return ret;
896
897 /* set up files for this cpu device */
898 drv_attr = cpufreq_driver->attr;
899 while ((drv_attr) && (*drv_attr)) {
900 ret = sysfs_create_file(&policy->kobj, &((*drv_attr)->attr));
901 if (ret)
902 goto err_out_kobj_put;
903 drv_attr++;
904 }
905 if (cpufreq_driver->get) {
906 ret = sysfs_create_file(&policy->kobj, &cpuinfo_cur_freq.attr);
907 if (ret)
908 goto err_out_kobj_put;
909 }
910 if (cpufreq_driver->target) {
911 ret = sysfs_create_file(&policy->kobj, &scaling_cur_freq.attr);
912 if (ret)
913 goto err_out_kobj_put;
914 }
915 if (cpufreq_driver->bios_limit) {
916 ret = sysfs_create_file(&policy->kobj, &bios_limit.attr);
917 if (ret)
918 goto err_out_kobj_put;
919 }
920
921 spin_lock_irqsave(&cpufreq_driver_lock, flags);
922 for_each_cpu(j, policy->cpus) {
923 if (!cpu_online(j))
924 continue;
925 per_cpu(cpufreq_cpu_data, j) = policy;
926 per_cpu(cpufreq_policy_cpu, j) = policy->cpu;
927 }
928 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
929
930 ret = cpufreq_add_dev_symlink(cpu, policy);
931 if (ret)
932 goto err_out_kobj_put;
933
934 memcpy(&new_policy, policy, sizeof(struct cpufreq_policy));
935 /* assure that the starting sequence is run in __cpufreq_set_policy */
936 policy->governor = NULL;
937
938 /* set default policy */
939 ret = __cpufreq_set_policy(policy, &new_policy);
940 policy->user_policy.policy = policy->policy;
941 policy->user_policy.governor = policy->governor;
942
943 if (ret) {
944 dprintk("setting policy failed\n");
945 if (cpufreq_driver->exit)
946 cpufreq_driver->exit(policy);
947 }
948 return ret;
949
950 err_out_kobj_put:
951 kobject_put(&policy->kobj);
952 wait_for_completion(&policy->kobj_unregister);
953 return ret;
954 }
955
956
957 /**
958 * cpufreq_add_dev - add a CPU device
959 *
960 * Adds the cpufreq interface for a CPU device.
961 *
962 * The Oracle says: try running cpufreq registration/unregistration concurrently
963 * with with cpu hotplugging and all hell will break loose. Tried to clean this
964 * mess up, but more thorough testing is needed. - Mathieu
965 */
966 static int cpufreq_add_dev(struct sys_device *sys_dev)
967 {
968 unsigned int cpu = sys_dev->id;
969 int ret = 0, found = 0;
970 struct cpufreq_policy *policy;
971 unsigned long flags;
972 unsigned int j;
973 #ifdef CONFIG_HOTPLUG_CPU
974 int sibling;
975 #endif
976
977 if (cpu_is_offline(cpu))
978 return 0;
979
980 cpufreq_debug_disable_ratelimit();
981 dprintk("adding CPU %u\n", cpu);
982
983 #ifdef CONFIG_SMP
984 /* check whether a different CPU already registered this
985 * CPU because it is in the same boat. */
986 policy = cpufreq_cpu_get(cpu);
987 if (unlikely(policy)) {
988 cpufreq_cpu_put(policy);
989 cpufreq_debug_enable_ratelimit();
990 return 0;
991 }
992 #endif
993
994 if (!try_module_get(cpufreq_driver->owner)) {
995 ret = -EINVAL;
996 goto module_out;
997 }
998
999 ret = -ENOMEM;
1000 policy = kzalloc(sizeof(struct cpufreq_policy), GFP_KERNEL);
1001 if (!policy)
1002 goto nomem_out;
1003
1004 if (!alloc_cpumask_var(&policy->cpus, GFP_KERNEL))
1005 goto err_free_policy;
1006
1007 if (!zalloc_cpumask_var(&policy->related_cpus, GFP_KERNEL))
1008 goto err_free_cpumask;
1009
1010 policy->cpu = cpu;
1011 cpumask_copy(policy->cpus, cpumask_of(cpu));
1012
1013 /* Initially set CPU itself as the policy_cpu */
1014 per_cpu(cpufreq_policy_cpu, cpu) = cpu;
1015 ret = (lock_policy_rwsem_write(cpu) < 0);
1016 WARN_ON(ret);
1017
1018 init_completion(&policy->kobj_unregister);
1019 INIT_WORK(&policy->update, handle_update);
1020
1021 /* Set governor before ->init, so that driver could check it */
1022 #ifdef CONFIG_HOTPLUG_CPU
1023 for_each_online_cpu(sibling) {
1024 struct cpufreq_policy *cp = per_cpu(cpufreq_cpu_data, sibling);
1025 if (cp && cp->governor &&
1026 (cpumask_test_cpu(cpu, cp->related_cpus))) {
1027 policy->governor = cp->governor;
1028 found = 1;
1029 break;
1030 }
1031 }
1032 #endif
1033 if (!found)
1034 policy->governor = CPUFREQ_DEFAULT_GOVERNOR;
1035 /* call driver. From then on the cpufreq must be able
1036 * to accept all calls to ->verify and ->setpolicy for this CPU
1037 */
1038 ret = cpufreq_driver->init(policy);
1039 if (ret) {
1040 dprintk("initialization failed\n");
1041 goto err_unlock_policy;
1042 }
1043 policy->user_policy.min = policy->min;
1044 policy->user_policy.max = policy->max;
1045
1046 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1047 CPUFREQ_START, policy);
1048
1049 ret = cpufreq_add_dev_policy(cpu, policy, sys_dev);
1050 if (ret) {
1051 if (ret > 0)
1052 /* This is a managed cpu, symlink created,
1053 exit with 0 */
1054 ret = 0;
1055 goto err_unlock_policy;
1056 }
1057
1058 ret = cpufreq_add_dev_interface(cpu, policy, sys_dev);
1059 if (ret)
1060 goto err_out_unregister;
1061
1062 unlock_policy_rwsem_write(cpu);
1063
1064 kobject_uevent(&policy->kobj, KOBJ_ADD);
1065 module_put(cpufreq_driver->owner);
1066 dprintk("initialization complete\n");
1067 cpufreq_debug_enable_ratelimit();
1068
1069 return 0;
1070
1071
1072 err_out_unregister:
1073 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1074 for_each_cpu(j, policy->cpus)
1075 per_cpu(cpufreq_cpu_data, j) = NULL;
1076 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1077
1078 kobject_put(&policy->kobj);
1079 wait_for_completion(&policy->kobj_unregister);
1080
1081 err_unlock_policy:
1082 unlock_policy_rwsem_write(cpu);
1083 free_cpumask_var(policy->related_cpus);
1084 err_free_cpumask:
1085 free_cpumask_var(policy->cpus);
1086 err_free_policy:
1087 kfree(policy);
1088 nomem_out:
1089 module_put(cpufreq_driver->owner);
1090 module_out:
1091 cpufreq_debug_enable_ratelimit();
1092 return ret;
1093 }
1094
1095
1096 /**
1097 * __cpufreq_remove_dev - remove a CPU device
1098 *
1099 * Removes the cpufreq interface for a CPU device.
1100 * Caller should already have policy_rwsem in write mode for this CPU.
1101 * This routine frees the rwsem before returning.
1102 */
1103 static int __cpufreq_remove_dev(struct sys_device *sys_dev)
1104 {
1105 unsigned int cpu = sys_dev->id;
1106 unsigned long flags;
1107 struct cpufreq_policy *data;
1108 struct kobject *kobj;
1109 struct completion *cmp;
1110 #ifdef CONFIG_SMP
1111 struct sys_device *cpu_sys_dev;
1112 unsigned int j;
1113 #endif
1114
1115 cpufreq_debug_disable_ratelimit();
1116 dprintk("unregistering CPU %u\n", cpu);
1117
1118 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1119 data = per_cpu(cpufreq_cpu_data, cpu);
1120
1121 if (!data) {
1122 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1123 cpufreq_debug_enable_ratelimit();
1124 unlock_policy_rwsem_write(cpu);
1125 return -EINVAL;
1126 }
1127 per_cpu(cpufreq_cpu_data, cpu) = NULL;
1128
1129
1130 #ifdef CONFIG_SMP
1131 /* if this isn't the CPU which is the parent of the kobj, we
1132 * only need to unlink, put and exit
1133 */
1134 if (unlikely(cpu != data->cpu)) {
1135 dprintk("removing link\n");
1136 cpumask_clear_cpu(cpu, data->cpus);
1137 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1138 kobj = &sys_dev->kobj;
1139 cpufreq_cpu_put(data);
1140 cpufreq_debug_enable_ratelimit();
1141 unlock_policy_rwsem_write(cpu);
1142 sysfs_remove_link(kobj, "cpufreq");
1143 return 0;
1144 }
1145 #endif
1146
1147 #ifdef CONFIG_SMP
1148
1149 #ifdef CONFIG_HOTPLUG_CPU
1150 strncpy(per_cpu(cpufreq_cpu_governor, cpu), data->governor->name,
1151 CPUFREQ_NAME_LEN);
1152 #endif
1153
1154 /* if we have other CPUs still registered, we need to unlink them,
1155 * or else wait_for_completion below will lock up. Clean the
1156 * per_cpu(cpufreq_cpu_data) while holding the lock, and remove
1157 * the sysfs links afterwards.
1158 */
1159 if (unlikely(cpumask_weight(data->cpus) > 1)) {
1160 for_each_cpu(j, data->cpus) {
1161 if (j == cpu)
1162 continue;
1163 per_cpu(cpufreq_cpu_data, j) = NULL;
1164 }
1165 }
1166
1167 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1168
1169 if (unlikely(cpumask_weight(data->cpus) > 1)) {
1170 for_each_cpu(j, data->cpus) {
1171 if (j == cpu)
1172 continue;
1173 dprintk("removing link for cpu %u\n", j);
1174 #ifdef CONFIG_HOTPLUG_CPU
1175 strncpy(per_cpu(cpufreq_cpu_governor, j),
1176 data->governor->name, CPUFREQ_NAME_LEN);
1177 #endif
1178 cpu_sys_dev = get_cpu_sysdev(j);
1179 kobj = &cpu_sys_dev->kobj;
1180 unlock_policy_rwsem_write(cpu);
1181 sysfs_remove_link(kobj, "cpufreq");
1182 lock_policy_rwsem_write(cpu);
1183 cpufreq_cpu_put(data);
1184 }
1185 }
1186 #else
1187 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1188 #endif
1189
1190 if (cpufreq_driver->target)
1191 __cpufreq_governor(data, CPUFREQ_GOV_STOP);
1192
1193 kobj = &data->kobj;
1194 cmp = &data->kobj_unregister;
1195 unlock_policy_rwsem_write(cpu);
1196 kobject_put(kobj);
1197
1198 /* we need to make sure that the underlying kobj is actually
1199 * not referenced anymore by anybody before we proceed with
1200 * unloading.
1201 */
1202 dprintk("waiting for dropping of refcount\n");
1203 wait_for_completion(cmp);
1204 dprintk("wait complete\n");
1205
1206 lock_policy_rwsem_write(cpu);
1207 if (cpufreq_driver->exit)
1208 cpufreq_driver->exit(data);
1209 unlock_policy_rwsem_write(cpu);
1210
1211 free_cpumask_var(data->related_cpus);
1212 free_cpumask_var(data->cpus);
1213 kfree(data);
1214 per_cpu(cpufreq_cpu_data, cpu) = NULL;
1215
1216 cpufreq_debug_enable_ratelimit();
1217 return 0;
1218 }
1219
1220
1221 static int cpufreq_remove_dev(struct sys_device *sys_dev)
1222 {
1223 unsigned int cpu = sys_dev->id;
1224 int retval;
1225
1226 if (cpu_is_offline(cpu))
1227 return 0;
1228
1229 if (unlikely(lock_policy_rwsem_write(cpu)))
1230 BUG();
1231
1232 retval = __cpufreq_remove_dev(sys_dev);
1233 return retval;
1234 }
1235
1236
1237 static void handle_update(struct work_struct *work)
1238 {
1239 struct cpufreq_policy *policy =
1240 container_of(work, struct cpufreq_policy, update);
1241 unsigned int cpu = policy->cpu;
1242 dprintk("handle_update for cpu %u called\n", cpu);
1243 cpufreq_update_policy(cpu);
1244 }
1245
1246 /**
1247 * cpufreq_out_of_sync - If actual and saved CPU frequency differs, we're in deep trouble.
1248 * @cpu: cpu number
1249 * @old_freq: CPU frequency the kernel thinks the CPU runs at
1250 * @new_freq: CPU frequency the CPU actually runs at
1251 *
1252 * We adjust to current frequency first, and need to clean up later.
1253 * So either call to cpufreq_update_policy() or schedule handle_update()).
1254 */
1255 static void cpufreq_out_of_sync(unsigned int cpu, unsigned int old_freq,
1256 unsigned int new_freq)
1257 {
1258 struct cpufreq_freqs freqs;
1259
1260 dprintk("Warning: CPU frequency out of sync: cpufreq and timing "
1261 "core thinks of %u, is %u kHz.\n", old_freq, new_freq);
1262
1263 freqs.cpu = cpu;
1264 freqs.old = old_freq;
1265 freqs.new = new_freq;
1266 cpufreq_notify_transition(&freqs, CPUFREQ_PRECHANGE);
1267 cpufreq_notify_transition(&freqs, CPUFREQ_POSTCHANGE);
1268 }
1269
1270
1271 /**
1272 * cpufreq_quick_get - get the CPU frequency (in kHz) from policy->cur
1273 * @cpu: CPU number
1274 *
1275 * This is the last known freq, without actually getting it from the driver.
1276 * Return value will be same as what is shown in scaling_cur_freq in sysfs.
1277 */
1278 unsigned int cpufreq_quick_get(unsigned int cpu)
1279 {
1280 struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1281 unsigned int ret_freq = 0;
1282
1283 if (policy) {
1284 ret_freq = policy->cur;
1285 cpufreq_cpu_put(policy);
1286 }
1287
1288 return ret_freq;
1289 }
1290 EXPORT_SYMBOL(cpufreq_quick_get);
1291
1292
1293 static unsigned int __cpufreq_get(unsigned int cpu)
1294 {
1295 struct cpufreq_policy *policy = per_cpu(cpufreq_cpu_data, cpu);
1296 unsigned int ret_freq = 0;
1297
1298 if (!cpufreq_driver->get)
1299 return ret_freq;
1300
1301 ret_freq = cpufreq_driver->get(cpu);
1302
1303 if (ret_freq && policy->cur &&
1304 !(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
1305 /* verify no discrepancy between actual and
1306 saved value exists */
1307 if (unlikely(ret_freq != policy->cur)) {
1308 cpufreq_out_of_sync(cpu, policy->cur, ret_freq);
1309 schedule_work(&policy->update);
1310 }
1311 }
1312
1313 return ret_freq;
1314 }
1315
1316 /**
1317 * cpufreq_get - get the current CPU frequency (in kHz)
1318 * @cpu: CPU number
1319 *
1320 * Get the CPU current (static) CPU frequency
1321 */
1322 unsigned int cpufreq_get(unsigned int cpu)
1323 {
1324 unsigned int ret_freq = 0;
1325 struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1326
1327 if (!policy)
1328 goto out;
1329
1330 if (unlikely(lock_policy_rwsem_read(cpu)))
1331 goto out_policy;
1332
1333 ret_freq = __cpufreq_get(cpu);
1334
1335 unlock_policy_rwsem_read(cpu);
1336
1337 out_policy:
1338 cpufreq_cpu_put(policy);
1339 out:
1340 return ret_freq;
1341 }
1342 EXPORT_SYMBOL(cpufreq_get);
1343
1344 static struct sysdev_driver cpufreq_sysdev_driver = {
1345 .add = cpufreq_add_dev,
1346 .remove = cpufreq_remove_dev,
1347 };
1348
1349
1350 /**
1351 * cpufreq_bp_suspend - Prepare the boot CPU for system suspend.
1352 *
1353 * This function is only executed for the boot processor. The other CPUs
1354 * have been put offline by means of CPU hotplug.
1355 */
1356 static int cpufreq_bp_suspend(void)
1357 {
1358 int ret = 0;
1359
1360 int cpu = smp_processor_id();
1361 struct cpufreq_policy *cpu_policy;
1362
1363 dprintk("suspending cpu %u\n", cpu);
1364
1365 /* If there's no policy for the boot CPU, we have nothing to do. */
1366 cpu_policy = cpufreq_cpu_get(cpu);
1367 if (!cpu_policy)
1368 return 0;
1369
1370 if (cpufreq_driver->suspend) {
1371 ret = cpufreq_driver->suspend(cpu_policy);
1372 if (ret)
1373 printk(KERN_ERR "cpufreq: suspend failed in ->suspend "
1374 "step on CPU %u\n", cpu_policy->cpu);
1375 }
1376
1377 cpufreq_cpu_put(cpu_policy);
1378 return ret;
1379 }
1380
1381 /**
1382 * cpufreq_bp_resume - Restore proper frequency handling of the boot CPU.
1383 *
1384 * 1.) resume CPUfreq hardware support (cpufreq_driver->resume())
1385 * 2.) schedule call cpufreq_update_policy() ASAP as interrupts are
1386 * restored. It will verify that the current freq is in sync with
1387 * what we believe it to be. This is a bit later than when it
1388 * should be, but nonethteless it's better than calling
1389 * cpufreq_driver->get() here which might re-enable interrupts...
1390 *
1391 * This function is only executed for the boot CPU. The other CPUs have not
1392 * been turned on yet.
1393 */
1394 static void cpufreq_bp_resume(void)
1395 {
1396 int ret = 0;
1397
1398 int cpu = smp_processor_id();
1399 struct cpufreq_policy *cpu_policy;
1400
1401 dprintk("resuming cpu %u\n", cpu);
1402
1403 /* If there's no policy for the boot CPU, we have nothing to do. */
1404 cpu_policy = cpufreq_cpu_get(cpu);
1405 if (!cpu_policy)
1406 return;
1407
1408 if (cpufreq_driver->resume) {
1409 ret = cpufreq_driver->resume(cpu_policy);
1410 if (ret) {
1411 printk(KERN_ERR "cpufreq: resume failed in ->resume "
1412 "step on CPU %u\n", cpu_policy->cpu);
1413 goto fail;
1414 }
1415 }
1416
1417 schedule_work(&cpu_policy->update);
1418
1419 fail:
1420 cpufreq_cpu_put(cpu_policy);
1421 }
1422
1423 static struct syscore_ops cpufreq_syscore_ops = {
1424 .suspend = cpufreq_bp_suspend,
1425 .resume = cpufreq_bp_resume,
1426 };
1427
1428
1429 /*********************************************************************
1430 * NOTIFIER LISTS INTERFACE *
1431 *********************************************************************/
1432
1433 /**
1434 * cpufreq_register_notifier - register a driver with cpufreq
1435 * @nb: notifier function to register
1436 * @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1437 *
1438 * Add a driver to one of two lists: either a list of drivers that
1439 * are notified about clock rate changes (once before and once after
1440 * the transition), or a list of drivers that are notified about
1441 * changes in cpufreq policy.
1442 *
1443 * This function may sleep, and has the same return conditions as
1444 * blocking_notifier_chain_register.
1445 */
1446 int cpufreq_register_notifier(struct notifier_block *nb, unsigned int list)
1447 {
1448 int ret;
1449
1450 WARN_ON(!init_cpufreq_transition_notifier_list_called);
1451
1452 switch (list) {
1453 case CPUFREQ_TRANSITION_NOTIFIER:
1454 ret = srcu_notifier_chain_register(
1455 &cpufreq_transition_notifier_list, nb);
1456 break;
1457 case CPUFREQ_POLICY_NOTIFIER:
1458 ret = blocking_notifier_chain_register(
1459 &cpufreq_policy_notifier_list, nb);
1460 break;
1461 default:
1462 ret = -EINVAL;
1463 }
1464
1465 return ret;
1466 }
1467 EXPORT_SYMBOL(cpufreq_register_notifier);
1468
1469
1470 /**
1471 * cpufreq_unregister_notifier - unregister a driver with cpufreq
1472 * @nb: notifier block to be unregistered
1473 * @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1474 *
1475 * Remove a driver from the CPU frequency notifier list.
1476 *
1477 * This function may sleep, and has the same return conditions as
1478 * blocking_notifier_chain_unregister.
1479 */
1480 int cpufreq_unregister_notifier(struct notifier_block *nb, unsigned int list)
1481 {
1482 int ret;
1483
1484 switch (list) {
1485 case CPUFREQ_TRANSITION_NOTIFIER:
1486 ret = srcu_notifier_chain_unregister(
1487 &cpufreq_transition_notifier_list, nb);
1488 break;
1489 case CPUFREQ_POLICY_NOTIFIER:
1490 ret = blocking_notifier_chain_unregister(
1491 &cpufreq_policy_notifier_list, nb);
1492 break;
1493 default:
1494 ret = -EINVAL;
1495 }
1496
1497 return ret;
1498 }
1499 EXPORT_SYMBOL(cpufreq_unregister_notifier);
1500
1501
1502 /*********************************************************************
1503 * GOVERNORS *
1504 *********************************************************************/
1505
1506
1507 int __cpufreq_driver_target(struct cpufreq_policy *policy,
1508 unsigned int target_freq,
1509 unsigned int relation)
1510 {
1511 int retval = -EINVAL;
1512
1513 dprintk("target for CPU %u: %u kHz, relation %u\n", policy->cpu,
1514 target_freq, relation);
1515 if (cpu_online(policy->cpu) && cpufreq_driver->target)
1516 retval = cpufreq_driver->target(policy, target_freq, relation);
1517
1518 return retval;
1519 }
1520 EXPORT_SYMBOL_GPL(__cpufreq_driver_target);
1521
1522 int cpufreq_driver_target(struct cpufreq_policy *policy,
1523 unsigned int target_freq,
1524 unsigned int relation)
1525 {
1526 int ret = -EINVAL;
1527
1528 policy = cpufreq_cpu_get(policy->cpu);
1529 if (!policy)
1530 goto no_policy;
1531
1532 if (unlikely(lock_policy_rwsem_write(policy->cpu)))
1533 goto fail;
1534
1535 ret = __cpufreq_driver_target(policy, target_freq, relation);
1536
1537 unlock_policy_rwsem_write(policy->cpu);
1538
1539 fail:
1540 cpufreq_cpu_put(policy);
1541 no_policy:
1542 return ret;
1543 }
1544 EXPORT_SYMBOL_GPL(cpufreq_driver_target);
1545
1546 int __cpufreq_driver_getavg(struct cpufreq_policy *policy, unsigned int cpu)
1547 {
1548 int ret = 0;
1549
1550 policy = cpufreq_cpu_get(policy->cpu);
1551 if (!policy)
1552 return -EINVAL;
1553
1554 if (cpu_online(cpu) && cpufreq_driver->getavg)
1555 ret = cpufreq_driver->getavg(policy, cpu);
1556
1557 cpufreq_cpu_put(policy);
1558 return ret;
1559 }
1560 EXPORT_SYMBOL_GPL(__cpufreq_driver_getavg);
1561
1562 /*
1563 * when "event" is CPUFREQ_GOV_LIMITS
1564 */
1565
1566 static int __cpufreq_governor(struct cpufreq_policy *policy,
1567 unsigned int event)
1568 {
1569 int ret;
1570
1571 /* Only must be defined when default governor is known to have latency
1572 restrictions, like e.g. conservative or ondemand.
1573 That this is the case is already ensured in Kconfig
1574 */
1575 #ifdef CONFIG_CPU_FREQ_GOV_PERFORMANCE
1576 struct cpufreq_governor *gov = &cpufreq_gov_performance;
1577 #else
1578 struct cpufreq_governor *gov = NULL;
1579 #endif
1580
1581 if (policy->governor->max_transition_latency &&
1582 policy->cpuinfo.transition_latency >
1583 policy->governor->max_transition_latency) {
1584 if (!gov)
1585 return -EINVAL;
1586 else {
1587 printk(KERN_WARNING "%s governor failed, too long"
1588 " transition latency of HW, fallback"
1589 " to %s governor\n",
1590 policy->governor->name,
1591 gov->name);
1592 policy->governor = gov;
1593 }
1594 }
1595
1596 if (!try_module_get(policy->governor->owner))
1597 return -EINVAL;
1598
1599 dprintk("__cpufreq_governor for CPU %u, event %u\n",
1600 policy->cpu, event);
1601 ret = policy->governor->governor(policy, event);
1602
1603 /* we keep one module reference alive for
1604 each CPU governed by this CPU */
1605 if ((event != CPUFREQ_GOV_START) || ret)
1606 module_put(policy->governor->owner);
1607 if ((event == CPUFREQ_GOV_STOP) && !ret)
1608 module_put(policy->governor->owner);
1609
1610 return ret;
1611 }
1612
1613
1614 int cpufreq_register_governor(struct cpufreq_governor *governor)
1615 {
1616 int err;
1617
1618 if (!governor)
1619 return -EINVAL;
1620
1621 mutex_lock(&cpufreq_governor_mutex);
1622
1623 err = -EBUSY;
1624 if (__find_governor(governor->name) == NULL) {
1625 err = 0;
1626 list_add(&governor->governor_list, &cpufreq_governor_list);
1627 }
1628
1629 mutex_unlock(&cpufreq_governor_mutex);
1630 return err;
1631 }
1632 EXPORT_SYMBOL_GPL(cpufreq_register_governor);
1633
1634
1635 void cpufreq_unregister_governor(struct cpufreq_governor *governor)
1636 {
1637 #ifdef CONFIG_HOTPLUG_CPU
1638 int cpu;
1639 #endif
1640
1641 if (!governor)
1642 return;
1643
1644 #ifdef CONFIG_HOTPLUG_CPU
1645 for_each_present_cpu(cpu) {
1646 if (cpu_online(cpu))
1647 continue;
1648 if (!strcmp(per_cpu(cpufreq_cpu_governor, cpu), governor->name))
1649 strcpy(per_cpu(cpufreq_cpu_governor, cpu), "\0");
1650 }
1651 #endif
1652
1653 mutex_lock(&cpufreq_governor_mutex);
1654 list_del(&governor->governor_list);
1655 mutex_unlock(&cpufreq_governor_mutex);
1656 return;
1657 }
1658 EXPORT_SYMBOL_GPL(cpufreq_unregister_governor);
1659
1660
1661
1662 /*********************************************************************
1663 * POLICY INTERFACE *
1664 *********************************************************************/
1665
1666 /**
1667 * cpufreq_get_policy - get the current cpufreq_policy
1668 * @policy: struct cpufreq_policy into which the current cpufreq_policy
1669 * is written
1670 *
1671 * Reads the current cpufreq policy.
1672 */
1673 int cpufreq_get_policy(struct cpufreq_policy *policy, unsigned int cpu)
1674 {
1675 struct cpufreq_policy *cpu_policy;
1676 if (!policy)
1677 return -EINVAL;
1678
1679 cpu_policy = cpufreq_cpu_get(cpu);
1680 if (!cpu_policy)
1681 return -EINVAL;
1682
1683 memcpy(policy, cpu_policy, sizeof(struct cpufreq_policy));
1684
1685 cpufreq_cpu_put(cpu_policy);
1686 return 0;
1687 }
1688 EXPORT_SYMBOL(cpufreq_get_policy);
1689
1690
1691 /*
1692 * data : current policy.
1693 * policy : policy to be set.
1694 */
1695 static int __cpufreq_set_policy(struct cpufreq_policy *data,
1696 struct cpufreq_policy *policy)
1697 {
1698 int ret = 0;
1699
1700 cpufreq_debug_disable_ratelimit();
1701 dprintk("setting new policy for CPU %u: %u - %u kHz\n", policy->cpu,
1702 policy->min, policy->max);
1703
1704 memcpy(&policy->cpuinfo, &data->cpuinfo,
1705 sizeof(struct cpufreq_cpuinfo));
1706
1707 if (policy->min > data->max || policy->max < data->min) {
1708 ret = -EINVAL;
1709 goto error_out;
1710 }
1711
1712 /* verify the cpu speed can be set within this limit */
1713 ret = cpufreq_driver->verify(policy);
1714 if (ret)
1715 goto error_out;
1716
1717 /* adjust if necessary - all reasons */
1718 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1719 CPUFREQ_ADJUST, policy);
1720
1721 /* adjust if necessary - hardware incompatibility*/
1722 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1723 CPUFREQ_INCOMPATIBLE, policy);
1724
1725 /* verify the cpu speed can be set within this limit,
1726 which might be different to the first one */
1727 ret = cpufreq_driver->verify(policy);
1728 if (ret)
1729 goto error_out;
1730
1731 /* notification of the new policy */
1732 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1733 CPUFREQ_NOTIFY, policy);
1734
1735 data->min = policy->min;
1736 data->max = policy->max;
1737
1738 dprintk("new min and max freqs are %u - %u kHz\n",
1739 data->min, data->max);
1740
1741 if (cpufreq_driver->setpolicy) {
1742 data->policy = policy->policy;
1743 dprintk("setting range\n");
1744 ret = cpufreq_driver->setpolicy(policy);
1745 } else {
1746 if (policy->governor != data->governor) {
1747 /* save old, working values */
1748 struct cpufreq_governor *old_gov = data->governor;
1749
1750 dprintk("governor switch\n");
1751
1752 /* end old governor */
1753 if (data->governor)
1754 __cpufreq_governor(data, CPUFREQ_GOV_STOP);
1755
1756 /* start new governor */
1757 data->governor = policy->governor;
1758 if (__cpufreq_governor(data, CPUFREQ_GOV_START)) {
1759 /* new governor failed, so re-start old one */
1760 dprintk("starting governor %s failed\n",
1761 data->governor->name);
1762 if (old_gov) {
1763 data->governor = old_gov;
1764 __cpufreq_governor(data,
1765 CPUFREQ_GOV_START);
1766 }
1767 ret = -EINVAL;
1768 goto error_out;
1769 }
1770 /* might be a policy change, too, so fall through */
1771 }
1772 dprintk("governor: change or update limits\n");
1773 __cpufreq_governor(data, CPUFREQ_GOV_LIMITS);
1774 }
1775
1776 error_out:
1777 cpufreq_debug_enable_ratelimit();
1778 return ret;
1779 }
1780
1781 /**
1782 * cpufreq_update_policy - re-evaluate an existing cpufreq policy
1783 * @cpu: CPU which shall be re-evaluated
1784 *
1785 * Useful for policy notifiers which have different necessities
1786 * at different times.
1787 */
1788 int cpufreq_update_policy(unsigned int cpu)
1789 {
1790 struct cpufreq_policy *data = cpufreq_cpu_get(cpu);
1791 struct cpufreq_policy policy;
1792 int ret;
1793
1794 if (!data) {
1795 ret = -ENODEV;
1796 goto no_policy;
1797 }
1798
1799 if (unlikely(lock_policy_rwsem_write(cpu))) {
1800 ret = -EINVAL;
1801 goto fail;
1802 }
1803
1804 dprintk("updating policy for CPU %u\n", cpu);
1805 memcpy(&policy, data, sizeof(struct cpufreq_policy));
1806 policy.min = data->user_policy.min;
1807 policy.max = data->user_policy.max;
1808 policy.policy = data->user_policy.policy;
1809 policy.governor = data->user_policy.governor;
1810
1811 /* BIOS might change freq behind our back
1812 -> ask driver for current freq and notify governors about a change */
1813 if (cpufreq_driver->get) {
1814 policy.cur = cpufreq_driver->get(cpu);
1815 if (!data->cur) {
1816 dprintk("Driver did not initialize current freq");
1817 data->cur = policy.cur;
1818 } else {
1819 if (data->cur != policy.cur)
1820 cpufreq_out_of_sync(cpu, data->cur,
1821 policy.cur);
1822 }
1823 }
1824
1825 ret = __cpufreq_set_policy(data, &policy);
1826
1827 unlock_policy_rwsem_write(cpu);
1828
1829 fail:
1830 cpufreq_cpu_put(data);
1831 no_policy:
1832 return ret;
1833 }
1834 EXPORT_SYMBOL(cpufreq_update_policy);
1835
1836 static int __cpuinit cpufreq_cpu_callback(struct notifier_block *nfb,
1837 unsigned long action, void *hcpu)
1838 {
1839 unsigned int cpu = (unsigned long)hcpu;
1840 struct sys_device *sys_dev;
1841
1842 sys_dev = get_cpu_sysdev(cpu);
1843 if (sys_dev) {
1844 switch (action) {
1845 case CPU_ONLINE:
1846 case CPU_ONLINE_FROZEN:
1847 cpufreq_add_dev(sys_dev);
1848 break;
1849 case CPU_DOWN_PREPARE:
1850 case CPU_DOWN_PREPARE_FROZEN:
1851 if (unlikely(lock_policy_rwsem_write(cpu)))
1852 BUG();
1853
1854 __cpufreq_remove_dev(sys_dev);
1855 break;
1856 case CPU_DOWN_FAILED:
1857 case CPU_DOWN_FAILED_FROZEN:
1858 cpufreq_add_dev(sys_dev);
1859 break;
1860 }
1861 }
1862 return NOTIFY_OK;
1863 }
1864
1865 static struct notifier_block __refdata cpufreq_cpu_notifier = {
1866 .notifier_call = cpufreq_cpu_callback,
1867 };
1868
1869 /*********************************************************************
1870 * REGISTER / UNREGISTER CPUFREQ DRIVER *
1871 *********************************************************************/
1872
1873 /**
1874 * cpufreq_register_driver - register a CPU Frequency driver
1875 * @driver_data: A struct cpufreq_driver containing the values#
1876 * submitted by the CPU Frequency driver.
1877 *
1878 * Registers a CPU Frequency driver to this core code. This code
1879 * returns zero on success, -EBUSY when another driver got here first
1880 * (and isn't unregistered in the meantime).
1881 *
1882 */
1883 int cpufreq_register_driver(struct cpufreq_driver *driver_data)
1884 {
1885 unsigned long flags;
1886 int ret;
1887
1888 if (!driver_data || !driver_data->verify || !driver_data->init ||
1889 ((!driver_data->setpolicy) && (!driver_data->target)))
1890 return -EINVAL;
1891
1892 dprintk("trying to register driver %s\n", driver_data->name);
1893
1894 if (driver_data->setpolicy)
1895 driver_data->flags |= CPUFREQ_CONST_LOOPS;
1896
1897 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1898 if (cpufreq_driver) {
1899 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1900 return -EBUSY;
1901 }
1902 cpufreq_driver = driver_data;
1903 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1904
1905 ret = sysdev_driver_register(&cpu_sysdev_class,
1906 &cpufreq_sysdev_driver);
1907 if (ret)
1908 goto err_null_driver;
1909
1910 if (!(cpufreq_driver->flags & CPUFREQ_STICKY)) {
1911 int i;
1912 ret = -ENODEV;
1913
1914 /* check for at least one working CPU */
1915 for (i = 0; i < nr_cpu_ids; i++)
1916 if (cpu_possible(i) && per_cpu(cpufreq_cpu_data, i)) {
1917 ret = 0;
1918 break;
1919 }
1920
1921 /* if all ->init() calls failed, unregister */
1922 if (ret) {
1923 dprintk("no CPU initialized for driver %s\n",
1924 driver_data->name);
1925 goto err_sysdev_unreg;
1926 }
1927 }
1928
1929 register_hotcpu_notifier(&cpufreq_cpu_notifier);
1930 dprintk("driver %s up and running\n", driver_data->name);
1931 cpufreq_debug_enable_ratelimit();
1932
1933 return 0;
1934 err_sysdev_unreg:
1935 sysdev_driver_unregister(&cpu_sysdev_class,
1936 &cpufreq_sysdev_driver);
1937 err_null_driver:
1938 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1939 cpufreq_driver = NULL;
1940 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1941 return ret;
1942 }
1943 EXPORT_SYMBOL_GPL(cpufreq_register_driver);
1944
1945
1946 /**
1947 * cpufreq_unregister_driver - unregister the current CPUFreq driver
1948 *
1949 * Unregister the current CPUFreq driver. Only call this if you have
1950 * the right to do so, i.e. if you have succeeded in initialising before!
1951 * Returns zero if successful, and -EINVAL if the cpufreq_driver is
1952 * currently not initialised.
1953 */
1954 int cpufreq_unregister_driver(struct cpufreq_driver *driver)
1955 {
1956 unsigned long flags;
1957
1958 cpufreq_debug_disable_ratelimit();
1959
1960 if (!cpufreq_driver || (driver != cpufreq_driver)) {
1961 cpufreq_debug_enable_ratelimit();
1962 return -EINVAL;
1963 }
1964
1965 dprintk("unregistering driver %s\n", driver->name);
1966
1967 sysdev_driver_unregister(&cpu_sysdev_class, &cpufreq_sysdev_driver);
1968 unregister_hotcpu_notifier(&cpufreq_cpu_notifier);
1969
1970 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1971 cpufreq_driver = NULL;
1972 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1973
1974 return 0;
1975 }
1976 EXPORT_SYMBOL_GPL(cpufreq_unregister_driver);
1977
1978 static int __init cpufreq_core_init(void)
1979 {
1980 int cpu;
1981
1982 for_each_possible_cpu(cpu) {
1983 per_cpu(cpufreq_policy_cpu, cpu) = -1;
1984 init_rwsem(&per_cpu(cpu_policy_rwsem, cpu));
1985 }
1986
1987 cpufreq_global_kobject = kobject_create_and_add("cpufreq",
1988 &cpu_sysdev_class.kset.kobj);
1989 BUG_ON(!cpufreq_global_kobject);
1990 register_syscore_ops(&cpufreq_syscore_ops);
1991
1992 return 0;
1993 }
1994 core_initcall(cpufreq_core_init);