2 * linux/drivers/cpufreq/cpufreq.c
4 * Copyright (C) 2001 Russell King
5 * (C) 2002 - 2003 Dominik Brodowski <linux@brodo.de>
7 * Oct 2005 - Ashok Raj <ashok.raj@intel.com>
8 * Added handling for CPU hotplug
9 * Feb 2006 - Jacob Shin <jacob.shin@amd.com>
10 * Fix handling for CPU hotplug -- affected CPUs
12 * This program is free software; you can redistribute it and/or modify
13 * it under the terms of the GNU General Public License version 2 as
14 * published by the Free Software Foundation.
18 #include <linux/kernel.h>
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/notifier.h>
22 #include <linux/cpufreq.h>
23 #include <linux/delay.h>
24 #include <linux/interrupt.h>
25 #include <linux/spinlock.h>
26 #include <linux/device.h>
27 #include <linux/slab.h>
28 #include <linux/cpu.h>
29 #include <linux/completion.h>
30 #include <linux/mutex.h>
32 #define dprintk(msg...) cpufreq_debug_printk(CPUFREQ_DEBUG_CORE, \
36 * The "cpufreq driver" - the arch- or hardware-dependent low
37 * level driver of CPUFreq support, and its spinlock. This lock
38 * also protects the cpufreq_cpu_data array.
40 static struct cpufreq_driver *cpufreq_driver;
41 static struct cpufreq_policy *cpufreq_cpu_data[NR_CPUS];
42 static DEFINE_SPINLOCK(cpufreq_driver_lock);
44 /* internal prototypes */
45 static int __cpufreq_governor(struct cpufreq_policy *policy, unsigned int event);
46 static void handle_update(struct work_struct *work);
49 * Two notifier lists: the "policy" list is involved in the
50 * validation process for a new CPU frequency policy; the
51 * "transition" list for kernel code that needs to handle
52 * changes to devices when the CPU clock speed changes.
53 * The mutex locks both lists.
55 static BLOCKING_NOTIFIER_HEAD(cpufreq_policy_notifier_list);
56 static struct srcu_notifier_head cpufreq_transition_notifier_list;
58 static int __init init_cpufreq_transition_notifier_list(void)
60 srcu_init_notifier_head(&cpufreq_transition_notifier_list);
63 pure_initcall(init_cpufreq_transition_notifier_list);
65 static LIST_HEAD(cpufreq_governor_list);
66 static DEFINE_MUTEX (cpufreq_governor_mutex);
68 struct cpufreq_policy *cpufreq_cpu_get(unsigned int cpu)
70 struct cpufreq_policy *data;
76 /* get the cpufreq driver */
77 spin_lock_irqsave(&cpufreq_driver_lock, flags);
82 if (!try_module_get(cpufreq_driver->owner))
87 data = cpufreq_cpu_data[cpu];
90 goto err_out_put_module;
92 if (!kobject_get(&data->kobj))
93 goto err_out_put_module;
95 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
99 module_put(cpufreq_driver->owner);
101 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
105 EXPORT_SYMBOL_GPL(cpufreq_cpu_get);
108 void cpufreq_cpu_put(struct cpufreq_policy *data)
110 kobject_put(&data->kobj);
111 module_put(cpufreq_driver->owner);
113 EXPORT_SYMBOL_GPL(cpufreq_cpu_put);
116 /*********************************************************************
117 * UNIFIED DEBUG HELPERS *
118 *********************************************************************/
119 #ifdef CONFIG_CPU_FREQ_DEBUG
121 /* what part(s) of the CPUfreq subsystem are debugged? */
122 static unsigned int debug;
124 /* is the debug output ratelimit'ed using printk_ratelimit? User can
125 * set or modify this value.
127 static unsigned int debug_ratelimit = 1;
129 /* is the printk_ratelimit'ing enabled? It's enabled after a successful
130 * loading of a cpufreq driver, temporarily disabled when a new policy
131 * is set, and disabled upon cpufreq driver removal
133 static unsigned int disable_ratelimit = 1;
134 static DEFINE_SPINLOCK(disable_ratelimit_lock);
136 static void cpufreq_debug_enable_ratelimit(void)
140 spin_lock_irqsave(&disable_ratelimit_lock, flags);
141 if (disable_ratelimit)
143 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
146 static void cpufreq_debug_disable_ratelimit(void)
150 spin_lock_irqsave(&disable_ratelimit_lock, flags);
152 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
155 void cpufreq_debug_printk(unsigned int type, const char *prefix,
156 const char *fmt, ...)
165 spin_lock_irqsave(&disable_ratelimit_lock, flags);
166 if (!disable_ratelimit && debug_ratelimit
167 && !printk_ratelimit()) {
168 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
171 spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
173 len = snprintf(s, 256, KERN_DEBUG "%s: ", prefix);
176 len += vsnprintf(&s[len], (256 - len), fmt, args);
184 EXPORT_SYMBOL(cpufreq_debug_printk);
187 module_param(debug, uint, 0644);
188 MODULE_PARM_DESC(debug, "CPUfreq debugging: add 1 to debug core,"
189 " 2 to debug drivers, and 4 to debug governors.");
191 module_param(debug_ratelimit, uint, 0644);
192 MODULE_PARM_DESC(debug_ratelimit, "CPUfreq debugging:"
193 " set to 0 to disable ratelimiting.");
195 #else /* !CONFIG_CPU_FREQ_DEBUG */
197 static inline void cpufreq_debug_enable_ratelimit(void) { return; }
198 static inline void cpufreq_debug_disable_ratelimit(void) { return; }
200 #endif /* CONFIG_CPU_FREQ_DEBUG */
203 /*********************************************************************
204 * EXTERNALLY AFFECTING FREQUENCY CHANGES *
205 *********************************************************************/
208 * adjust_jiffies - adjust the system "loops_per_jiffy"
210 * This function alters the system "loops_per_jiffy" for the clock
211 * speed change. Note that loops_per_jiffy cannot be updated on SMP
212 * systems as each CPU might be scaled differently. So, use the arch
213 * per-CPU loops_per_jiffy value wherever possible.
216 static unsigned long l_p_j_ref;
217 static unsigned int l_p_j_ref_freq;
219 static void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
221 if (ci->flags & CPUFREQ_CONST_LOOPS)
224 if (!l_p_j_ref_freq) {
225 l_p_j_ref = loops_per_jiffy;
226 l_p_j_ref_freq = ci->old;
227 dprintk("saving %lu as reference value for loops_per_jiffy;"
228 "freq is %u kHz\n", l_p_j_ref, l_p_j_ref_freq);
230 if ((val == CPUFREQ_PRECHANGE && ci->old < ci->new) ||
231 (val == CPUFREQ_POSTCHANGE && ci->old > ci->new) ||
232 (val == CPUFREQ_RESUMECHANGE || val == CPUFREQ_SUSPENDCHANGE)) {
233 loops_per_jiffy = cpufreq_scale(l_p_j_ref, l_p_j_ref_freq,
235 dprintk("scaling loops_per_jiffy to %lu"
236 "for frequency %u kHz\n", loops_per_jiffy, ci->new);
240 static inline void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
248 * cpufreq_notify_transition - call notifier chain and adjust_jiffies
249 * on frequency transition.
251 * This function calls the transition notifiers and the "adjust_jiffies"
252 * function. It is called twice on all CPU frequency changes that have
255 void cpufreq_notify_transition(struct cpufreq_freqs *freqs, unsigned int state)
257 struct cpufreq_policy *policy;
259 BUG_ON(irqs_disabled());
261 freqs->flags = cpufreq_driver->flags;
262 dprintk("notification %u of frequency transition to %u kHz\n",
265 policy = cpufreq_cpu_data[freqs->cpu];
268 case CPUFREQ_PRECHANGE:
269 /* detect if the driver reported a value as "old frequency"
270 * which is not equal to what the cpufreq core thinks is
273 if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
274 if ((policy) && (policy->cpu == freqs->cpu) &&
275 (policy->cur) && (policy->cur != freqs->old)) {
276 dprintk("Warning: CPU frequency is"
277 " %u, cpufreq assumed %u kHz.\n",
278 freqs->old, policy->cur);
279 freqs->old = policy->cur;
282 srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
283 CPUFREQ_PRECHANGE, freqs);
284 adjust_jiffies(CPUFREQ_PRECHANGE, freqs);
287 case CPUFREQ_POSTCHANGE:
288 adjust_jiffies(CPUFREQ_POSTCHANGE, freqs);
289 srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
290 CPUFREQ_POSTCHANGE, freqs);
291 if (likely(policy) && likely(policy->cpu == freqs->cpu))
292 policy->cur = freqs->new;
296 EXPORT_SYMBOL_GPL(cpufreq_notify_transition);
300 /*********************************************************************
302 *********************************************************************/
304 static struct cpufreq_governor *__find_governor(const char *str_governor)
306 struct cpufreq_governor *t;
308 list_for_each_entry(t, &cpufreq_governor_list, governor_list)
309 if (!strnicmp(str_governor,t->name,CPUFREQ_NAME_LEN))
316 * cpufreq_parse_governor - parse a governor string
318 static int cpufreq_parse_governor (char *str_governor, unsigned int *policy,
319 struct cpufreq_governor **governor)
326 if (cpufreq_driver->setpolicy) {
327 if (!strnicmp(str_governor, "performance", CPUFREQ_NAME_LEN)) {
328 *policy = CPUFREQ_POLICY_PERFORMANCE;
330 } else if (!strnicmp(str_governor, "powersave",
332 *policy = CPUFREQ_POLICY_POWERSAVE;
335 } else if (cpufreq_driver->target) {
336 struct cpufreq_governor *t;
338 mutex_lock(&cpufreq_governor_mutex);
340 t = __find_governor(str_governor);
343 char *name = kasprintf(GFP_KERNEL, "cpufreq_%s",
349 mutex_unlock(&cpufreq_governor_mutex);
350 ret = request_module(name);
351 mutex_lock(&cpufreq_governor_mutex);
354 t = __find_governor(str_governor);
365 mutex_unlock(&cpufreq_governor_mutex);
372 /* drivers/base/cpu.c */
373 extern struct sysdev_class cpu_sysdev_class;
377 * cpufreq_per_cpu_attr_read() / show_##file_name() -
378 * print out cpufreq information
380 * Write out information from cpufreq_driver->policy[cpu]; object must be
384 #define show_one(file_name, object) \
385 static ssize_t show_##file_name \
386 (struct cpufreq_policy * policy, char *buf) \
388 return sprintf (buf, "%u\n", policy->object); \
391 show_one(cpuinfo_min_freq, cpuinfo.min_freq);
392 show_one(cpuinfo_max_freq, cpuinfo.max_freq);
393 show_one(scaling_min_freq, min);
394 show_one(scaling_max_freq, max);
395 show_one(scaling_cur_freq, cur);
397 static int __cpufreq_set_policy(struct cpufreq_policy *data,
398 struct cpufreq_policy *policy);
401 * cpufreq_per_cpu_attr_write() / store_##file_name() - sysfs write access
403 #define store_one(file_name, object) \
404 static ssize_t store_##file_name \
405 (struct cpufreq_policy * policy, const char *buf, size_t count) \
407 unsigned int ret = -EINVAL; \
408 struct cpufreq_policy new_policy; \
410 ret = cpufreq_get_policy(&new_policy, policy->cpu); \
414 ret = sscanf (buf, "%u", &new_policy.object); \
418 lock_cpu_hotplug(); \
419 mutex_lock(&policy->lock); \
420 ret = __cpufreq_set_policy(policy, &new_policy); \
421 policy->user_policy.object = policy->object; \
422 mutex_unlock(&policy->lock); \
423 unlock_cpu_hotplug(); \
425 return ret ? ret : count; \
428 store_one(scaling_min_freq,min);
429 store_one(scaling_max_freq,max);
432 * show_cpuinfo_cur_freq - current CPU frequency as detected by hardware
434 static ssize_t show_cpuinfo_cur_freq (struct cpufreq_policy * policy,
437 unsigned int cur_freq = cpufreq_get(policy->cpu);
439 return sprintf(buf, "<unknown>");
440 return sprintf(buf, "%u\n", cur_freq);
445 * show_scaling_governor - show the current policy for the specified CPU
447 static ssize_t show_scaling_governor (struct cpufreq_policy * policy,
450 if(policy->policy == CPUFREQ_POLICY_POWERSAVE)
451 return sprintf(buf, "powersave\n");
452 else if (policy->policy == CPUFREQ_POLICY_PERFORMANCE)
453 return sprintf(buf, "performance\n");
454 else if (policy->governor)
455 return scnprintf(buf, CPUFREQ_NAME_LEN, "%s\n", policy->governor->name);
461 * store_scaling_governor - store policy for the specified CPU
463 static ssize_t store_scaling_governor (struct cpufreq_policy * policy,
464 const char *buf, size_t count)
466 unsigned int ret = -EINVAL;
467 char str_governor[16];
468 struct cpufreq_policy new_policy;
470 ret = cpufreq_get_policy(&new_policy, policy->cpu);
474 ret = sscanf (buf, "%15s", str_governor);
478 if (cpufreq_parse_governor(str_governor, &new_policy.policy,
479 &new_policy.governor))
484 /* Do not use cpufreq_set_policy here or the user_policy.max
485 will be wrongly overridden */
486 mutex_lock(&policy->lock);
487 ret = __cpufreq_set_policy(policy, &new_policy);
489 policy->user_policy.policy = policy->policy;
490 policy->user_policy.governor = policy->governor;
491 mutex_unlock(&policy->lock);
493 unlock_cpu_hotplug();
502 * show_scaling_driver - show the cpufreq driver currently loaded
504 static ssize_t show_scaling_driver (struct cpufreq_policy * policy, char *buf)
506 return scnprintf(buf, CPUFREQ_NAME_LEN, "%s\n", cpufreq_driver->name);
510 * show_scaling_available_governors - show the available CPUfreq governors
512 static ssize_t show_scaling_available_governors (struct cpufreq_policy *policy,
516 struct cpufreq_governor *t;
518 if (!cpufreq_driver->target) {
519 i += sprintf(buf, "performance powersave");
523 list_for_each_entry(t, &cpufreq_governor_list, governor_list) {
524 if (i >= (ssize_t) ((PAGE_SIZE / sizeof(char)) - (CPUFREQ_NAME_LEN + 2)))
526 i += scnprintf(&buf[i], CPUFREQ_NAME_LEN, "%s ", t->name);
529 i += sprintf(&buf[i], "\n");
533 * show_affected_cpus - show the CPUs affected by each transition
535 static ssize_t show_affected_cpus (struct cpufreq_policy * policy, char *buf)
540 for_each_cpu_mask(cpu, policy->cpus) {
542 i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), " ");
543 i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), "%u", cpu);
544 if (i >= (PAGE_SIZE - 5))
547 i += sprintf(&buf[i], "\n");
552 #define define_one_ro(_name) \
553 static struct freq_attr _name = \
554 __ATTR(_name, 0444, show_##_name, NULL)
556 #define define_one_ro0400(_name) \
557 static struct freq_attr _name = \
558 __ATTR(_name, 0400, show_##_name, NULL)
560 #define define_one_rw(_name) \
561 static struct freq_attr _name = \
562 __ATTR(_name, 0644, show_##_name, store_##_name)
564 define_one_ro0400(cpuinfo_cur_freq);
565 define_one_ro(cpuinfo_min_freq);
566 define_one_ro(cpuinfo_max_freq);
567 define_one_ro(scaling_available_governors);
568 define_one_ro(scaling_driver);
569 define_one_ro(scaling_cur_freq);
570 define_one_ro(affected_cpus);
571 define_one_rw(scaling_min_freq);
572 define_one_rw(scaling_max_freq);
573 define_one_rw(scaling_governor);
575 static struct attribute * default_attrs[] = {
576 &cpuinfo_min_freq.attr,
577 &cpuinfo_max_freq.attr,
578 &scaling_min_freq.attr,
579 &scaling_max_freq.attr,
581 &scaling_governor.attr,
582 &scaling_driver.attr,
583 &scaling_available_governors.attr,
587 #define to_policy(k) container_of(k,struct cpufreq_policy,kobj)
588 #define to_attr(a) container_of(a,struct freq_attr,attr)
590 static ssize_t show(struct kobject * kobj, struct attribute * attr ,char * buf)
592 struct cpufreq_policy * policy = to_policy(kobj);
593 struct freq_attr * fattr = to_attr(attr);
595 policy = cpufreq_cpu_get(policy->cpu);
599 ret = fattr->show(policy, buf);
603 cpufreq_cpu_put(policy);
607 static ssize_t store(struct kobject * kobj, struct attribute * attr,
608 const char * buf, size_t count)
610 struct cpufreq_policy * policy = to_policy(kobj);
611 struct freq_attr * fattr = to_attr(attr);
613 policy = cpufreq_cpu_get(policy->cpu);
617 ret = fattr->store(policy, buf, count);
621 cpufreq_cpu_put(policy);
625 static void cpufreq_sysfs_release(struct kobject * kobj)
627 struct cpufreq_policy * policy = to_policy(kobj);
628 dprintk("last reference is dropped\n");
629 complete(&policy->kobj_unregister);
632 static struct sysfs_ops sysfs_ops = {
637 static struct kobj_type ktype_cpufreq = {
638 .sysfs_ops = &sysfs_ops,
639 .default_attrs = default_attrs,
640 .release = cpufreq_sysfs_release,
645 * cpufreq_add_dev - add a CPU device
647 * Adds the cpufreq interface for a CPU device.
649 static int cpufreq_add_dev (struct sys_device * sys_dev)
651 unsigned int cpu = sys_dev->id;
653 struct cpufreq_policy new_policy;
654 struct cpufreq_policy *policy;
655 struct freq_attr **drv_attr;
656 struct sys_device *cpu_sys_dev;
660 struct cpufreq_policy *managed_policy;
663 if (cpu_is_offline(cpu))
666 cpufreq_debug_disable_ratelimit();
667 dprintk("adding CPU %u\n", cpu);
670 /* check whether a different CPU already registered this
671 * CPU because it is in the same boat. */
672 policy = cpufreq_cpu_get(cpu);
673 if (unlikely(policy)) {
674 cpufreq_cpu_put(policy);
675 cpufreq_debug_enable_ratelimit();
680 if (!try_module_get(cpufreq_driver->owner)) {
685 policy = kzalloc(sizeof(struct cpufreq_policy), GFP_KERNEL);
692 policy->cpus = cpumask_of_cpu(cpu);
694 mutex_init(&policy->lock);
695 mutex_lock(&policy->lock);
696 init_completion(&policy->kobj_unregister);
697 INIT_WORK(&policy->update, handle_update);
699 /* call driver. From then on the cpufreq must be able
700 * to accept all calls to ->verify and ->setpolicy for this CPU
702 ret = cpufreq_driver->init(policy);
704 dprintk("initialization failed\n");
705 mutex_unlock(&policy->lock);
710 for_each_cpu_mask(j, policy->cpus) {
714 /* check for existing affected CPUs. They may not be aware
715 * of it due to CPU Hotplug.
717 managed_policy = cpufreq_cpu_get(j);
718 if (unlikely(managed_policy)) {
719 spin_lock_irqsave(&cpufreq_driver_lock, flags);
720 managed_policy->cpus = policy->cpus;
721 cpufreq_cpu_data[cpu] = managed_policy;
722 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
724 dprintk("CPU already managed, adding link\n");
725 ret = sysfs_create_link(&sys_dev->kobj,
726 &managed_policy->kobj,
729 mutex_unlock(&policy->lock);
730 goto err_out_driver_exit;
733 cpufreq_debug_enable_ratelimit();
734 mutex_unlock(&policy->lock);
736 goto err_out_driver_exit; /* call driver->exit() */
740 memcpy(&new_policy, policy, sizeof(struct cpufreq_policy));
742 /* prepare interface data */
743 policy->kobj.parent = &sys_dev->kobj;
744 policy->kobj.ktype = &ktype_cpufreq;
745 strlcpy(policy->kobj.name, "cpufreq", KOBJ_NAME_LEN);
747 ret = kobject_register(&policy->kobj);
749 mutex_unlock(&policy->lock);
750 goto err_out_driver_exit;
752 /* set up files for this cpu device */
753 drv_attr = cpufreq_driver->attr;
754 while ((drv_attr) && (*drv_attr)) {
755 sysfs_create_file(&policy->kobj, &((*drv_attr)->attr));
758 if (cpufreq_driver->get)
759 sysfs_create_file(&policy->kobj, &cpuinfo_cur_freq.attr);
760 if (cpufreq_driver->target)
761 sysfs_create_file(&policy->kobj, &scaling_cur_freq.attr);
763 spin_lock_irqsave(&cpufreq_driver_lock, flags);
764 for_each_cpu_mask(j, policy->cpus)
765 cpufreq_cpu_data[j] = policy;
766 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
768 /* symlink affected CPUs */
769 for_each_cpu_mask(j, policy->cpus) {
775 dprintk("CPU %u already managed, adding link\n", j);
776 cpufreq_cpu_get(cpu);
777 cpu_sys_dev = get_cpu_sysdev(j);
778 ret = sysfs_create_link(&cpu_sys_dev->kobj, &policy->kobj,
781 mutex_unlock(&policy->lock);
782 goto err_out_unregister;
786 policy->governor = NULL; /* to assure that the starting sequence is
787 * run in cpufreq_set_policy */
788 mutex_unlock(&policy->lock);
790 /* set default policy */
791 ret = cpufreq_set_policy(&new_policy);
793 dprintk("setting policy failed\n");
794 goto err_out_unregister;
797 module_put(cpufreq_driver->owner);
798 dprintk("initialization complete\n");
799 cpufreq_debug_enable_ratelimit();
805 spin_lock_irqsave(&cpufreq_driver_lock, flags);
806 for_each_cpu_mask(j, policy->cpus)
807 cpufreq_cpu_data[j] = NULL;
808 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
810 kobject_unregister(&policy->kobj);
811 wait_for_completion(&policy->kobj_unregister);
814 if (cpufreq_driver->exit)
815 cpufreq_driver->exit(policy);
821 module_put(cpufreq_driver->owner);
823 cpufreq_debug_enable_ratelimit();
829 * cpufreq_remove_dev - remove a CPU device
831 * Removes the cpufreq interface for a CPU device.
833 static int cpufreq_remove_dev (struct sys_device * sys_dev)
835 unsigned int cpu = sys_dev->id;
837 struct cpufreq_policy *data;
839 struct sys_device *cpu_sys_dev;
843 cpufreq_debug_disable_ratelimit();
844 dprintk("unregistering CPU %u\n", cpu);
846 spin_lock_irqsave(&cpufreq_driver_lock, flags);
847 data = cpufreq_cpu_data[cpu];
850 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
851 cpufreq_debug_enable_ratelimit();
854 cpufreq_cpu_data[cpu] = NULL;
858 /* if this isn't the CPU which is the parent of the kobj, we
859 * only need to unlink, put and exit
861 if (unlikely(cpu != data->cpu)) {
862 dprintk("removing link\n");
863 cpu_clear(cpu, data->cpus);
864 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
865 sysfs_remove_link(&sys_dev->kobj, "cpufreq");
866 cpufreq_cpu_put(data);
867 cpufreq_debug_enable_ratelimit();
873 if (!kobject_get(&data->kobj)) {
874 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
875 cpufreq_debug_enable_ratelimit();
880 /* if we have other CPUs still registered, we need to unlink them,
881 * or else wait_for_completion below will lock up. Clean the
882 * cpufreq_cpu_data[] while holding the lock, and remove the sysfs
885 if (unlikely(cpus_weight(data->cpus) > 1)) {
886 for_each_cpu_mask(j, data->cpus) {
889 cpufreq_cpu_data[j] = NULL;
893 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
895 if (unlikely(cpus_weight(data->cpus) > 1)) {
896 for_each_cpu_mask(j, data->cpus) {
899 dprintk("removing link for cpu %u\n", j);
900 cpu_sys_dev = get_cpu_sysdev(j);
901 sysfs_remove_link(&cpu_sys_dev->kobj, "cpufreq");
902 cpufreq_cpu_put(data);
906 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
909 mutex_lock(&data->lock);
910 if (cpufreq_driver->target)
911 __cpufreq_governor(data, CPUFREQ_GOV_STOP);
912 mutex_unlock(&data->lock);
914 kobject_unregister(&data->kobj);
916 kobject_put(&data->kobj);
918 /* we need to make sure that the underlying kobj is actually
919 * not referenced anymore by anybody before we proceed with
922 dprintk("waiting for dropping of refcount\n");
923 wait_for_completion(&data->kobj_unregister);
924 dprintk("wait complete\n");
926 if (cpufreq_driver->exit)
927 cpufreq_driver->exit(data);
931 cpufreq_debug_enable_ratelimit();
936 static void handle_update(struct work_struct *work)
938 struct cpufreq_policy *policy =
939 container_of(work, struct cpufreq_policy, update);
940 unsigned int cpu = policy->cpu;
941 dprintk("handle_update for cpu %u called\n", cpu);
942 cpufreq_update_policy(cpu);
946 * cpufreq_out_of_sync - If actual and saved CPU frequency differs, we're in deep trouble.
948 * @old_freq: CPU frequency the kernel thinks the CPU runs at
949 * @new_freq: CPU frequency the CPU actually runs at
951 * We adjust to current frequency first, and need to clean up later. So either call
952 * to cpufreq_update_policy() or schedule handle_update()).
954 static void cpufreq_out_of_sync(unsigned int cpu, unsigned int old_freq,
955 unsigned int new_freq)
957 struct cpufreq_freqs freqs;
959 dprintk("Warning: CPU frequency out of sync: cpufreq and timing "
960 "core thinks of %u, is %u kHz.\n", old_freq, new_freq);
963 freqs.old = old_freq;
964 freqs.new = new_freq;
965 cpufreq_notify_transition(&freqs, CPUFREQ_PRECHANGE);
966 cpufreq_notify_transition(&freqs, CPUFREQ_POSTCHANGE);
971 * cpufreq_quick_get - get the CPU frequency (in kHz) from policy->cur
974 * This is the last known freq, without actually getting it from the driver.
975 * Return value will be same as what is shown in scaling_cur_freq in sysfs.
977 unsigned int cpufreq_quick_get(unsigned int cpu)
979 struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
980 unsigned int ret_freq = 0;
983 mutex_lock(&policy->lock);
984 ret_freq = policy->cur;
985 mutex_unlock(&policy->lock);
986 cpufreq_cpu_put(policy);
991 EXPORT_SYMBOL(cpufreq_quick_get);
995 * cpufreq_get - get the current CPU frequency (in kHz)
998 * Get the CPU current (static) CPU frequency
1000 unsigned int cpufreq_get(unsigned int cpu)
1002 struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1003 unsigned int ret_freq = 0;
1008 if (!cpufreq_driver->get)
1011 mutex_lock(&policy->lock);
1013 ret_freq = cpufreq_driver->get(cpu);
1015 if (ret_freq && policy->cur &&
1016 !(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
1017 /* verify no discrepancy between actual and
1018 saved value exists */
1019 if (unlikely(ret_freq != policy->cur)) {
1020 cpufreq_out_of_sync(cpu, policy->cur, ret_freq);
1021 schedule_work(&policy->update);
1025 mutex_unlock(&policy->lock);
1028 cpufreq_cpu_put(policy);
1032 EXPORT_SYMBOL(cpufreq_get);
1036 * cpufreq_suspend - let the low level driver prepare for suspend
1039 static int cpufreq_suspend(struct sys_device * sysdev, pm_message_t pmsg)
1041 int cpu = sysdev->id;
1043 unsigned int cur_freq = 0;
1044 struct cpufreq_policy *cpu_policy;
1046 dprintk("suspending cpu %u\n", cpu);
1048 if (!cpu_online(cpu))
1051 /* we may be lax here as interrupts are off. Nonetheless
1052 * we need to grab the correct cpu policy, as to check
1053 * whether we really run on this CPU.
1056 cpu_policy = cpufreq_cpu_get(cpu);
1060 /* only handle each CPU group once */
1061 if (unlikely(cpu_policy->cpu != cpu)) {
1062 cpufreq_cpu_put(cpu_policy);
1066 if (cpufreq_driver->suspend) {
1067 ret = cpufreq_driver->suspend(cpu_policy, pmsg);
1069 printk(KERN_ERR "cpufreq: suspend failed in ->suspend "
1070 "step on CPU %u\n", cpu_policy->cpu);
1071 cpufreq_cpu_put(cpu_policy);
1077 if (cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)
1080 if (cpufreq_driver->get)
1081 cur_freq = cpufreq_driver->get(cpu_policy->cpu);
1083 if (!cur_freq || !cpu_policy->cur) {
1084 printk(KERN_ERR "cpufreq: suspend failed to assert current "
1085 "frequency is what timing core thinks it is.\n");
1089 if (unlikely(cur_freq != cpu_policy->cur)) {
1090 struct cpufreq_freqs freqs;
1092 if (!(cpufreq_driver->flags & CPUFREQ_PM_NO_WARN))
1093 dprintk("Warning: CPU frequency is %u, "
1094 "cpufreq assumed %u kHz.\n",
1095 cur_freq, cpu_policy->cur);
1098 freqs.old = cpu_policy->cur;
1099 freqs.new = cur_freq;
1101 srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
1102 CPUFREQ_SUSPENDCHANGE, &freqs);
1103 adjust_jiffies(CPUFREQ_SUSPENDCHANGE, &freqs);
1105 cpu_policy->cur = cur_freq;
1109 cpufreq_cpu_put(cpu_policy);
1114 * cpufreq_resume - restore proper CPU frequency handling after resume
1116 * 1.) resume CPUfreq hardware support (cpufreq_driver->resume())
1117 * 2.) if ->target and !CPUFREQ_CONST_LOOPS: verify we're in sync
1118 * 3.) schedule call cpufreq_update_policy() ASAP as interrupts are
1121 static int cpufreq_resume(struct sys_device * sysdev)
1123 int cpu = sysdev->id;
1125 struct cpufreq_policy *cpu_policy;
1127 dprintk("resuming cpu %u\n", cpu);
1129 if (!cpu_online(cpu))
1132 /* we may be lax here as interrupts are off. Nonetheless
1133 * we need to grab the correct cpu policy, as to check
1134 * whether we really run on this CPU.
1137 cpu_policy = cpufreq_cpu_get(cpu);
1141 /* only handle each CPU group once */
1142 if (unlikely(cpu_policy->cpu != cpu)) {
1143 cpufreq_cpu_put(cpu_policy);
1147 if (cpufreq_driver->resume) {
1148 ret = cpufreq_driver->resume(cpu_policy);
1150 printk(KERN_ERR "cpufreq: resume failed in ->resume "
1151 "step on CPU %u\n", cpu_policy->cpu);
1152 cpufreq_cpu_put(cpu_policy);
1157 if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
1158 unsigned int cur_freq = 0;
1160 if (cpufreq_driver->get)
1161 cur_freq = cpufreq_driver->get(cpu_policy->cpu);
1163 if (!cur_freq || !cpu_policy->cur) {
1164 printk(KERN_ERR "cpufreq: resume failed to assert "
1165 "current frequency is what timing core "
1170 if (unlikely(cur_freq != cpu_policy->cur)) {
1171 struct cpufreq_freqs freqs;
1173 if (!(cpufreq_driver->flags & CPUFREQ_PM_NO_WARN))
1174 dprintk("Warning: CPU frequency"
1175 "is %u, cpufreq assumed %u kHz.\n",
1176 cur_freq, cpu_policy->cur);
1179 freqs.old = cpu_policy->cur;
1180 freqs.new = cur_freq;
1182 srcu_notifier_call_chain(
1183 &cpufreq_transition_notifier_list,
1184 CPUFREQ_RESUMECHANGE, &freqs);
1185 adjust_jiffies(CPUFREQ_RESUMECHANGE, &freqs);
1187 cpu_policy->cur = cur_freq;
1192 schedule_work(&cpu_policy->update);
1193 cpufreq_cpu_put(cpu_policy);
1197 static struct sysdev_driver cpufreq_sysdev_driver = {
1198 .add = cpufreq_add_dev,
1199 .remove = cpufreq_remove_dev,
1200 .suspend = cpufreq_suspend,
1201 .resume = cpufreq_resume,
1205 /*********************************************************************
1206 * NOTIFIER LISTS INTERFACE *
1207 *********************************************************************/
1210 * cpufreq_register_notifier - register a driver with cpufreq
1211 * @nb: notifier function to register
1212 * @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1214 * Add a driver to one of two lists: either a list of drivers that
1215 * are notified about clock rate changes (once before and once after
1216 * the transition), or a list of drivers that are notified about
1217 * changes in cpufreq policy.
1219 * This function may sleep, and has the same return conditions as
1220 * blocking_notifier_chain_register.
1222 int cpufreq_register_notifier(struct notifier_block *nb, unsigned int list)
1227 case CPUFREQ_TRANSITION_NOTIFIER:
1228 ret = srcu_notifier_chain_register(
1229 &cpufreq_transition_notifier_list, nb);
1231 case CPUFREQ_POLICY_NOTIFIER:
1232 ret = blocking_notifier_chain_register(
1233 &cpufreq_policy_notifier_list, nb);
1241 EXPORT_SYMBOL(cpufreq_register_notifier);
1245 * cpufreq_unregister_notifier - unregister a driver with cpufreq
1246 * @nb: notifier block to be unregistered
1247 * @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1249 * Remove a driver from the CPU frequency notifier list.
1251 * This function may sleep, and has the same return conditions as
1252 * blocking_notifier_chain_unregister.
1254 int cpufreq_unregister_notifier(struct notifier_block *nb, unsigned int list)
1259 case CPUFREQ_TRANSITION_NOTIFIER:
1260 ret = srcu_notifier_chain_unregister(
1261 &cpufreq_transition_notifier_list, nb);
1263 case CPUFREQ_POLICY_NOTIFIER:
1264 ret = blocking_notifier_chain_unregister(
1265 &cpufreq_policy_notifier_list, nb);
1273 EXPORT_SYMBOL(cpufreq_unregister_notifier);
1276 /*********************************************************************
1278 *********************************************************************/
1281 /* Must be called with lock_cpu_hotplug held */
1282 int __cpufreq_driver_target(struct cpufreq_policy *policy,
1283 unsigned int target_freq,
1284 unsigned int relation)
1286 int retval = -EINVAL;
1288 dprintk("target for CPU %u: %u kHz, relation %u\n", policy->cpu,
1289 target_freq, relation);
1290 if (cpu_online(policy->cpu) && cpufreq_driver->target)
1291 retval = cpufreq_driver->target(policy, target_freq, relation);
1295 EXPORT_SYMBOL_GPL(__cpufreq_driver_target);
1297 int cpufreq_driver_target(struct cpufreq_policy *policy,
1298 unsigned int target_freq,
1299 unsigned int relation)
1303 policy = cpufreq_cpu_get(policy->cpu);
1308 mutex_lock(&policy->lock);
1310 ret = __cpufreq_driver_target(policy, target_freq, relation);
1312 mutex_unlock(&policy->lock);
1313 unlock_cpu_hotplug();
1315 cpufreq_cpu_put(policy);
1318 EXPORT_SYMBOL_GPL(cpufreq_driver_target);
1320 int cpufreq_driver_getavg(struct cpufreq_policy *policy)
1324 policy = cpufreq_cpu_get(policy->cpu);
1328 mutex_lock(&policy->lock);
1330 if (cpu_online(policy->cpu) && cpufreq_driver->getavg)
1331 ret = cpufreq_driver->getavg(policy->cpu);
1333 mutex_unlock(&policy->lock);
1335 cpufreq_cpu_put(policy);
1338 EXPORT_SYMBOL_GPL(cpufreq_driver_getavg);
1341 * Locking: Must be called with the lock_cpu_hotplug() lock held
1342 * when "event" is CPUFREQ_GOV_LIMITS
1345 static int __cpufreq_governor(struct cpufreq_policy *policy,
1350 if (!try_module_get(policy->governor->owner))
1353 dprintk("__cpufreq_governor for CPU %u, event %u\n",
1354 policy->cpu, event);
1355 ret = policy->governor->governor(policy, event);
1357 /* we keep one module reference alive for
1358 each CPU governed by this CPU */
1359 if ((event != CPUFREQ_GOV_START) || ret)
1360 module_put(policy->governor->owner);
1361 if ((event == CPUFREQ_GOV_STOP) && !ret)
1362 module_put(policy->governor->owner);
1368 int cpufreq_register_governor(struct cpufreq_governor *governor)
1375 mutex_lock(&cpufreq_governor_mutex);
1378 if (__find_governor(governor->name) == NULL) {
1380 list_add(&governor->governor_list, &cpufreq_governor_list);
1383 mutex_unlock(&cpufreq_governor_mutex);
1386 EXPORT_SYMBOL_GPL(cpufreq_register_governor);
1389 void cpufreq_unregister_governor(struct cpufreq_governor *governor)
1394 mutex_lock(&cpufreq_governor_mutex);
1395 list_del(&governor->governor_list);
1396 mutex_unlock(&cpufreq_governor_mutex);
1399 EXPORT_SYMBOL_GPL(cpufreq_unregister_governor);
1403 /*********************************************************************
1404 * POLICY INTERFACE *
1405 *********************************************************************/
1408 * cpufreq_get_policy - get the current cpufreq_policy
1409 * @policy: struct cpufreq_policy into which the current cpufreq_policy is written
1411 * Reads the current cpufreq policy.
1413 int cpufreq_get_policy(struct cpufreq_policy *policy, unsigned int cpu)
1415 struct cpufreq_policy *cpu_policy;
1419 cpu_policy = cpufreq_cpu_get(cpu);
1423 mutex_lock(&cpu_policy->lock);
1424 memcpy(policy, cpu_policy, sizeof(struct cpufreq_policy));
1425 mutex_unlock(&cpu_policy->lock);
1427 cpufreq_cpu_put(cpu_policy);
1430 EXPORT_SYMBOL(cpufreq_get_policy);
1434 * data : current policy.
1435 * policy : policy to be set.
1436 * Locking: Must be called with the lock_cpu_hotplug() lock held
1438 static int __cpufreq_set_policy(struct cpufreq_policy *data,
1439 struct cpufreq_policy *policy)
1443 cpufreq_debug_disable_ratelimit();
1444 dprintk("setting new policy for CPU %u: %u - %u kHz\n", policy->cpu,
1445 policy->min, policy->max);
1447 memcpy(&policy->cpuinfo, &data->cpuinfo,
1448 sizeof(struct cpufreq_cpuinfo));
1450 if (policy->min > data->min && policy->min > policy->max) {
1455 /* verify the cpu speed can be set within this limit */
1456 ret = cpufreq_driver->verify(policy);
1460 /* adjust if necessary - all reasons */
1461 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1462 CPUFREQ_ADJUST, policy);
1464 /* adjust if necessary - hardware incompatibility*/
1465 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1466 CPUFREQ_INCOMPATIBLE, policy);
1468 /* verify the cpu speed can be set within this limit,
1469 which might be different to the first one */
1470 ret = cpufreq_driver->verify(policy);
1474 /* notification of the new policy */
1475 blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1476 CPUFREQ_NOTIFY, policy);
1478 data->min = policy->min;
1479 data->max = policy->max;
1481 dprintk("new min and max freqs are %u - %u kHz\n",
1482 data->min, data->max);
1484 if (cpufreq_driver->setpolicy) {
1485 data->policy = policy->policy;
1486 dprintk("setting range\n");
1487 ret = cpufreq_driver->setpolicy(policy);
1489 if (policy->governor != data->governor) {
1490 /* save old, working values */
1491 struct cpufreq_governor *old_gov = data->governor;
1493 dprintk("governor switch\n");
1495 /* end old governor */
1497 __cpufreq_governor(data, CPUFREQ_GOV_STOP);
1499 /* start new governor */
1500 data->governor = policy->governor;
1501 if (__cpufreq_governor(data, CPUFREQ_GOV_START)) {
1502 /* new governor failed, so re-start old one */
1503 dprintk("starting governor %s failed\n",
1504 data->governor->name);
1506 data->governor = old_gov;
1507 __cpufreq_governor(data,
1513 /* might be a policy change, too, so fall through */
1515 dprintk("governor: change or update limits\n");
1516 __cpufreq_governor(data, CPUFREQ_GOV_LIMITS);
1520 cpufreq_debug_enable_ratelimit();
1525 * cpufreq_set_policy - set a new CPUFreq policy
1526 * @policy: policy to be set.
1528 * Sets a new CPU frequency and voltage scaling policy.
1530 int cpufreq_set_policy(struct cpufreq_policy *policy)
1533 struct cpufreq_policy *data;
1538 data = cpufreq_cpu_get(policy->cpu);
1545 mutex_lock(&data->lock);
1547 ret = __cpufreq_set_policy(data, policy);
1548 data->user_policy.min = data->min;
1549 data->user_policy.max = data->max;
1550 data->user_policy.policy = data->policy;
1551 data->user_policy.governor = data->governor;
1553 mutex_unlock(&data->lock);
1555 unlock_cpu_hotplug();
1556 cpufreq_cpu_put(data);
1560 EXPORT_SYMBOL(cpufreq_set_policy);
1564 * cpufreq_update_policy - re-evaluate an existing cpufreq policy
1565 * @cpu: CPU which shall be re-evaluated
1567 * Usefull for policy notifiers which have different necessities
1568 * at different times.
1570 int cpufreq_update_policy(unsigned int cpu)
1572 struct cpufreq_policy *data = cpufreq_cpu_get(cpu);
1573 struct cpufreq_policy policy;
1580 mutex_lock(&data->lock);
1582 dprintk("updating policy for CPU %u\n", cpu);
1583 memcpy(&policy, data, sizeof(struct cpufreq_policy));
1584 policy.min = data->user_policy.min;
1585 policy.max = data->user_policy.max;
1586 policy.policy = data->user_policy.policy;
1587 policy.governor = data->user_policy.governor;
1589 /* BIOS might change freq behind our back
1590 -> ask driver for current freq and notify governors about a change */
1591 if (cpufreq_driver->get) {
1592 policy.cur = cpufreq_driver->get(cpu);
1594 dprintk("Driver did not initialize current freq");
1595 data->cur = policy.cur;
1597 if (data->cur != policy.cur)
1598 cpufreq_out_of_sync(cpu, data->cur,
1603 ret = __cpufreq_set_policy(data, &policy);
1605 mutex_unlock(&data->lock);
1606 unlock_cpu_hotplug();
1607 cpufreq_cpu_put(data);
1610 EXPORT_SYMBOL(cpufreq_update_policy);
1612 static int cpufreq_cpu_callback(struct notifier_block *nfb,
1613 unsigned long action, void *hcpu)
1615 unsigned int cpu = (unsigned long)hcpu;
1616 struct cpufreq_policy *policy;
1617 struct sys_device *sys_dev;
1619 sys_dev = get_cpu_sysdev(cpu);
1624 cpufreq_add_dev(sys_dev);
1626 case CPU_DOWN_PREPARE:
1628 * We attempt to put this cpu in lowest frequency
1629 * possible before going down. This will permit
1630 * hardware-managed P-State to switch other related
1631 * threads to min or higher speeds if possible.
1633 policy = cpufreq_cpu_data[cpu];
1635 cpufreq_driver_target(policy, policy->min,
1636 CPUFREQ_RELATION_H);
1640 cpufreq_remove_dev(sys_dev);
1647 static struct notifier_block __cpuinitdata cpufreq_cpu_notifier =
1649 .notifier_call = cpufreq_cpu_callback,
1652 /*********************************************************************
1653 * REGISTER / UNREGISTER CPUFREQ DRIVER *
1654 *********************************************************************/
1657 * cpufreq_register_driver - register a CPU Frequency driver
1658 * @driver_data: A struct cpufreq_driver containing the values#
1659 * submitted by the CPU Frequency driver.
1661 * Registers a CPU Frequency driver to this core code. This code
1662 * returns zero on success, -EBUSY when another driver got here first
1663 * (and isn't unregistered in the meantime).
1666 int cpufreq_register_driver(struct cpufreq_driver *driver_data)
1668 unsigned long flags;
1671 if (!driver_data || !driver_data->verify || !driver_data->init ||
1672 ((!driver_data->setpolicy) && (!driver_data->target)))
1675 dprintk("trying to register driver %s\n", driver_data->name);
1677 if (driver_data->setpolicy)
1678 driver_data->flags |= CPUFREQ_CONST_LOOPS;
1680 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1681 if (cpufreq_driver) {
1682 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1685 cpufreq_driver = driver_data;
1686 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1688 ret = sysdev_driver_register(&cpu_sysdev_class,&cpufreq_sysdev_driver);
1690 if ((!ret) && !(cpufreq_driver->flags & CPUFREQ_STICKY)) {
1694 /* check for at least one working CPU */
1695 for (i=0; i<NR_CPUS; i++)
1696 if (cpufreq_cpu_data[i])
1699 /* if all ->init() calls failed, unregister */
1701 dprintk("no CPU initialized for driver %s\n",
1703 sysdev_driver_unregister(&cpu_sysdev_class,
1704 &cpufreq_sysdev_driver);
1706 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1707 cpufreq_driver = NULL;
1708 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1713 register_hotcpu_notifier(&cpufreq_cpu_notifier);
1714 dprintk("driver %s up and running\n", driver_data->name);
1715 cpufreq_debug_enable_ratelimit();
1720 EXPORT_SYMBOL_GPL(cpufreq_register_driver);
1724 * cpufreq_unregister_driver - unregister the current CPUFreq driver
1726 * Unregister the current CPUFreq driver. Only call this if you have
1727 * the right to do so, i.e. if you have succeeded in initialising before!
1728 * Returns zero if successful, and -EINVAL if the cpufreq_driver is
1729 * currently not initialised.
1731 int cpufreq_unregister_driver(struct cpufreq_driver *driver)
1733 unsigned long flags;
1735 cpufreq_debug_disable_ratelimit();
1737 if (!cpufreq_driver || (driver != cpufreq_driver)) {
1738 cpufreq_debug_enable_ratelimit();
1742 dprintk("unregistering driver %s\n", driver->name);
1744 sysdev_driver_unregister(&cpu_sysdev_class, &cpufreq_sysdev_driver);
1745 unregister_hotcpu_notifier(&cpufreq_cpu_notifier);
1747 spin_lock_irqsave(&cpufreq_driver_lock, flags);
1748 cpufreq_driver = NULL;
1749 spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1753 EXPORT_SYMBOL_GPL(cpufreq_unregister_driver);