xref: /openbmc/linux/drivers/cpufreq/cpufreq.c (revision 606d099c)
1 /*
2  *  linux/drivers/cpufreq/cpufreq.c
3  *
4  *  Copyright (C) 2001 Russell King
5  *            (C) 2002 - 2003 Dominik Brodowski <linux@brodo.de>
6  *
7  *  Oct 2005 - Ashok Raj <ashok.raj@intel.com>
8  *	Added handling for CPU hotplug
9  *  Feb 2006 - Jacob Shin <jacob.shin@amd.com>
10  *	Fix handling for CPU hotplug -- affected CPUs
11  *
12  * This program is free software; you can redistribute it and/or modify
13  * it under the terms of the GNU General Public License version 2 as
14  * published by the Free Software Foundation.
15  *
16  */
17 
18 #include <linux/kernel.h>
19 #include <linux/module.h>
20 #include <linux/init.h>
21 #include <linux/notifier.h>
22 #include <linux/cpufreq.h>
23 #include <linux/delay.h>
24 #include <linux/interrupt.h>
25 #include <linux/spinlock.h>
26 #include <linux/device.h>
27 #include <linux/slab.h>
28 #include <linux/cpu.h>
29 #include <linux/completion.h>
30 #include <linux/mutex.h>
31 
32 #define dprintk(msg...) cpufreq_debug_printk(CPUFREQ_DEBUG_CORE, "cpufreq-core", msg)
33 
34 /**
35  * The "cpufreq driver" - the arch- or hardware-dependent low
36  * level driver of CPUFreq support, and its spinlock. This lock
37  * also protects the cpufreq_cpu_data array.
38  */
39 static struct cpufreq_driver *cpufreq_driver;
40 static struct cpufreq_policy *cpufreq_cpu_data[NR_CPUS];
41 static DEFINE_SPINLOCK(cpufreq_driver_lock);
42 
43 /* internal prototypes */
44 static int __cpufreq_governor(struct cpufreq_policy *policy, unsigned int event);
45 static void handle_update(struct work_struct *work);
46 
47 /**
48  * Two notifier lists: the "policy" list is involved in the
49  * validation process for a new CPU frequency policy; the
50  * "transition" list for kernel code that needs to handle
51  * changes to devices when the CPU clock speed changes.
52  * The mutex locks both lists.
53  */
54 static BLOCKING_NOTIFIER_HEAD(cpufreq_policy_notifier_list);
55 static struct srcu_notifier_head cpufreq_transition_notifier_list;
56 
57 static int __init init_cpufreq_transition_notifier_list(void)
58 {
59 	srcu_init_notifier_head(&cpufreq_transition_notifier_list);
60 	return 0;
61 }
62 pure_initcall(init_cpufreq_transition_notifier_list);
63 
64 static LIST_HEAD(cpufreq_governor_list);
65 static DEFINE_MUTEX (cpufreq_governor_mutex);
66 
67 struct cpufreq_policy *cpufreq_cpu_get(unsigned int cpu)
68 {
69 	struct cpufreq_policy *data;
70 	unsigned long flags;
71 
72 	if (cpu >= NR_CPUS)
73 		goto err_out;
74 
75 	/* get the cpufreq driver */
76 	spin_lock_irqsave(&cpufreq_driver_lock, flags);
77 
78 	if (!cpufreq_driver)
79 		goto err_out_unlock;
80 
81 	if (!try_module_get(cpufreq_driver->owner))
82 		goto err_out_unlock;
83 
84 
85 	/* get the CPU */
86 	data = cpufreq_cpu_data[cpu];
87 
88 	if (!data)
89 		goto err_out_put_module;
90 
91 	if (!kobject_get(&data->kobj))
92 		goto err_out_put_module;
93 
94 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
95 	return data;
96 
97 err_out_put_module:
98 	module_put(cpufreq_driver->owner);
99 err_out_unlock:
100 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
101 err_out:
102 	return NULL;
103 }
104 EXPORT_SYMBOL_GPL(cpufreq_cpu_get);
105 
106 
107 void cpufreq_cpu_put(struct cpufreq_policy *data)
108 {
109 	kobject_put(&data->kobj);
110 	module_put(cpufreq_driver->owner);
111 }
112 EXPORT_SYMBOL_GPL(cpufreq_cpu_put);
113 
114 
115 /*********************************************************************
116  *                     UNIFIED DEBUG HELPERS                         *
117  *********************************************************************/
118 #ifdef CONFIG_CPU_FREQ_DEBUG
119 
120 /* what part(s) of the CPUfreq subsystem are debugged? */
121 static unsigned int debug;
122 
123 /* is the debug output ratelimit'ed using printk_ratelimit? User can
124  * set or modify this value.
125  */
126 static unsigned int debug_ratelimit = 1;
127 
128 /* is the printk_ratelimit'ing enabled? It's enabled after a successful
129  * loading of a cpufreq driver, temporarily disabled when a new policy
130  * is set, and disabled upon cpufreq driver removal
131  */
132 static unsigned int disable_ratelimit = 1;
133 static DEFINE_SPINLOCK(disable_ratelimit_lock);
134 
135 static void cpufreq_debug_enable_ratelimit(void)
136 {
137 	unsigned long flags;
138 
139 	spin_lock_irqsave(&disable_ratelimit_lock, flags);
140 	if (disable_ratelimit)
141 		disable_ratelimit--;
142 	spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
143 }
144 
145 static void cpufreq_debug_disable_ratelimit(void)
146 {
147 	unsigned long flags;
148 
149 	spin_lock_irqsave(&disable_ratelimit_lock, flags);
150 	disable_ratelimit++;
151 	spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
152 }
153 
154 void cpufreq_debug_printk(unsigned int type, const char *prefix, const char *fmt, ...)
155 {
156 	char s[256];
157 	va_list args;
158 	unsigned int len;
159 	unsigned long flags;
160 
161 	WARN_ON(!prefix);
162 	if (type & debug) {
163 		spin_lock_irqsave(&disable_ratelimit_lock, flags);
164 		if (!disable_ratelimit && debug_ratelimit && !printk_ratelimit()) {
165 			spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
166 			return;
167 		}
168 		spin_unlock_irqrestore(&disable_ratelimit_lock, flags);
169 
170 		len = snprintf(s, 256, KERN_DEBUG "%s: ", prefix);
171 
172 		va_start(args, fmt);
173 		len += vsnprintf(&s[len], (256 - len), fmt, args);
174 		va_end(args);
175 
176 		printk(s);
177 
178 		WARN_ON(len < 5);
179 	}
180 }
181 EXPORT_SYMBOL(cpufreq_debug_printk);
182 
183 
184 module_param(debug, uint, 0644);
185 MODULE_PARM_DESC(debug, "CPUfreq debugging: add 1 to debug core, 2 to debug drivers, and 4 to debug governors.");
186 
187 module_param(debug_ratelimit, uint, 0644);
188 MODULE_PARM_DESC(debug_ratelimit, "CPUfreq debugging: set to 0 to disable ratelimiting.");
189 
190 #else /* !CONFIG_CPU_FREQ_DEBUG */
191 
192 static inline void cpufreq_debug_enable_ratelimit(void) { return; }
193 static inline void cpufreq_debug_disable_ratelimit(void) { return; }
194 
195 #endif /* CONFIG_CPU_FREQ_DEBUG */
196 
197 
198 /*********************************************************************
199  *            EXTERNALLY AFFECTING FREQUENCY CHANGES                 *
200  *********************************************************************/
201 
202 /**
203  * adjust_jiffies - adjust the system "loops_per_jiffy"
204  *
205  * This function alters the system "loops_per_jiffy" for the clock
206  * speed change. Note that loops_per_jiffy cannot be updated on SMP
207  * systems as each CPU might be scaled differently. So, use the arch
208  * per-CPU loops_per_jiffy value wherever possible.
209  */
210 #ifndef CONFIG_SMP
211 static unsigned long l_p_j_ref;
212 static unsigned int  l_p_j_ref_freq;
213 
214 static void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
215 {
216 	if (ci->flags & CPUFREQ_CONST_LOOPS)
217 		return;
218 
219 	if (!l_p_j_ref_freq) {
220 		l_p_j_ref = loops_per_jiffy;
221 		l_p_j_ref_freq = ci->old;
222 		dprintk("saving %lu as reference value for loops_per_jiffy; freq is %u kHz\n", l_p_j_ref, l_p_j_ref_freq);
223 	}
224 	if ((val == CPUFREQ_PRECHANGE  && ci->old < ci->new) ||
225 	    (val == CPUFREQ_POSTCHANGE && ci->old > ci->new) ||
226 	    (val == CPUFREQ_RESUMECHANGE || val == CPUFREQ_SUSPENDCHANGE)) {
227 		loops_per_jiffy = cpufreq_scale(l_p_j_ref, l_p_j_ref_freq, ci->new);
228 		dprintk("scaling loops_per_jiffy to %lu for frequency %u kHz\n", loops_per_jiffy, ci->new);
229 	}
230 }
231 #else
232 static inline void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci) { return; }
233 #endif
234 
235 
236 /**
237  * cpufreq_notify_transition - call notifier chain and adjust_jiffies
238  * on frequency transition.
239  *
240  * This function calls the transition notifiers and the "adjust_jiffies"
241  * function. It is called twice on all CPU frequency changes that have
242  * external effects.
243  */
244 void cpufreq_notify_transition(struct cpufreq_freqs *freqs, unsigned int state)
245 {
246 	struct cpufreq_policy *policy;
247 
248 	BUG_ON(irqs_disabled());
249 
250 	freqs->flags = cpufreq_driver->flags;
251 	dprintk("notification %u of frequency transition to %u kHz\n",
252 		state, freqs->new);
253 
254 	policy = cpufreq_cpu_data[freqs->cpu];
255 	switch (state) {
256 
257 	case CPUFREQ_PRECHANGE:
258 		/* detect if the driver reported a value as "old frequency"
259 		 * which is not equal to what the cpufreq core thinks is
260 		 * "old frequency".
261 		 */
262 		if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
263 			if ((policy) && (policy->cpu == freqs->cpu) &&
264 			    (policy->cur) && (policy->cur != freqs->old)) {
265 				dprintk("Warning: CPU frequency is"
266 					" %u, cpufreq assumed %u kHz.\n",
267 					freqs->old, policy->cur);
268 				freqs->old = policy->cur;
269 			}
270 		}
271 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
272 				CPUFREQ_PRECHANGE, freqs);
273 		adjust_jiffies(CPUFREQ_PRECHANGE, freqs);
274 		break;
275 
276 	case CPUFREQ_POSTCHANGE:
277 		adjust_jiffies(CPUFREQ_POSTCHANGE, freqs);
278 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
279 				CPUFREQ_POSTCHANGE, freqs);
280 		if (likely(policy) && likely(policy->cpu == freqs->cpu))
281 			policy->cur = freqs->new;
282 		break;
283 	}
284 }
285 EXPORT_SYMBOL_GPL(cpufreq_notify_transition);
286 
287 
288 
289 /*********************************************************************
290  *                          SYSFS INTERFACE                          *
291  *********************************************************************/
292 
293 static struct cpufreq_governor *__find_governor(const char *str_governor)
294 {
295 	struct cpufreq_governor *t;
296 
297 	list_for_each_entry(t, &cpufreq_governor_list, governor_list)
298 		if (!strnicmp(str_governor,t->name,CPUFREQ_NAME_LEN))
299 			return t;
300 
301 	return NULL;
302 }
303 
304 /**
305  * cpufreq_parse_governor - parse a governor string
306  */
307 static int cpufreq_parse_governor (char *str_governor, unsigned int *policy,
308 				struct cpufreq_governor **governor)
309 {
310 	int err = -EINVAL;
311 
312 	if (!cpufreq_driver)
313 		goto out;
314 
315 	if (cpufreq_driver->setpolicy) {
316 		if (!strnicmp(str_governor, "performance", CPUFREQ_NAME_LEN)) {
317 			*policy = CPUFREQ_POLICY_PERFORMANCE;
318 			err = 0;
319 		} else if (!strnicmp(str_governor, "powersave", CPUFREQ_NAME_LEN)) {
320 			*policy = CPUFREQ_POLICY_POWERSAVE;
321 			err = 0;
322 		}
323 	} else if (cpufreq_driver->target) {
324 		struct cpufreq_governor *t;
325 
326 		mutex_lock(&cpufreq_governor_mutex);
327 
328 		t = __find_governor(str_governor);
329 
330 		if (t == NULL) {
331 			char *name = kasprintf(GFP_KERNEL, "cpufreq_%s", str_governor);
332 
333 			if (name) {
334 				int ret;
335 
336 				mutex_unlock(&cpufreq_governor_mutex);
337 				ret = request_module(name);
338 				mutex_lock(&cpufreq_governor_mutex);
339 
340 				if (ret == 0)
341 					t = __find_governor(str_governor);
342 			}
343 
344 			kfree(name);
345 		}
346 
347 		if (t != NULL) {
348 			*governor = t;
349 			err = 0;
350 		}
351 
352 		mutex_unlock(&cpufreq_governor_mutex);
353 	}
354   out:
355 	return err;
356 }
357 
358 
359 /* drivers/base/cpu.c */
360 extern struct sysdev_class cpu_sysdev_class;
361 
362 
363 /**
364  * cpufreq_per_cpu_attr_read() / show_##file_name() - print out cpufreq information
365  *
366  * Write out information from cpufreq_driver->policy[cpu]; object must be
367  * "unsigned int".
368  */
369 
370 #define show_one(file_name, object)			\
371 static ssize_t show_##file_name				\
372 (struct cpufreq_policy * policy, char *buf)		\
373 {							\
374 	return sprintf (buf, "%u\n", policy->object);	\
375 }
376 
377 show_one(cpuinfo_min_freq, cpuinfo.min_freq);
378 show_one(cpuinfo_max_freq, cpuinfo.max_freq);
379 show_one(scaling_min_freq, min);
380 show_one(scaling_max_freq, max);
381 show_one(scaling_cur_freq, cur);
382 
383 static int __cpufreq_set_policy(struct cpufreq_policy *data, struct cpufreq_policy *policy);
384 
385 /**
386  * cpufreq_per_cpu_attr_write() / store_##file_name() - sysfs write access
387  */
388 #define store_one(file_name, object)			\
389 static ssize_t store_##file_name					\
390 (struct cpufreq_policy * policy, const char *buf, size_t count)		\
391 {									\
392 	unsigned int ret = -EINVAL;					\
393 	struct cpufreq_policy new_policy;				\
394 									\
395 	ret = cpufreq_get_policy(&new_policy, policy->cpu);		\
396 	if (ret)							\
397 		return -EINVAL;						\
398 									\
399 	ret = sscanf (buf, "%u", &new_policy.object);			\
400 	if (ret != 1)							\
401 		return -EINVAL;						\
402 									\
403 	lock_cpu_hotplug();						\
404 	mutex_lock(&policy->lock);					\
405 	ret = __cpufreq_set_policy(policy, &new_policy);		\
406 	policy->user_policy.object = policy->object;			\
407 	mutex_unlock(&policy->lock);					\
408 	unlock_cpu_hotplug();						\
409 									\
410 	return ret ? ret : count;					\
411 }
412 
413 store_one(scaling_min_freq,min);
414 store_one(scaling_max_freq,max);
415 
416 /**
417  * show_cpuinfo_cur_freq - current CPU frequency as detected by hardware
418  */
419 static ssize_t show_cpuinfo_cur_freq (struct cpufreq_policy * policy, char *buf)
420 {
421 	unsigned int cur_freq = cpufreq_get(policy->cpu);
422 	if (!cur_freq)
423 		return sprintf(buf, "<unknown>");
424 	return sprintf(buf, "%u\n", cur_freq);
425 }
426 
427 
428 /**
429  * show_scaling_governor - show the current policy for the specified CPU
430  */
431 static ssize_t show_scaling_governor (struct cpufreq_policy * policy, char *buf)
432 {
433 	if(policy->policy == CPUFREQ_POLICY_POWERSAVE)
434 		return sprintf(buf, "powersave\n");
435 	else if (policy->policy == CPUFREQ_POLICY_PERFORMANCE)
436 		return sprintf(buf, "performance\n");
437 	else if (policy->governor)
438 		return scnprintf(buf, CPUFREQ_NAME_LEN, "%s\n", policy->governor->name);
439 	return -EINVAL;
440 }
441 
442 
443 /**
444  * store_scaling_governor - store policy for the specified CPU
445  */
446 static ssize_t store_scaling_governor (struct cpufreq_policy * policy,
447 				       const char *buf, size_t count)
448 {
449 	unsigned int ret = -EINVAL;
450 	char	str_governor[16];
451 	struct cpufreq_policy new_policy;
452 
453 	ret = cpufreq_get_policy(&new_policy, policy->cpu);
454 	if (ret)
455 		return ret;
456 
457 	ret = sscanf (buf, "%15s", str_governor);
458 	if (ret != 1)
459 		return -EINVAL;
460 
461 	if (cpufreq_parse_governor(str_governor, &new_policy.policy, &new_policy.governor))
462 		return -EINVAL;
463 
464 	lock_cpu_hotplug();
465 
466 	/* Do not use cpufreq_set_policy here or the user_policy.max
467 	   will be wrongly overridden */
468 	mutex_lock(&policy->lock);
469 	ret = __cpufreq_set_policy(policy, &new_policy);
470 
471 	policy->user_policy.policy = policy->policy;
472 	policy->user_policy.governor = policy->governor;
473 	mutex_unlock(&policy->lock);
474 
475 	unlock_cpu_hotplug();
476 
477 	return ret ? ret : count;
478 }
479 
480 /**
481  * show_scaling_driver - show the cpufreq driver currently loaded
482  */
483 static ssize_t show_scaling_driver (struct cpufreq_policy * policy, char *buf)
484 {
485 	return scnprintf(buf, CPUFREQ_NAME_LEN, "%s\n", cpufreq_driver->name);
486 }
487 
488 /**
489  * show_scaling_available_governors - show the available CPUfreq governors
490  */
491 static ssize_t show_scaling_available_governors (struct cpufreq_policy * policy,
492 				char *buf)
493 {
494 	ssize_t i = 0;
495 	struct cpufreq_governor *t;
496 
497 	if (!cpufreq_driver->target) {
498 		i += sprintf(buf, "performance powersave");
499 		goto out;
500 	}
501 
502 	list_for_each_entry(t, &cpufreq_governor_list, governor_list) {
503 		if (i >= (ssize_t) ((PAGE_SIZE / sizeof(char)) - (CPUFREQ_NAME_LEN + 2)))
504 			goto out;
505 		i += scnprintf(&buf[i], CPUFREQ_NAME_LEN, "%s ", t->name);
506 	}
507 out:
508 	i += sprintf(&buf[i], "\n");
509 	return i;
510 }
511 /**
512  * show_affected_cpus - show the CPUs affected by each transition
513  */
514 static ssize_t show_affected_cpus (struct cpufreq_policy * policy, char *buf)
515 {
516 	ssize_t i = 0;
517 	unsigned int cpu;
518 
519 	for_each_cpu_mask(cpu, policy->cpus) {
520 		if (i)
521 			i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), " ");
522 		i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), "%u", cpu);
523 		if (i >= (PAGE_SIZE - 5))
524 		    break;
525 	}
526 	i += sprintf(&buf[i], "\n");
527 	return i;
528 }
529 
530 
531 #define define_one_ro(_name) \
532 static struct freq_attr _name = \
533 __ATTR(_name, 0444, show_##_name, NULL)
534 
535 #define define_one_ro0400(_name) \
536 static struct freq_attr _name = \
537 __ATTR(_name, 0400, show_##_name, NULL)
538 
539 #define define_one_rw(_name) \
540 static struct freq_attr _name = \
541 __ATTR(_name, 0644, show_##_name, store_##_name)
542 
543 define_one_ro0400(cpuinfo_cur_freq);
544 define_one_ro(cpuinfo_min_freq);
545 define_one_ro(cpuinfo_max_freq);
546 define_one_ro(scaling_available_governors);
547 define_one_ro(scaling_driver);
548 define_one_ro(scaling_cur_freq);
549 define_one_ro(affected_cpus);
550 define_one_rw(scaling_min_freq);
551 define_one_rw(scaling_max_freq);
552 define_one_rw(scaling_governor);
553 
554 static struct attribute * default_attrs[] = {
555 	&cpuinfo_min_freq.attr,
556 	&cpuinfo_max_freq.attr,
557 	&scaling_min_freq.attr,
558 	&scaling_max_freq.attr,
559 	&affected_cpus.attr,
560 	&scaling_governor.attr,
561 	&scaling_driver.attr,
562 	&scaling_available_governors.attr,
563 	NULL
564 };
565 
566 #define to_policy(k) container_of(k,struct cpufreq_policy,kobj)
567 #define to_attr(a) container_of(a,struct freq_attr,attr)
568 
569 static ssize_t show(struct kobject * kobj, struct attribute * attr ,char * buf)
570 {
571 	struct cpufreq_policy * policy = to_policy(kobj);
572 	struct freq_attr * fattr = to_attr(attr);
573 	ssize_t ret;
574 	policy = cpufreq_cpu_get(policy->cpu);
575 	if (!policy)
576 		return -EINVAL;
577 	ret = fattr->show ? fattr->show(policy,buf) : -EIO;
578 	cpufreq_cpu_put(policy);
579 	return ret;
580 }
581 
582 static ssize_t store(struct kobject * kobj, struct attribute * attr,
583 		     const char * buf, size_t count)
584 {
585 	struct cpufreq_policy * policy = to_policy(kobj);
586 	struct freq_attr * fattr = to_attr(attr);
587 	ssize_t ret;
588 	policy = cpufreq_cpu_get(policy->cpu);
589 	if (!policy)
590 		return -EINVAL;
591 	ret = fattr->store ? fattr->store(policy,buf,count) : -EIO;
592 	cpufreq_cpu_put(policy);
593 	return ret;
594 }
595 
596 static void cpufreq_sysfs_release(struct kobject * kobj)
597 {
598 	struct cpufreq_policy * policy = to_policy(kobj);
599 	dprintk("last reference is dropped\n");
600 	complete(&policy->kobj_unregister);
601 }
602 
603 static struct sysfs_ops sysfs_ops = {
604 	.show	= show,
605 	.store	= store,
606 };
607 
608 static struct kobj_type ktype_cpufreq = {
609 	.sysfs_ops	= &sysfs_ops,
610 	.default_attrs	= default_attrs,
611 	.release	= cpufreq_sysfs_release,
612 };
613 
614 
615 /**
616  * cpufreq_add_dev - add a CPU device
617  *
618  * Adds the cpufreq interface for a CPU device.
619  */
620 static int cpufreq_add_dev (struct sys_device * sys_dev)
621 {
622 	unsigned int cpu = sys_dev->id;
623 	int ret = 0;
624 	struct cpufreq_policy new_policy;
625 	struct cpufreq_policy *policy;
626 	struct freq_attr **drv_attr;
627 	struct sys_device *cpu_sys_dev;
628 	unsigned long flags;
629 	unsigned int j;
630 #ifdef CONFIG_SMP
631 	struct cpufreq_policy *managed_policy;
632 #endif
633 
634 	if (cpu_is_offline(cpu))
635 		return 0;
636 
637 	cpufreq_debug_disable_ratelimit();
638 	dprintk("adding CPU %u\n", cpu);
639 
640 #ifdef CONFIG_SMP
641 	/* check whether a different CPU already registered this
642 	 * CPU because it is in the same boat. */
643 	policy = cpufreq_cpu_get(cpu);
644 	if (unlikely(policy)) {
645 		cpufreq_cpu_put(policy);
646 		cpufreq_debug_enable_ratelimit();
647 		return 0;
648 	}
649 #endif
650 
651 	if (!try_module_get(cpufreq_driver->owner)) {
652 		ret = -EINVAL;
653 		goto module_out;
654 	}
655 
656 	policy = kzalloc(sizeof(struct cpufreq_policy), GFP_KERNEL);
657 	if (!policy) {
658 		ret = -ENOMEM;
659 		goto nomem_out;
660 	}
661 
662 	policy->cpu = cpu;
663 	policy->cpus = cpumask_of_cpu(cpu);
664 
665 	mutex_init(&policy->lock);
666 	mutex_lock(&policy->lock);
667 	init_completion(&policy->kobj_unregister);
668 	INIT_WORK(&policy->update, handle_update);
669 
670 	/* call driver. From then on the cpufreq must be able
671 	 * to accept all calls to ->verify and ->setpolicy for this CPU
672 	 */
673 	ret = cpufreq_driver->init(policy);
674 	if (ret) {
675 		dprintk("initialization failed\n");
676 		mutex_unlock(&policy->lock);
677 		goto err_out;
678 	}
679 
680 #ifdef CONFIG_SMP
681 	for_each_cpu_mask(j, policy->cpus) {
682 		if (cpu == j)
683 			continue;
684 
685 		/* check for existing affected CPUs.  They may not be aware
686 		 * of it due to CPU Hotplug.
687 		 */
688 		managed_policy = cpufreq_cpu_get(j);
689 		if (unlikely(managed_policy)) {
690 			spin_lock_irqsave(&cpufreq_driver_lock, flags);
691 			managed_policy->cpus = policy->cpus;
692 			cpufreq_cpu_data[cpu] = managed_policy;
693 			spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
694 
695 			dprintk("CPU already managed, adding link\n");
696 			sysfs_create_link(&sys_dev->kobj,
697 					  &managed_policy->kobj, "cpufreq");
698 
699 			cpufreq_debug_enable_ratelimit();
700 			mutex_unlock(&policy->lock);
701 			ret = 0;
702 			goto err_out_driver_exit; /* call driver->exit() */
703 		}
704 	}
705 #endif
706 	memcpy(&new_policy, policy, sizeof(struct cpufreq_policy));
707 
708 	/* prepare interface data */
709 	policy->kobj.parent = &sys_dev->kobj;
710 	policy->kobj.ktype = &ktype_cpufreq;
711 	strlcpy(policy->kobj.name, "cpufreq", KOBJ_NAME_LEN);
712 
713 	ret = kobject_register(&policy->kobj);
714 	if (ret) {
715 		mutex_unlock(&policy->lock);
716 		goto err_out_driver_exit;
717 	}
718 	/* set up files for this cpu device */
719 	drv_attr = cpufreq_driver->attr;
720 	while ((drv_attr) && (*drv_attr)) {
721 		sysfs_create_file(&policy->kobj, &((*drv_attr)->attr));
722 		drv_attr++;
723 	}
724 	if (cpufreq_driver->get)
725 		sysfs_create_file(&policy->kobj, &cpuinfo_cur_freq.attr);
726 	if (cpufreq_driver->target)
727 		sysfs_create_file(&policy->kobj, &scaling_cur_freq.attr);
728 
729 	spin_lock_irqsave(&cpufreq_driver_lock, flags);
730 	for_each_cpu_mask(j, policy->cpus)
731 		cpufreq_cpu_data[j] = policy;
732 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
733 
734 	/* symlink affected CPUs */
735 	for_each_cpu_mask(j, policy->cpus) {
736 		if (j == cpu)
737 			continue;
738 		if (!cpu_online(j))
739 			continue;
740 
741 		dprintk("CPU %u already managed, adding link\n", j);
742 		cpufreq_cpu_get(cpu);
743 		cpu_sys_dev = get_cpu_sysdev(j);
744 		sysfs_create_link(&cpu_sys_dev->kobj, &policy->kobj,
745 				  "cpufreq");
746 	}
747 
748 	policy->governor = NULL; /* to assure that the starting sequence is
749 				  * run in cpufreq_set_policy */
750 	mutex_unlock(&policy->lock);
751 
752 	/* set default policy */
753 	ret = cpufreq_set_policy(&new_policy);
754 	if (ret) {
755 		dprintk("setting policy failed\n");
756 		goto err_out_unregister;
757 	}
758 
759 	module_put(cpufreq_driver->owner);
760 	dprintk("initialization complete\n");
761 	cpufreq_debug_enable_ratelimit();
762 
763 	return 0;
764 
765 
766 err_out_unregister:
767 	spin_lock_irqsave(&cpufreq_driver_lock, flags);
768 	for_each_cpu_mask(j, policy->cpus)
769 		cpufreq_cpu_data[j] = NULL;
770 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
771 
772 	kobject_unregister(&policy->kobj);
773 	wait_for_completion(&policy->kobj_unregister);
774 
775 err_out_driver_exit:
776 	if (cpufreq_driver->exit)
777 		cpufreq_driver->exit(policy);
778 
779 err_out:
780 	kfree(policy);
781 
782 nomem_out:
783 	module_put(cpufreq_driver->owner);
784 module_out:
785 	cpufreq_debug_enable_ratelimit();
786 	return ret;
787 }
788 
789 
790 /**
791  * cpufreq_remove_dev - remove a CPU device
792  *
793  * Removes the cpufreq interface for a CPU device.
794  */
795 static int cpufreq_remove_dev (struct sys_device * sys_dev)
796 {
797 	unsigned int cpu = sys_dev->id;
798 	unsigned long flags;
799 	struct cpufreq_policy *data;
800 #ifdef CONFIG_SMP
801 	struct sys_device *cpu_sys_dev;
802 	unsigned int j;
803 #endif
804 
805 	cpufreq_debug_disable_ratelimit();
806 	dprintk("unregistering CPU %u\n", cpu);
807 
808 	spin_lock_irqsave(&cpufreq_driver_lock, flags);
809 	data = cpufreq_cpu_data[cpu];
810 
811 	if (!data) {
812 		spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
813 		cpufreq_debug_enable_ratelimit();
814 		return -EINVAL;
815 	}
816 	cpufreq_cpu_data[cpu] = NULL;
817 
818 
819 #ifdef CONFIG_SMP
820 	/* if this isn't the CPU which is the parent of the kobj, we
821 	 * only need to unlink, put and exit
822 	 */
823 	if (unlikely(cpu != data->cpu)) {
824 		dprintk("removing link\n");
825 		cpu_clear(cpu, data->cpus);
826 		spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
827 		sysfs_remove_link(&sys_dev->kobj, "cpufreq");
828 		cpufreq_cpu_put(data);
829 		cpufreq_debug_enable_ratelimit();
830 		return 0;
831 	}
832 #endif
833 
834 
835 	if (!kobject_get(&data->kobj)) {
836 		spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
837 		cpufreq_debug_enable_ratelimit();
838 		return -EFAULT;
839 	}
840 
841 #ifdef CONFIG_SMP
842 	/* if we have other CPUs still registered, we need to unlink them,
843 	 * or else wait_for_completion below will lock up. Clean the
844 	 * cpufreq_cpu_data[] while holding the lock, and remove the sysfs
845 	 * links afterwards.
846 	 */
847 	if (unlikely(cpus_weight(data->cpus) > 1)) {
848 		for_each_cpu_mask(j, data->cpus) {
849 			if (j == cpu)
850 				continue;
851 			cpufreq_cpu_data[j] = NULL;
852 		}
853 	}
854 
855 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
856 
857 	if (unlikely(cpus_weight(data->cpus) > 1)) {
858 		for_each_cpu_mask(j, data->cpus) {
859 			if (j == cpu)
860 				continue;
861 			dprintk("removing link for cpu %u\n", j);
862 			cpu_sys_dev = get_cpu_sysdev(j);
863 			sysfs_remove_link(&cpu_sys_dev->kobj, "cpufreq");
864 			cpufreq_cpu_put(data);
865 		}
866 	}
867 #else
868 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
869 #endif
870 
871 	mutex_lock(&data->lock);
872 	if (cpufreq_driver->target)
873 		__cpufreq_governor(data, CPUFREQ_GOV_STOP);
874 	mutex_unlock(&data->lock);
875 
876 	kobject_unregister(&data->kobj);
877 
878 	kobject_put(&data->kobj);
879 
880 	/* we need to make sure that the underlying kobj is actually
881 	 * not referenced anymore by anybody before we proceed with
882 	 * unloading.
883 	 */
884 	dprintk("waiting for dropping of refcount\n");
885 	wait_for_completion(&data->kobj_unregister);
886 	dprintk("wait complete\n");
887 
888 	if (cpufreq_driver->exit)
889 		cpufreq_driver->exit(data);
890 
891 	kfree(data);
892 
893 	cpufreq_debug_enable_ratelimit();
894 	return 0;
895 }
896 
897 
898 static void handle_update(struct work_struct *work)
899 {
900 	struct cpufreq_policy *policy =
901 		container_of(work, struct cpufreq_policy, update);
902 	unsigned int cpu = policy->cpu;
903 	dprintk("handle_update for cpu %u called\n", cpu);
904 	cpufreq_update_policy(cpu);
905 }
906 
907 /**
908  *	cpufreq_out_of_sync - If actual and saved CPU frequency differs, we're in deep trouble.
909  *	@cpu: cpu number
910  *	@old_freq: CPU frequency the kernel thinks the CPU runs at
911  *	@new_freq: CPU frequency the CPU actually runs at
912  *
913  *	We adjust to current frequency first, and need to clean up later. So either call
914  *	to cpufreq_update_policy() or schedule handle_update()).
915  */
916 static void cpufreq_out_of_sync(unsigned int cpu, unsigned int old_freq, unsigned int new_freq)
917 {
918 	struct cpufreq_freqs freqs;
919 
920 	dprintk("Warning: CPU frequency out of sync: cpufreq and timing "
921 	       "core thinks of %u, is %u kHz.\n", old_freq, new_freq);
922 
923 	freqs.cpu = cpu;
924 	freqs.old = old_freq;
925 	freqs.new = new_freq;
926 	cpufreq_notify_transition(&freqs, CPUFREQ_PRECHANGE);
927 	cpufreq_notify_transition(&freqs, CPUFREQ_POSTCHANGE);
928 }
929 
930 
931 /**
932  * cpufreq_quick_get - get the CPU frequency (in kHz) frpm policy->cur
933  * @cpu: CPU number
934  *
935  * This is the last known freq, without actually getting it from the driver.
936  * Return value will be same as what is shown in scaling_cur_freq in sysfs.
937  */
938 unsigned int cpufreq_quick_get(unsigned int cpu)
939 {
940 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
941 	unsigned int ret = 0;
942 
943 	if (policy) {
944 		mutex_lock(&policy->lock);
945 		ret = policy->cur;
946 		mutex_unlock(&policy->lock);
947 		cpufreq_cpu_put(policy);
948 	}
949 
950 	return (ret);
951 }
952 EXPORT_SYMBOL(cpufreq_quick_get);
953 
954 
955 /**
956  * cpufreq_get - get the current CPU frequency (in kHz)
957  * @cpu: CPU number
958  *
959  * Get the CPU current (static) CPU frequency
960  */
961 unsigned int cpufreq_get(unsigned int cpu)
962 {
963 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
964 	unsigned int ret = 0;
965 
966 	if (!policy)
967 		return 0;
968 
969 	if (!cpufreq_driver->get)
970 		goto out;
971 
972 	mutex_lock(&policy->lock);
973 
974 	ret = cpufreq_driver->get(cpu);
975 
976 	if (ret && policy->cur && !(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
977 		/* verify no discrepancy between actual and saved value exists */
978 		if (unlikely(ret != policy->cur)) {
979 			cpufreq_out_of_sync(cpu, policy->cur, ret);
980 			schedule_work(&policy->update);
981 		}
982 	}
983 
984 	mutex_unlock(&policy->lock);
985 
986 out:
987 	cpufreq_cpu_put(policy);
988 
989 	return (ret);
990 }
991 EXPORT_SYMBOL(cpufreq_get);
992 
993 
994 /**
995  *	cpufreq_suspend - let the low level driver prepare for suspend
996  */
997 
998 static int cpufreq_suspend(struct sys_device * sysdev, pm_message_t pmsg)
999 {
1000 	int cpu = sysdev->id;
1001 	unsigned int ret = 0;
1002 	unsigned int cur_freq = 0;
1003 	struct cpufreq_policy *cpu_policy;
1004 
1005 	dprintk("suspending cpu %u\n", cpu);
1006 
1007 	if (!cpu_online(cpu))
1008 		return 0;
1009 
1010 	/* we may be lax here as interrupts are off. Nonetheless
1011 	 * we need to grab the correct cpu policy, as to check
1012 	 * whether we really run on this CPU.
1013 	 */
1014 
1015 	cpu_policy = cpufreq_cpu_get(cpu);
1016 	if (!cpu_policy)
1017 		return -EINVAL;
1018 
1019 	/* only handle each CPU group once */
1020 	if (unlikely(cpu_policy->cpu != cpu)) {
1021 		cpufreq_cpu_put(cpu_policy);
1022 		return 0;
1023 	}
1024 
1025 	if (cpufreq_driver->suspend) {
1026 		ret = cpufreq_driver->suspend(cpu_policy, pmsg);
1027 		if (ret) {
1028 			printk(KERN_ERR "cpufreq: suspend failed in ->suspend "
1029 					"step on CPU %u\n", cpu_policy->cpu);
1030 			cpufreq_cpu_put(cpu_policy);
1031 			return ret;
1032 		}
1033 	}
1034 
1035 
1036 	if (cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)
1037 		goto out;
1038 
1039 	if (cpufreq_driver->get)
1040 		cur_freq = cpufreq_driver->get(cpu_policy->cpu);
1041 
1042 	if (!cur_freq || !cpu_policy->cur) {
1043 		printk(KERN_ERR "cpufreq: suspend failed to assert current "
1044 		       "frequency is what timing core thinks it is.\n");
1045 		goto out;
1046 	}
1047 
1048 	if (unlikely(cur_freq != cpu_policy->cur)) {
1049 		struct cpufreq_freqs freqs;
1050 
1051 		if (!(cpufreq_driver->flags & CPUFREQ_PM_NO_WARN))
1052 			dprintk("Warning: CPU frequency is %u, "
1053 			       "cpufreq assumed %u kHz.\n",
1054 			       cur_freq, cpu_policy->cur);
1055 
1056 		freqs.cpu = cpu;
1057 		freqs.old = cpu_policy->cur;
1058 		freqs.new = cur_freq;
1059 
1060 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
1061 				    CPUFREQ_SUSPENDCHANGE, &freqs);
1062 		adjust_jiffies(CPUFREQ_SUSPENDCHANGE, &freqs);
1063 
1064 		cpu_policy->cur = cur_freq;
1065 	}
1066 
1067 out:
1068 	cpufreq_cpu_put(cpu_policy);
1069 	return 0;
1070 }
1071 
1072 /**
1073  *	cpufreq_resume -  restore proper CPU frequency handling after resume
1074  *
1075  *	1.) resume CPUfreq hardware support (cpufreq_driver->resume())
1076  *	2.) if ->target and !CPUFREQ_CONST_LOOPS: verify we're in sync
1077  *	3.) schedule call cpufreq_update_policy() ASAP as interrupts are
1078  *	    restored.
1079  */
1080 static int cpufreq_resume(struct sys_device * sysdev)
1081 {
1082 	int cpu = sysdev->id;
1083 	unsigned int ret = 0;
1084 	struct cpufreq_policy *cpu_policy;
1085 
1086 	dprintk("resuming cpu %u\n", cpu);
1087 
1088 	if (!cpu_online(cpu))
1089 		return 0;
1090 
1091 	/* we may be lax here as interrupts are off. Nonetheless
1092 	 * we need to grab the correct cpu policy, as to check
1093 	 * whether we really run on this CPU.
1094 	 */
1095 
1096 	cpu_policy = cpufreq_cpu_get(cpu);
1097 	if (!cpu_policy)
1098 		return -EINVAL;
1099 
1100 	/* only handle each CPU group once */
1101 	if (unlikely(cpu_policy->cpu != cpu)) {
1102 		cpufreq_cpu_put(cpu_policy);
1103 		return 0;
1104 	}
1105 
1106 	if (cpufreq_driver->resume) {
1107 		ret = cpufreq_driver->resume(cpu_policy);
1108 		if (ret) {
1109 			printk(KERN_ERR "cpufreq: resume failed in ->resume "
1110 					"step on CPU %u\n", cpu_policy->cpu);
1111 			cpufreq_cpu_put(cpu_policy);
1112 			return ret;
1113 		}
1114 	}
1115 
1116 	if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
1117 		unsigned int cur_freq = 0;
1118 
1119 		if (cpufreq_driver->get)
1120 			cur_freq = cpufreq_driver->get(cpu_policy->cpu);
1121 
1122 		if (!cur_freq || !cpu_policy->cur) {
1123 			printk(KERN_ERR "cpufreq: resume failed to assert "
1124 					"current frequency is what timing core "
1125 					"thinks it is.\n");
1126 			goto out;
1127 		}
1128 
1129 		if (unlikely(cur_freq != cpu_policy->cur)) {
1130 			struct cpufreq_freqs freqs;
1131 
1132 			if (!(cpufreq_driver->flags & CPUFREQ_PM_NO_WARN))
1133 				dprintk("Warning: CPU frequency"
1134 				       "is %u, cpufreq assumed %u kHz.\n",
1135 				       cur_freq, cpu_policy->cur);
1136 
1137 			freqs.cpu = cpu;
1138 			freqs.old = cpu_policy->cur;
1139 			freqs.new = cur_freq;
1140 
1141 			srcu_notifier_call_chain(
1142 					&cpufreq_transition_notifier_list,
1143 					CPUFREQ_RESUMECHANGE, &freqs);
1144 			adjust_jiffies(CPUFREQ_RESUMECHANGE, &freqs);
1145 
1146 			cpu_policy->cur = cur_freq;
1147 		}
1148 	}
1149 
1150 out:
1151 	schedule_work(&cpu_policy->update);
1152 	cpufreq_cpu_put(cpu_policy);
1153 	return ret;
1154 }
1155 
1156 static struct sysdev_driver cpufreq_sysdev_driver = {
1157 	.add		= cpufreq_add_dev,
1158 	.remove		= cpufreq_remove_dev,
1159 	.suspend	= cpufreq_suspend,
1160 	.resume		= cpufreq_resume,
1161 };
1162 
1163 
1164 /*********************************************************************
1165  *                     NOTIFIER LISTS INTERFACE                      *
1166  *********************************************************************/
1167 
1168 /**
1169  *	cpufreq_register_notifier - register a driver with cpufreq
1170  *	@nb: notifier function to register
1171  *      @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1172  *
1173  *	Add a driver to one of two lists: either a list of drivers that
1174  *      are notified about clock rate changes (once before and once after
1175  *      the transition), or a list of drivers that are notified about
1176  *      changes in cpufreq policy.
1177  *
1178  *	This function may sleep, and has the same return conditions as
1179  *	blocking_notifier_chain_register.
1180  */
1181 int cpufreq_register_notifier(struct notifier_block *nb, unsigned int list)
1182 {
1183 	int ret;
1184 
1185 	switch (list) {
1186 	case CPUFREQ_TRANSITION_NOTIFIER:
1187 		ret = srcu_notifier_chain_register(
1188 				&cpufreq_transition_notifier_list, nb);
1189 		break;
1190 	case CPUFREQ_POLICY_NOTIFIER:
1191 		ret = blocking_notifier_chain_register(
1192 				&cpufreq_policy_notifier_list, nb);
1193 		break;
1194 	default:
1195 		ret = -EINVAL;
1196 	}
1197 
1198 	return ret;
1199 }
1200 EXPORT_SYMBOL(cpufreq_register_notifier);
1201 
1202 
1203 /**
1204  *	cpufreq_unregister_notifier - unregister a driver with cpufreq
1205  *	@nb: notifier block to be unregistered
1206  *      @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1207  *
1208  *	Remove a driver from the CPU frequency notifier list.
1209  *
1210  *	This function may sleep, and has the same return conditions as
1211  *	blocking_notifier_chain_unregister.
1212  */
1213 int cpufreq_unregister_notifier(struct notifier_block *nb, unsigned int list)
1214 {
1215 	int ret;
1216 
1217 	switch (list) {
1218 	case CPUFREQ_TRANSITION_NOTIFIER:
1219 		ret = srcu_notifier_chain_unregister(
1220 				&cpufreq_transition_notifier_list, nb);
1221 		break;
1222 	case CPUFREQ_POLICY_NOTIFIER:
1223 		ret = blocking_notifier_chain_unregister(
1224 				&cpufreq_policy_notifier_list, nb);
1225 		break;
1226 	default:
1227 		ret = -EINVAL;
1228 	}
1229 
1230 	return ret;
1231 }
1232 EXPORT_SYMBOL(cpufreq_unregister_notifier);
1233 
1234 
1235 /*********************************************************************
1236  *                              GOVERNORS                            *
1237  *********************************************************************/
1238 
1239 
1240 /* Must be called with lock_cpu_hotplug held */
1241 int __cpufreq_driver_target(struct cpufreq_policy *policy,
1242 			    unsigned int target_freq,
1243 			    unsigned int relation)
1244 {
1245 	int retval = -EINVAL;
1246 
1247 	dprintk("target for CPU %u: %u kHz, relation %u\n", policy->cpu,
1248 		target_freq, relation);
1249 	if (cpu_online(policy->cpu) && cpufreq_driver->target)
1250 		retval = cpufreq_driver->target(policy, target_freq, relation);
1251 
1252 	return retval;
1253 }
1254 EXPORT_SYMBOL_GPL(__cpufreq_driver_target);
1255 
1256 int cpufreq_driver_target(struct cpufreq_policy *policy,
1257 			  unsigned int target_freq,
1258 			  unsigned int relation)
1259 {
1260 	int ret;
1261 
1262 	policy = cpufreq_cpu_get(policy->cpu);
1263 	if (!policy)
1264 		return -EINVAL;
1265 
1266 	lock_cpu_hotplug();
1267 	mutex_lock(&policy->lock);
1268 
1269 	ret = __cpufreq_driver_target(policy, target_freq, relation);
1270 
1271 	mutex_unlock(&policy->lock);
1272 	unlock_cpu_hotplug();
1273 
1274 	cpufreq_cpu_put(policy);
1275 	return ret;
1276 }
1277 EXPORT_SYMBOL_GPL(cpufreq_driver_target);
1278 
1279 /*
1280  * Locking: Must be called with the lock_cpu_hotplug() lock held
1281  * when "event" is CPUFREQ_GOV_LIMITS
1282  */
1283 
1284 static int __cpufreq_governor(struct cpufreq_policy *policy, unsigned int event)
1285 {
1286 	int ret;
1287 
1288 	if (!try_module_get(policy->governor->owner))
1289 		return -EINVAL;
1290 
1291 	dprintk("__cpufreq_governor for CPU %u, event %u\n", policy->cpu, event);
1292 	ret = policy->governor->governor(policy, event);
1293 
1294 	/* we keep one module reference alive for each CPU governed by this CPU */
1295 	if ((event != CPUFREQ_GOV_START) || ret)
1296 		module_put(policy->governor->owner);
1297 	if ((event == CPUFREQ_GOV_STOP) && !ret)
1298 		module_put(policy->governor->owner);
1299 
1300 	return ret;
1301 }
1302 
1303 
1304 int cpufreq_register_governor(struct cpufreq_governor *governor)
1305 {
1306 	int err;
1307 
1308 	if (!governor)
1309 		return -EINVAL;
1310 
1311 	mutex_lock(&cpufreq_governor_mutex);
1312 
1313 	err = -EBUSY;
1314 	if (__find_governor(governor->name) == NULL) {
1315 		err = 0;
1316 		list_add(&governor->governor_list, &cpufreq_governor_list);
1317 	}
1318 
1319 	mutex_unlock(&cpufreq_governor_mutex);
1320 	return err;
1321 }
1322 EXPORT_SYMBOL_GPL(cpufreq_register_governor);
1323 
1324 
1325 void cpufreq_unregister_governor(struct cpufreq_governor *governor)
1326 {
1327 	if (!governor)
1328 		return;
1329 
1330 	mutex_lock(&cpufreq_governor_mutex);
1331 	list_del(&governor->governor_list);
1332 	mutex_unlock(&cpufreq_governor_mutex);
1333 	return;
1334 }
1335 EXPORT_SYMBOL_GPL(cpufreq_unregister_governor);
1336 
1337 
1338 
1339 /*********************************************************************
1340  *                          POLICY INTERFACE                         *
1341  *********************************************************************/
1342 
1343 /**
1344  * cpufreq_get_policy - get the current cpufreq_policy
1345  * @policy: struct cpufreq_policy into which the current cpufreq_policy is written
1346  *
1347  * Reads the current cpufreq policy.
1348  */
1349 int cpufreq_get_policy(struct cpufreq_policy *policy, unsigned int cpu)
1350 {
1351 	struct cpufreq_policy *cpu_policy;
1352 	if (!policy)
1353 		return -EINVAL;
1354 
1355 	cpu_policy = cpufreq_cpu_get(cpu);
1356 	if (!cpu_policy)
1357 		return -EINVAL;
1358 
1359 	mutex_lock(&cpu_policy->lock);
1360 	memcpy(policy, cpu_policy, sizeof(struct cpufreq_policy));
1361 	mutex_unlock(&cpu_policy->lock);
1362 
1363 	cpufreq_cpu_put(cpu_policy);
1364 	return 0;
1365 }
1366 EXPORT_SYMBOL(cpufreq_get_policy);
1367 
1368 
1369 /*
1370  * Locking: Must be called with the lock_cpu_hotplug() lock held
1371  */
1372 static int __cpufreq_set_policy(struct cpufreq_policy *data, struct cpufreq_policy *policy)
1373 {
1374 	int ret = 0;
1375 
1376 	cpufreq_debug_disable_ratelimit();
1377 	dprintk("setting new policy for CPU %u: %u - %u kHz\n", policy->cpu,
1378 		policy->min, policy->max);
1379 
1380 	memcpy(&policy->cpuinfo, &data->cpuinfo, sizeof(struct cpufreq_cpuinfo));
1381 
1382 	if (policy->min > data->min && policy->min > policy->max) {
1383 		ret = -EINVAL;
1384 		goto error_out;
1385 	}
1386 
1387 	/* verify the cpu speed can be set within this limit */
1388 	ret = cpufreq_driver->verify(policy);
1389 	if (ret)
1390 		goto error_out;
1391 
1392 	/* adjust if necessary - all reasons */
1393 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1394 			CPUFREQ_ADJUST, policy);
1395 
1396 	/* adjust if necessary - hardware incompatibility*/
1397 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1398 			CPUFREQ_INCOMPATIBLE, policy);
1399 
1400 	/* verify the cpu speed can be set within this limit,
1401 	   which might be different to the first one */
1402 	ret = cpufreq_driver->verify(policy);
1403 	if (ret)
1404 		goto error_out;
1405 
1406 	/* notification of the new policy */
1407 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1408 			CPUFREQ_NOTIFY, policy);
1409 
1410 	data->min = policy->min;
1411 	data->max = policy->max;
1412 
1413 	dprintk("new min and max freqs are %u - %u kHz\n", data->min, data->max);
1414 
1415 	if (cpufreq_driver->setpolicy) {
1416 		data->policy = policy->policy;
1417 		dprintk("setting range\n");
1418 		ret = cpufreq_driver->setpolicy(policy);
1419 	} else {
1420 		if (policy->governor != data->governor) {
1421 			/* save old, working values */
1422 			struct cpufreq_governor *old_gov = data->governor;
1423 
1424 			dprintk("governor switch\n");
1425 
1426 			/* end old governor */
1427 			if (data->governor)
1428 				__cpufreq_governor(data, CPUFREQ_GOV_STOP);
1429 
1430 			/* start new governor */
1431 			data->governor = policy->governor;
1432 			if (__cpufreq_governor(data, CPUFREQ_GOV_START)) {
1433 				/* new governor failed, so re-start old one */
1434 				dprintk("starting governor %s failed\n", data->governor->name);
1435 				if (old_gov) {
1436 					data->governor = old_gov;
1437 					__cpufreq_governor(data, CPUFREQ_GOV_START);
1438 				}
1439 				ret = -EINVAL;
1440 				goto error_out;
1441 			}
1442 			/* might be a policy change, too, so fall through */
1443 		}
1444 		dprintk("governor: change or update limits\n");
1445 		__cpufreq_governor(data, CPUFREQ_GOV_LIMITS);
1446 	}
1447 
1448 error_out:
1449 	cpufreq_debug_enable_ratelimit();
1450 	return ret;
1451 }
1452 
1453 /**
1454  *	cpufreq_set_policy - set a new CPUFreq policy
1455  *	@policy: policy to be set.
1456  *
1457  *	Sets a new CPU frequency and voltage scaling policy.
1458  */
1459 int cpufreq_set_policy(struct cpufreq_policy *policy)
1460 {
1461 	int ret = 0;
1462 	struct cpufreq_policy *data;
1463 
1464 	if (!policy)
1465 		return -EINVAL;
1466 
1467 	data = cpufreq_cpu_get(policy->cpu);
1468 	if (!data)
1469 		return -EINVAL;
1470 
1471 	lock_cpu_hotplug();
1472 
1473 	/* lock this CPU */
1474 	mutex_lock(&data->lock);
1475 
1476 	ret = __cpufreq_set_policy(data, policy);
1477 	data->user_policy.min = data->min;
1478 	data->user_policy.max = data->max;
1479 	data->user_policy.policy = data->policy;
1480 	data->user_policy.governor = data->governor;
1481 
1482 	mutex_unlock(&data->lock);
1483 
1484 	unlock_cpu_hotplug();
1485 	cpufreq_cpu_put(data);
1486 
1487 	return ret;
1488 }
1489 EXPORT_SYMBOL(cpufreq_set_policy);
1490 
1491 
1492 /**
1493  *	cpufreq_update_policy - re-evaluate an existing cpufreq policy
1494  *	@cpu: CPU which shall be re-evaluated
1495  *
1496  *	Usefull for policy notifiers which have different necessities
1497  *	at different times.
1498  */
1499 int cpufreq_update_policy(unsigned int cpu)
1500 {
1501 	struct cpufreq_policy *data = cpufreq_cpu_get(cpu);
1502 	struct cpufreq_policy policy;
1503 	int ret = 0;
1504 
1505 	if (!data)
1506 		return -ENODEV;
1507 
1508 	lock_cpu_hotplug();
1509 	mutex_lock(&data->lock);
1510 
1511 	dprintk("updating policy for CPU %u\n", cpu);
1512 	memcpy(&policy, data, sizeof(struct cpufreq_policy));
1513 	policy.min = data->user_policy.min;
1514 	policy.max = data->user_policy.max;
1515 	policy.policy = data->user_policy.policy;
1516 	policy.governor = data->user_policy.governor;
1517 
1518 	/* BIOS might change freq behind our back
1519 	  -> ask driver for current freq and notify governors about a change */
1520 	if (cpufreq_driver->get) {
1521 		policy.cur = cpufreq_driver->get(cpu);
1522 		if (!data->cur) {
1523 			dprintk("Driver did not initialize current freq");
1524 			data->cur = policy.cur;
1525 		} else {
1526 			if (data->cur != policy.cur)
1527 				cpufreq_out_of_sync(cpu, data->cur, policy.cur);
1528 		}
1529 	}
1530 
1531 	ret = __cpufreq_set_policy(data, &policy);
1532 
1533 	mutex_unlock(&data->lock);
1534 	unlock_cpu_hotplug();
1535 	cpufreq_cpu_put(data);
1536 	return ret;
1537 }
1538 EXPORT_SYMBOL(cpufreq_update_policy);
1539 
1540 static int cpufreq_cpu_callback(struct notifier_block *nfb,
1541 					unsigned long action, void *hcpu)
1542 {
1543 	unsigned int cpu = (unsigned long)hcpu;
1544 	struct cpufreq_policy *policy;
1545 	struct sys_device *sys_dev;
1546 
1547 	sys_dev = get_cpu_sysdev(cpu);
1548 
1549 	if (sys_dev) {
1550 		switch (action) {
1551 		case CPU_ONLINE:
1552 			cpufreq_add_dev(sys_dev);
1553 			break;
1554 		case CPU_DOWN_PREPARE:
1555 			/*
1556 			 * We attempt to put this cpu in lowest frequency
1557 			 * possible before going down. This will permit
1558 			 * hardware-managed P-State to switch other related
1559 			 * threads to min or higher speeds if possible.
1560 			 */
1561 			policy = cpufreq_cpu_data[cpu];
1562 			if (policy) {
1563 				cpufreq_driver_target(policy, policy->min,
1564 						CPUFREQ_RELATION_H);
1565 			}
1566 			break;
1567 		case CPU_DEAD:
1568 			cpufreq_remove_dev(sys_dev);
1569 			break;
1570 		}
1571 	}
1572 	return NOTIFY_OK;
1573 }
1574 
1575 static struct notifier_block __cpuinitdata cpufreq_cpu_notifier =
1576 {
1577     .notifier_call = cpufreq_cpu_callback,
1578 };
1579 
1580 /*********************************************************************
1581  *               REGISTER / UNREGISTER CPUFREQ DRIVER                *
1582  *********************************************************************/
1583 
1584 /**
1585  * cpufreq_register_driver - register a CPU Frequency driver
1586  * @driver_data: A struct cpufreq_driver containing the values#
1587  * submitted by the CPU Frequency driver.
1588  *
1589  *   Registers a CPU Frequency driver to this core code. This code
1590  * returns zero on success, -EBUSY when another driver got here first
1591  * (and isn't unregistered in the meantime).
1592  *
1593  */
1594 int cpufreq_register_driver(struct cpufreq_driver *driver_data)
1595 {
1596 	unsigned long flags;
1597 	int ret;
1598 
1599 	if (!driver_data || !driver_data->verify || !driver_data->init ||
1600 	    ((!driver_data->setpolicy) && (!driver_data->target)))
1601 		return -EINVAL;
1602 
1603 	dprintk("trying to register driver %s\n", driver_data->name);
1604 
1605 	if (driver_data->setpolicy)
1606 		driver_data->flags |= CPUFREQ_CONST_LOOPS;
1607 
1608 	spin_lock_irqsave(&cpufreq_driver_lock, flags);
1609 	if (cpufreq_driver) {
1610 		spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1611 		return -EBUSY;
1612 	}
1613 	cpufreq_driver = driver_data;
1614 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1615 
1616 	ret = sysdev_driver_register(&cpu_sysdev_class,&cpufreq_sysdev_driver);
1617 
1618 	if ((!ret) && !(cpufreq_driver->flags & CPUFREQ_STICKY)) {
1619 		int i;
1620 		ret = -ENODEV;
1621 
1622 		/* check for at least one working CPU */
1623 		for (i=0; i<NR_CPUS; i++)
1624 			if (cpufreq_cpu_data[i])
1625 				ret = 0;
1626 
1627 		/* if all ->init() calls failed, unregister */
1628 		if (ret) {
1629 			dprintk("no CPU initialized for driver %s\n", driver_data->name);
1630 			sysdev_driver_unregister(&cpu_sysdev_class, &cpufreq_sysdev_driver);
1631 
1632 			spin_lock_irqsave(&cpufreq_driver_lock, flags);
1633 			cpufreq_driver = NULL;
1634 			spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1635 		}
1636 	}
1637 
1638 	if (!ret) {
1639 		register_hotcpu_notifier(&cpufreq_cpu_notifier);
1640 		dprintk("driver %s up and running\n", driver_data->name);
1641 		cpufreq_debug_enable_ratelimit();
1642 	}
1643 
1644 	return (ret);
1645 }
1646 EXPORT_SYMBOL_GPL(cpufreq_register_driver);
1647 
1648 
1649 /**
1650  * cpufreq_unregister_driver - unregister the current CPUFreq driver
1651  *
1652  *    Unregister the current CPUFreq driver. Only call this if you have
1653  * the right to do so, i.e. if you have succeeded in initialising before!
1654  * Returns zero if successful, and -EINVAL if the cpufreq_driver is
1655  * currently not initialised.
1656  */
1657 int cpufreq_unregister_driver(struct cpufreq_driver *driver)
1658 {
1659 	unsigned long flags;
1660 
1661 	cpufreq_debug_disable_ratelimit();
1662 
1663 	if (!cpufreq_driver || (driver != cpufreq_driver)) {
1664 		cpufreq_debug_enable_ratelimit();
1665 		return -EINVAL;
1666 	}
1667 
1668 	dprintk("unregistering driver %s\n", driver->name);
1669 
1670 	sysdev_driver_unregister(&cpu_sysdev_class, &cpufreq_sysdev_driver);
1671 	unregister_hotcpu_notifier(&cpufreq_cpu_notifier);
1672 
1673 	spin_lock_irqsave(&cpufreq_driver_lock, flags);
1674 	cpufreq_driver = NULL;
1675 	spin_unlock_irqrestore(&cpufreq_driver_lock, flags);
1676 
1677 	return 0;
1678 }
1679 EXPORT_SYMBOL_GPL(cpufreq_unregister_driver);
1680