xref: /linux/drivers/cpufreq/cpufreq.c (revision a224bd36bf5ccc72d0f12ab11216706762133177)
1 /*
2  *  linux/drivers/cpufreq/cpufreq.c
3  *
4  *  Copyright (C) 2001 Russell King
5  *            (C) 2002 - 2003 Dominik Brodowski <linux@brodo.de>
6  *            (C) 2013 Viresh Kumar <viresh.kumar@linaro.org>
7  *
8  *  Oct 2005 - Ashok Raj <ashok.raj@intel.com>
9  *	Added handling for CPU hotplug
10  *  Feb 2006 - Jacob Shin <jacob.shin@amd.com>
11  *	Fix handling for CPU hotplug -- affected CPUs
12  *
13  * This program is free software; you can redistribute it and/or modify
14  * it under the terms of the GNU General Public License version 2 as
15  * published by the Free Software Foundation.
16  */
17 
18 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 
20 #include <linux/cpu.h>
21 #include <linux/cpufreq.h>
22 #include <linux/delay.h>
23 #include <linux/device.h>
24 #include <linux/init.h>
25 #include <linux/kernel_stat.h>
26 #include <linux/module.h>
27 #include <linux/mutex.h>
28 #include <linux/slab.h>
29 #include <linux/syscore_ops.h>
30 #include <linux/tick.h>
31 #include <trace/events/power.h>
32 
33 /**
34  * The "cpufreq driver" - the arch- or hardware-dependent low
35  * level driver of CPUFreq support, and its spinlock. This lock
36  * also protects the cpufreq_cpu_data array.
37  */
38 static struct cpufreq_driver *cpufreq_driver;
39 static DEFINE_PER_CPU(struct cpufreq_policy *, cpufreq_cpu_data);
40 static DEFINE_PER_CPU(struct cpufreq_policy *, cpufreq_cpu_data_fallback);
41 static DEFINE_RWLOCK(cpufreq_driver_lock);
42 static DEFINE_MUTEX(cpufreq_governor_lock);
43 static LIST_HEAD(cpufreq_policy_list);
44 
45 #ifdef CONFIG_HOTPLUG_CPU
46 /* This one keeps track of the previously set governor of a removed CPU */
47 static DEFINE_PER_CPU(char[CPUFREQ_NAME_LEN], cpufreq_cpu_governor);
48 #endif
49 
50 /*
51  * cpu_policy_rwsem is a per CPU reader-writer semaphore designed to cure
52  * all cpufreq/hotplug/workqueue/etc related lock issues.
53  *
54  * The rules for this semaphore:
55  * - Any routine that wants to read from the policy structure will
56  *   do a down_read on this semaphore.
57  * - Any routine that will write to the policy structure and/or may take away
58  *   the policy altogether (eg. CPU hotplug), will hold this lock in write
59  *   mode before doing so.
60  *
61  * Additional rules:
62  * - Governor routines that can be called in cpufreq hotplug path should not
63  *   take this sem as top level hotplug notifier handler takes this.
64  * - Lock should not be held across
65  *     __cpufreq_governor(data, CPUFREQ_GOV_STOP);
66  */
67 static DEFINE_PER_CPU(struct rw_semaphore, cpu_policy_rwsem);
68 
69 #define lock_policy_rwsem(mode, cpu)					\
70 static int lock_policy_rwsem_##mode(int cpu)				\
71 {									\
72 	struct cpufreq_policy *policy = per_cpu(cpufreq_cpu_data, cpu);	\
73 	BUG_ON(!policy);						\
74 	down_##mode(&per_cpu(cpu_policy_rwsem, policy->cpu));		\
75 									\
76 	return 0;							\
77 }
78 
79 lock_policy_rwsem(read, cpu);
80 lock_policy_rwsem(write, cpu);
81 
82 #define unlock_policy_rwsem(mode, cpu)					\
83 static void unlock_policy_rwsem_##mode(int cpu)				\
84 {									\
85 	struct cpufreq_policy *policy = per_cpu(cpufreq_cpu_data, cpu);	\
86 	BUG_ON(!policy);						\
87 	up_##mode(&per_cpu(cpu_policy_rwsem, policy->cpu));		\
88 }
89 
90 unlock_policy_rwsem(read, cpu);
91 unlock_policy_rwsem(write, cpu);
92 
93 /*
94  * rwsem to guarantee that cpufreq driver module doesn't unload during critical
95  * sections
96  */
97 static DECLARE_RWSEM(cpufreq_rwsem);
98 
99 /* internal prototypes */
100 static int __cpufreq_governor(struct cpufreq_policy *policy,
101 		unsigned int event);
102 static unsigned int __cpufreq_get(unsigned int cpu);
103 static void handle_update(struct work_struct *work);
104 
105 /**
106  * Two notifier lists: the "policy" list is involved in the
107  * validation process for a new CPU frequency policy; the
108  * "transition" list for kernel code that needs to handle
109  * changes to devices when the CPU clock speed changes.
110  * The mutex locks both lists.
111  */
112 static BLOCKING_NOTIFIER_HEAD(cpufreq_policy_notifier_list);
113 static struct srcu_notifier_head cpufreq_transition_notifier_list;
114 
115 static bool init_cpufreq_transition_notifier_list_called;
116 static int __init init_cpufreq_transition_notifier_list(void)
117 {
118 	srcu_init_notifier_head(&cpufreq_transition_notifier_list);
119 	init_cpufreq_transition_notifier_list_called = true;
120 	return 0;
121 }
122 pure_initcall(init_cpufreq_transition_notifier_list);
123 
124 static int off __read_mostly;
125 static int cpufreq_disabled(void)
126 {
127 	return off;
128 }
129 void disable_cpufreq(void)
130 {
131 	off = 1;
132 }
133 static LIST_HEAD(cpufreq_governor_list);
134 static DEFINE_MUTEX(cpufreq_governor_mutex);
135 
136 bool have_governor_per_policy(void)
137 {
138 	return cpufreq_driver->have_governor_per_policy;
139 }
140 EXPORT_SYMBOL_GPL(have_governor_per_policy);
141 
142 struct kobject *get_governor_parent_kobj(struct cpufreq_policy *policy)
143 {
144 	if (have_governor_per_policy())
145 		return &policy->kobj;
146 	else
147 		return cpufreq_global_kobject;
148 }
149 EXPORT_SYMBOL_GPL(get_governor_parent_kobj);
150 
151 static inline u64 get_cpu_idle_time_jiffy(unsigned int cpu, u64 *wall)
152 {
153 	u64 idle_time;
154 	u64 cur_wall_time;
155 	u64 busy_time;
156 
157 	cur_wall_time = jiffies64_to_cputime64(get_jiffies_64());
158 
159 	busy_time = kcpustat_cpu(cpu).cpustat[CPUTIME_USER];
160 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_SYSTEM];
161 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_IRQ];
162 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_SOFTIRQ];
163 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_STEAL];
164 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_NICE];
165 
166 	idle_time = cur_wall_time - busy_time;
167 	if (wall)
168 		*wall = cputime_to_usecs(cur_wall_time);
169 
170 	return cputime_to_usecs(idle_time);
171 }
172 
173 u64 get_cpu_idle_time(unsigned int cpu, u64 *wall, int io_busy)
174 {
175 	u64 idle_time = get_cpu_idle_time_us(cpu, io_busy ? wall : NULL);
176 
177 	if (idle_time == -1ULL)
178 		return get_cpu_idle_time_jiffy(cpu, wall);
179 	else if (!io_busy)
180 		idle_time += get_cpu_iowait_time_us(cpu, wall);
181 
182 	return idle_time;
183 }
184 EXPORT_SYMBOL_GPL(get_cpu_idle_time);
185 
186 struct cpufreq_policy *cpufreq_cpu_get(unsigned int cpu)
187 {
188 	struct cpufreq_policy *policy = NULL;
189 	unsigned long flags;
190 
191 	if (cpufreq_disabled() || (cpu >= nr_cpu_ids))
192 		return NULL;
193 
194 	if (!down_read_trylock(&cpufreq_rwsem))
195 		return NULL;
196 
197 	/* get the cpufreq driver */
198 	read_lock_irqsave(&cpufreq_driver_lock, flags);
199 
200 	if (cpufreq_driver) {
201 		/* get the CPU */
202 		policy = per_cpu(cpufreq_cpu_data, cpu);
203 		if (policy)
204 			kobject_get(&policy->kobj);
205 	}
206 
207 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
208 
209 	if (!policy)
210 		up_read(&cpufreq_rwsem);
211 
212 	return policy;
213 }
214 EXPORT_SYMBOL_GPL(cpufreq_cpu_get);
215 
216 void cpufreq_cpu_put(struct cpufreq_policy *policy)
217 {
218 	if (cpufreq_disabled())
219 		return;
220 
221 	kobject_put(&policy->kobj);
222 	up_read(&cpufreq_rwsem);
223 }
224 EXPORT_SYMBOL_GPL(cpufreq_cpu_put);
225 
226 /*********************************************************************
227  *            EXTERNALLY AFFECTING FREQUENCY CHANGES                 *
228  *********************************************************************/
229 
230 /**
231  * adjust_jiffies - adjust the system "loops_per_jiffy"
232  *
233  * This function alters the system "loops_per_jiffy" for the clock
234  * speed change. Note that loops_per_jiffy cannot be updated on SMP
235  * systems as each CPU might be scaled differently. So, use the arch
236  * per-CPU loops_per_jiffy value wherever possible.
237  */
238 #ifndef CONFIG_SMP
239 static unsigned long l_p_j_ref;
240 static unsigned int l_p_j_ref_freq;
241 
242 static void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
243 {
244 	if (ci->flags & CPUFREQ_CONST_LOOPS)
245 		return;
246 
247 	if (!l_p_j_ref_freq) {
248 		l_p_j_ref = loops_per_jiffy;
249 		l_p_j_ref_freq = ci->old;
250 		pr_debug("saving %lu as reference value for loops_per_jiffy; "
251 			"freq is %u kHz\n", l_p_j_ref, l_p_j_ref_freq);
252 	}
253 	if ((val == CPUFREQ_POSTCHANGE && ci->old != ci->new) ||
254 	    (val == CPUFREQ_RESUMECHANGE || val == CPUFREQ_SUSPENDCHANGE)) {
255 		loops_per_jiffy = cpufreq_scale(l_p_j_ref, l_p_j_ref_freq,
256 								ci->new);
257 		pr_debug("scaling loops_per_jiffy to %lu "
258 			"for frequency %u kHz\n", loops_per_jiffy, ci->new);
259 	}
260 }
261 #else
262 static inline void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
263 {
264 	return;
265 }
266 #endif
267 
268 static void __cpufreq_notify_transition(struct cpufreq_policy *policy,
269 		struct cpufreq_freqs *freqs, unsigned int state)
270 {
271 	BUG_ON(irqs_disabled());
272 
273 	if (cpufreq_disabled())
274 		return;
275 
276 	freqs->flags = cpufreq_driver->flags;
277 	pr_debug("notification %u of frequency transition to %u kHz\n",
278 		state, freqs->new);
279 
280 	switch (state) {
281 
282 	case CPUFREQ_PRECHANGE:
283 		/* detect if the driver reported a value as "old frequency"
284 		 * which is not equal to what the cpufreq core thinks is
285 		 * "old frequency".
286 		 */
287 		if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
288 			if ((policy) && (policy->cpu == freqs->cpu) &&
289 			    (policy->cur) && (policy->cur != freqs->old)) {
290 				pr_debug("Warning: CPU frequency is"
291 					" %u, cpufreq assumed %u kHz.\n",
292 					freqs->old, policy->cur);
293 				freqs->old = policy->cur;
294 			}
295 		}
296 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
297 				CPUFREQ_PRECHANGE, freqs);
298 		adjust_jiffies(CPUFREQ_PRECHANGE, freqs);
299 		break;
300 
301 	case CPUFREQ_POSTCHANGE:
302 		adjust_jiffies(CPUFREQ_POSTCHANGE, freqs);
303 		pr_debug("FREQ: %lu - CPU: %lu", (unsigned long)freqs->new,
304 			(unsigned long)freqs->cpu);
305 		trace_cpu_frequency(freqs->new, freqs->cpu);
306 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
307 				CPUFREQ_POSTCHANGE, freqs);
308 		if (likely(policy) && likely(policy->cpu == freqs->cpu))
309 			policy->cur = freqs->new;
310 		break;
311 	}
312 }
313 
314 /**
315  * cpufreq_notify_transition - call notifier chain and adjust_jiffies
316  * on frequency transition.
317  *
318  * This function calls the transition notifiers and the "adjust_jiffies"
319  * function. It is called twice on all CPU frequency changes that have
320  * external effects.
321  */
322 void cpufreq_notify_transition(struct cpufreq_policy *policy,
323 		struct cpufreq_freqs *freqs, unsigned int state)
324 {
325 	for_each_cpu(freqs->cpu, policy->cpus)
326 		__cpufreq_notify_transition(policy, freqs, state);
327 }
328 EXPORT_SYMBOL_GPL(cpufreq_notify_transition);
329 
330 
331 /*********************************************************************
332  *                          SYSFS INTERFACE                          *
333  *********************************************************************/
334 
335 static struct cpufreq_governor *__find_governor(const char *str_governor)
336 {
337 	struct cpufreq_governor *t;
338 
339 	list_for_each_entry(t, &cpufreq_governor_list, governor_list)
340 		if (!strnicmp(str_governor, t->name, CPUFREQ_NAME_LEN))
341 			return t;
342 
343 	return NULL;
344 }
345 
346 /**
347  * cpufreq_parse_governor - parse a governor string
348  */
349 static int cpufreq_parse_governor(char *str_governor, unsigned int *policy,
350 				struct cpufreq_governor **governor)
351 {
352 	int err = -EINVAL;
353 
354 	if (!cpufreq_driver)
355 		goto out;
356 
357 	if (cpufreq_driver->setpolicy) {
358 		if (!strnicmp(str_governor, "performance", CPUFREQ_NAME_LEN)) {
359 			*policy = CPUFREQ_POLICY_PERFORMANCE;
360 			err = 0;
361 		} else if (!strnicmp(str_governor, "powersave",
362 						CPUFREQ_NAME_LEN)) {
363 			*policy = CPUFREQ_POLICY_POWERSAVE;
364 			err = 0;
365 		}
366 	} else if (cpufreq_driver->target) {
367 		struct cpufreq_governor *t;
368 
369 		mutex_lock(&cpufreq_governor_mutex);
370 
371 		t = __find_governor(str_governor);
372 
373 		if (t == NULL) {
374 			int ret;
375 
376 			mutex_unlock(&cpufreq_governor_mutex);
377 			ret = request_module("cpufreq_%s", str_governor);
378 			mutex_lock(&cpufreq_governor_mutex);
379 
380 			if (ret == 0)
381 				t = __find_governor(str_governor);
382 		}
383 
384 		if (t != NULL) {
385 			*governor = t;
386 			err = 0;
387 		}
388 
389 		mutex_unlock(&cpufreq_governor_mutex);
390 	}
391 out:
392 	return err;
393 }
394 
395 /**
396  * cpufreq_per_cpu_attr_read() / show_##file_name() -
397  * print out cpufreq information
398  *
399  * Write out information from cpufreq_driver->policy[cpu]; object must be
400  * "unsigned int".
401  */
402 
403 #define show_one(file_name, object)			\
404 static ssize_t show_##file_name				\
405 (struct cpufreq_policy *policy, char *buf)		\
406 {							\
407 	return sprintf(buf, "%u\n", policy->object);	\
408 }
409 
410 show_one(cpuinfo_min_freq, cpuinfo.min_freq);
411 show_one(cpuinfo_max_freq, cpuinfo.max_freq);
412 show_one(cpuinfo_transition_latency, cpuinfo.transition_latency);
413 show_one(scaling_min_freq, min);
414 show_one(scaling_max_freq, max);
415 show_one(scaling_cur_freq, cur);
416 
417 static int __cpufreq_set_policy(struct cpufreq_policy *policy,
418 				struct cpufreq_policy *new_policy);
419 
420 /**
421  * cpufreq_per_cpu_attr_write() / store_##file_name() - sysfs write access
422  */
423 #define store_one(file_name, object)			\
424 static ssize_t store_##file_name					\
425 (struct cpufreq_policy *policy, const char *buf, size_t count)		\
426 {									\
427 	int ret;							\
428 	struct cpufreq_policy new_policy;				\
429 									\
430 	ret = cpufreq_get_policy(&new_policy, policy->cpu);		\
431 	if (ret)							\
432 		return -EINVAL;						\
433 									\
434 	ret = sscanf(buf, "%u", &new_policy.object);			\
435 	if (ret != 1)							\
436 		return -EINVAL;						\
437 									\
438 	ret = __cpufreq_set_policy(policy, &new_policy);		\
439 	policy->user_policy.object = policy->object;			\
440 									\
441 	return ret ? ret : count;					\
442 }
443 
444 store_one(scaling_min_freq, min);
445 store_one(scaling_max_freq, max);
446 
447 /**
448  * show_cpuinfo_cur_freq - current CPU frequency as detected by hardware
449  */
450 static ssize_t show_cpuinfo_cur_freq(struct cpufreq_policy *policy,
451 					char *buf)
452 {
453 	unsigned int cur_freq = __cpufreq_get(policy->cpu);
454 	if (!cur_freq)
455 		return sprintf(buf, "<unknown>");
456 	return sprintf(buf, "%u\n", cur_freq);
457 }
458 
459 /**
460  * show_scaling_governor - show the current policy for the specified CPU
461  */
462 static ssize_t show_scaling_governor(struct cpufreq_policy *policy, char *buf)
463 {
464 	if (policy->policy == CPUFREQ_POLICY_POWERSAVE)
465 		return sprintf(buf, "powersave\n");
466 	else if (policy->policy == CPUFREQ_POLICY_PERFORMANCE)
467 		return sprintf(buf, "performance\n");
468 	else if (policy->governor)
469 		return scnprintf(buf, CPUFREQ_NAME_PLEN, "%s\n",
470 				policy->governor->name);
471 	return -EINVAL;
472 }
473 
474 /**
475  * store_scaling_governor - store policy for the specified CPU
476  */
477 static ssize_t store_scaling_governor(struct cpufreq_policy *policy,
478 					const char *buf, size_t count)
479 {
480 	int ret;
481 	char	str_governor[16];
482 	struct cpufreq_policy new_policy;
483 
484 	ret = cpufreq_get_policy(&new_policy, policy->cpu);
485 	if (ret)
486 		return ret;
487 
488 	ret = sscanf(buf, "%15s", str_governor);
489 	if (ret != 1)
490 		return -EINVAL;
491 
492 	if (cpufreq_parse_governor(str_governor, &new_policy.policy,
493 						&new_policy.governor))
494 		return -EINVAL;
495 
496 	/*
497 	 * Do not use cpufreq_set_policy here or the user_policy.max
498 	 * will be wrongly overridden
499 	 */
500 	ret = __cpufreq_set_policy(policy, &new_policy);
501 
502 	policy->user_policy.policy = policy->policy;
503 	policy->user_policy.governor = policy->governor;
504 
505 	if (ret)
506 		return ret;
507 	else
508 		return count;
509 }
510 
511 /**
512  * show_scaling_driver - show the cpufreq driver currently loaded
513  */
514 static ssize_t show_scaling_driver(struct cpufreq_policy *policy, char *buf)
515 {
516 	return scnprintf(buf, CPUFREQ_NAME_PLEN, "%s\n", cpufreq_driver->name);
517 }
518 
519 /**
520  * show_scaling_available_governors - show the available CPUfreq governors
521  */
522 static ssize_t show_scaling_available_governors(struct cpufreq_policy *policy,
523 						char *buf)
524 {
525 	ssize_t i = 0;
526 	struct cpufreq_governor *t;
527 
528 	if (!cpufreq_driver->target) {
529 		i += sprintf(buf, "performance powersave");
530 		goto out;
531 	}
532 
533 	list_for_each_entry(t, &cpufreq_governor_list, governor_list) {
534 		if (i >= (ssize_t) ((PAGE_SIZE / sizeof(char))
535 		    - (CPUFREQ_NAME_LEN + 2)))
536 			goto out;
537 		i += scnprintf(&buf[i], CPUFREQ_NAME_PLEN, "%s ", t->name);
538 	}
539 out:
540 	i += sprintf(&buf[i], "\n");
541 	return i;
542 }
543 
544 ssize_t cpufreq_show_cpus(const struct cpumask *mask, char *buf)
545 {
546 	ssize_t i = 0;
547 	unsigned int cpu;
548 
549 	for_each_cpu(cpu, mask) {
550 		if (i)
551 			i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), " ");
552 		i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), "%u", cpu);
553 		if (i >= (PAGE_SIZE - 5))
554 			break;
555 	}
556 	i += sprintf(&buf[i], "\n");
557 	return i;
558 }
559 EXPORT_SYMBOL_GPL(cpufreq_show_cpus);
560 
561 /**
562  * show_related_cpus - show the CPUs affected by each transition even if
563  * hw coordination is in use
564  */
565 static ssize_t show_related_cpus(struct cpufreq_policy *policy, char *buf)
566 {
567 	return cpufreq_show_cpus(policy->related_cpus, buf);
568 }
569 
570 /**
571  * show_affected_cpus - show the CPUs affected by each transition
572  */
573 static ssize_t show_affected_cpus(struct cpufreq_policy *policy, char *buf)
574 {
575 	return cpufreq_show_cpus(policy->cpus, buf);
576 }
577 
578 static ssize_t store_scaling_setspeed(struct cpufreq_policy *policy,
579 					const char *buf, size_t count)
580 {
581 	unsigned int freq = 0;
582 	unsigned int ret;
583 
584 	if (!policy->governor || !policy->governor->store_setspeed)
585 		return -EINVAL;
586 
587 	ret = sscanf(buf, "%u", &freq);
588 	if (ret != 1)
589 		return -EINVAL;
590 
591 	policy->governor->store_setspeed(policy, freq);
592 
593 	return count;
594 }
595 
596 static ssize_t show_scaling_setspeed(struct cpufreq_policy *policy, char *buf)
597 {
598 	if (!policy->governor || !policy->governor->show_setspeed)
599 		return sprintf(buf, "<unsupported>\n");
600 
601 	return policy->governor->show_setspeed(policy, buf);
602 }
603 
604 /**
605  * show_bios_limit - show the current cpufreq HW/BIOS limitation
606  */
607 static ssize_t show_bios_limit(struct cpufreq_policy *policy, char *buf)
608 {
609 	unsigned int limit;
610 	int ret;
611 	if (cpufreq_driver->bios_limit) {
612 		ret = cpufreq_driver->bios_limit(policy->cpu, &limit);
613 		if (!ret)
614 			return sprintf(buf, "%u\n", limit);
615 	}
616 	return sprintf(buf, "%u\n", policy->cpuinfo.max_freq);
617 }
618 
619 cpufreq_freq_attr_ro_perm(cpuinfo_cur_freq, 0400);
620 cpufreq_freq_attr_ro(cpuinfo_min_freq);
621 cpufreq_freq_attr_ro(cpuinfo_max_freq);
622 cpufreq_freq_attr_ro(cpuinfo_transition_latency);
623 cpufreq_freq_attr_ro(scaling_available_governors);
624 cpufreq_freq_attr_ro(scaling_driver);
625 cpufreq_freq_attr_ro(scaling_cur_freq);
626 cpufreq_freq_attr_ro(bios_limit);
627 cpufreq_freq_attr_ro(related_cpus);
628 cpufreq_freq_attr_ro(affected_cpus);
629 cpufreq_freq_attr_rw(scaling_min_freq);
630 cpufreq_freq_attr_rw(scaling_max_freq);
631 cpufreq_freq_attr_rw(scaling_governor);
632 cpufreq_freq_attr_rw(scaling_setspeed);
633 
634 static struct attribute *default_attrs[] = {
635 	&cpuinfo_min_freq.attr,
636 	&cpuinfo_max_freq.attr,
637 	&cpuinfo_transition_latency.attr,
638 	&scaling_min_freq.attr,
639 	&scaling_max_freq.attr,
640 	&affected_cpus.attr,
641 	&related_cpus.attr,
642 	&scaling_governor.attr,
643 	&scaling_driver.attr,
644 	&scaling_available_governors.attr,
645 	&scaling_setspeed.attr,
646 	NULL
647 };
648 
649 #define to_policy(k) container_of(k, struct cpufreq_policy, kobj)
650 #define to_attr(a) container_of(a, struct freq_attr, attr)
651 
652 static ssize_t show(struct kobject *kobj, struct attribute *attr, char *buf)
653 {
654 	struct cpufreq_policy *policy = to_policy(kobj);
655 	struct freq_attr *fattr = to_attr(attr);
656 	ssize_t ret = -EINVAL;
657 
658 	if (!down_read_trylock(&cpufreq_rwsem))
659 		goto exit;
660 
661 	if (lock_policy_rwsem_read(policy->cpu) < 0)
662 		goto up_read;
663 
664 	if (fattr->show)
665 		ret = fattr->show(policy, buf);
666 	else
667 		ret = -EIO;
668 
669 	unlock_policy_rwsem_read(policy->cpu);
670 
671 up_read:
672 	up_read(&cpufreq_rwsem);
673 exit:
674 	return ret;
675 }
676 
677 static ssize_t store(struct kobject *kobj, struct attribute *attr,
678 		     const char *buf, size_t count)
679 {
680 	struct cpufreq_policy *policy = to_policy(kobj);
681 	struct freq_attr *fattr = to_attr(attr);
682 	ssize_t ret = -EINVAL;
683 
684 	get_online_cpus();
685 
686 	if (!cpu_online(policy->cpu))
687 		goto unlock;
688 
689 	if (!down_read_trylock(&cpufreq_rwsem))
690 		goto unlock;
691 
692 	if (lock_policy_rwsem_write(policy->cpu) < 0)
693 		goto up_read;
694 
695 	if (fattr->store)
696 		ret = fattr->store(policy, buf, count);
697 	else
698 		ret = -EIO;
699 
700 	unlock_policy_rwsem_write(policy->cpu);
701 
702 up_read:
703 	up_read(&cpufreq_rwsem);
704 unlock:
705 	put_online_cpus();
706 
707 	return ret;
708 }
709 
710 static void cpufreq_sysfs_release(struct kobject *kobj)
711 {
712 	struct cpufreq_policy *policy = to_policy(kobj);
713 	pr_debug("last reference is dropped\n");
714 	complete(&policy->kobj_unregister);
715 }
716 
717 static const struct sysfs_ops sysfs_ops = {
718 	.show	= show,
719 	.store	= store,
720 };
721 
722 static struct kobj_type ktype_cpufreq = {
723 	.sysfs_ops	= &sysfs_ops,
724 	.default_attrs	= default_attrs,
725 	.release	= cpufreq_sysfs_release,
726 };
727 
728 struct kobject *cpufreq_global_kobject;
729 EXPORT_SYMBOL(cpufreq_global_kobject);
730 
731 static int cpufreq_global_kobject_usage;
732 
733 int cpufreq_get_global_kobject(void)
734 {
735 	if (!cpufreq_global_kobject_usage++)
736 		return kobject_add(cpufreq_global_kobject,
737 				&cpu_subsys.dev_root->kobj, "%s", "cpufreq");
738 
739 	return 0;
740 }
741 EXPORT_SYMBOL(cpufreq_get_global_kobject);
742 
743 void cpufreq_put_global_kobject(void)
744 {
745 	if (!--cpufreq_global_kobject_usage)
746 		kobject_del(cpufreq_global_kobject);
747 }
748 EXPORT_SYMBOL(cpufreq_put_global_kobject);
749 
750 int cpufreq_sysfs_create_file(const struct attribute *attr)
751 {
752 	int ret = cpufreq_get_global_kobject();
753 
754 	if (!ret) {
755 		ret = sysfs_create_file(cpufreq_global_kobject, attr);
756 		if (ret)
757 			cpufreq_put_global_kobject();
758 	}
759 
760 	return ret;
761 }
762 EXPORT_SYMBOL(cpufreq_sysfs_create_file);
763 
764 void cpufreq_sysfs_remove_file(const struct attribute *attr)
765 {
766 	sysfs_remove_file(cpufreq_global_kobject, attr);
767 	cpufreq_put_global_kobject();
768 }
769 EXPORT_SYMBOL(cpufreq_sysfs_remove_file);
770 
771 /* symlink affected CPUs */
772 static int cpufreq_add_dev_symlink(struct cpufreq_policy *policy)
773 {
774 	unsigned int j;
775 	int ret = 0;
776 
777 	for_each_cpu(j, policy->cpus) {
778 		struct device *cpu_dev;
779 
780 		if (j == policy->cpu)
781 			continue;
782 
783 		pr_debug("Adding link for CPU: %u\n", j);
784 		cpu_dev = get_cpu_device(j);
785 		ret = sysfs_create_link(&cpu_dev->kobj, &policy->kobj,
786 					"cpufreq");
787 		if (ret)
788 			break;
789 	}
790 	return ret;
791 }
792 
793 static int cpufreq_add_dev_interface(struct cpufreq_policy *policy,
794 				     struct device *dev)
795 {
796 	struct freq_attr **drv_attr;
797 	int ret = 0;
798 
799 	/* prepare interface data */
800 	ret = kobject_init_and_add(&policy->kobj, &ktype_cpufreq,
801 				   &dev->kobj, "cpufreq");
802 	if (ret)
803 		return ret;
804 
805 	/* set up files for this cpu device */
806 	drv_attr = cpufreq_driver->attr;
807 	while ((drv_attr) && (*drv_attr)) {
808 		ret = sysfs_create_file(&policy->kobj, &((*drv_attr)->attr));
809 		if (ret)
810 			goto err_out_kobj_put;
811 		drv_attr++;
812 	}
813 	if (cpufreq_driver->get) {
814 		ret = sysfs_create_file(&policy->kobj, &cpuinfo_cur_freq.attr);
815 		if (ret)
816 			goto err_out_kobj_put;
817 	}
818 	if (cpufreq_driver->target) {
819 		ret = sysfs_create_file(&policy->kobj, &scaling_cur_freq.attr);
820 		if (ret)
821 			goto err_out_kobj_put;
822 	}
823 	if (cpufreq_driver->bios_limit) {
824 		ret = sysfs_create_file(&policy->kobj, &bios_limit.attr);
825 		if (ret)
826 			goto err_out_kobj_put;
827 	}
828 
829 	ret = cpufreq_add_dev_symlink(policy);
830 	if (ret)
831 		goto err_out_kobj_put;
832 
833 	return ret;
834 
835 err_out_kobj_put:
836 	kobject_put(&policy->kobj);
837 	wait_for_completion(&policy->kobj_unregister);
838 	return ret;
839 }
840 
841 static void cpufreq_init_policy(struct cpufreq_policy *policy)
842 {
843 	struct cpufreq_policy new_policy;
844 	int ret = 0;
845 
846 	memcpy(&new_policy, policy, sizeof(*policy));
847 	/* assure that the starting sequence is run in __cpufreq_set_policy */
848 	policy->governor = NULL;
849 
850 	/* set default policy */
851 	ret = __cpufreq_set_policy(policy, &new_policy);
852 	policy->user_policy.policy = policy->policy;
853 	policy->user_policy.governor = policy->governor;
854 
855 	if (ret) {
856 		pr_debug("setting policy failed\n");
857 		if (cpufreq_driver->exit)
858 			cpufreq_driver->exit(policy);
859 	}
860 }
861 
862 #ifdef CONFIG_HOTPLUG_CPU
863 static int cpufreq_add_policy_cpu(struct cpufreq_policy *policy,
864 				  unsigned int cpu, struct device *dev,
865 				  bool frozen)
866 {
867 	int ret = 0, has_target = !!cpufreq_driver->target;
868 	unsigned long flags;
869 
870 	if (has_target) {
871 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_STOP);
872 		if (ret) {
873 			pr_err("%s: Failed to stop governor\n", __func__);
874 			return ret;
875 		}
876 	}
877 
878 	lock_policy_rwsem_write(policy->cpu);
879 
880 	write_lock_irqsave(&cpufreq_driver_lock, flags);
881 
882 	cpumask_set_cpu(cpu, policy->cpus);
883 	per_cpu(cpufreq_cpu_data, cpu) = policy;
884 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
885 
886 	unlock_policy_rwsem_write(policy->cpu);
887 
888 	if (has_target) {
889 		if ((ret = __cpufreq_governor(policy, CPUFREQ_GOV_START)) ||
890 			(ret = __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS))) {
891 			pr_err("%s: Failed to start governor\n", __func__);
892 			return ret;
893 		}
894 	}
895 
896 	/* Don't touch sysfs links during light-weight init */
897 	if (!frozen)
898 		ret = sysfs_create_link(&dev->kobj, &policy->kobj, "cpufreq");
899 
900 	return ret;
901 }
902 #endif
903 
904 static struct cpufreq_policy *cpufreq_policy_restore(unsigned int cpu)
905 {
906 	struct cpufreq_policy *policy;
907 	unsigned long flags;
908 
909 	read_lock_irqsave(&cpufreq_driver_lock, flags);
910 
911 	policy = per_cpu(cpufreq_cpu_data_fallback, cpu);
912 
913 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
914 
915 	return policy;
916 }
917 
918 static struct cpufreq_policy *cpufreq_policy_alloc(void)
919 {
920 	struct cpufreq_policy *policy;
921 
922 	policy = kzalloc(sizeof(*policy), GFP_KERNEL);
923 	if (!policy)
924 		return NULL;
925 
926 	if (!alloc_cpumask_var(&policy->cpus, GFP_KERNEL))
927 		goto err_free_policy;
928 
929 	if (!zalloc_cpumask_var(&policy->related_cpus, GFP_KERNEL))
930 		goto err_free_cpumask;
931 
932 	INIT_LIST_HEAD(&policy->policy_list);
933 	return policy;
934 
935 err_free_cpumask:
936 	free_cpumask_var(policy->cpus);
937 err_free_policy:
938 	kfree(policy);
939 
940 	return NULL;
941 }
942 
943 static void cpufreq_policy_free(struct cpufreq_policy *policy)
944 {
945 	free_cpumask_var(policy->related_cpus);
946 	free_cpumask_var(policy->cpus);
947 	kfree(policy);
948 }
949 
950 static void update_policy_cpu(struct cpufreq_policy *policy, unsigned int cpu)
951 {
952 	if (cpu == policy->cpu)
953 		return;
954 
955 	policy->last_cpu = policy->cpu;
956 	policy->cpu = cpu;
957 
958 #ifdef CONFIG_CPU_FREQ_TABLE
959 	cpufreq_frequency_table_update_policy_cpu(policy);
960 #endif
961 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
962 			CPUFREQ_UPDATE_POLICY_CPU, policy);
963 }
964 
965 static int __cpufreq_add_dev(struct device *dev, struct subsys_interface *sif,
966 			     bool frozen)
967 {
968 	unsigned int j, cpu = dev->id;
969 	int ret = -ENOMEM;
970 	struct cpufreq_policy *policy;
971 	unsigned long flags;
972 #ifdef CONFIG_HOTPLUG_CPU
973 	struct cpufreq_policy *tpolicy;
974 	struct cpufreq_governor *gov;
975 #endif
976 
977 	if (cpu_is_offline(cpu))
978 		return 0;
979 
980 	pr_debug("adding CPU %u\n", cpu);
981 
982 #ifdef CONFIG_SMP
983 	/* check whether a different CPU already registered this
984 	 * CPU because it is in the same boat. */
985 	policy = cpufreq_cpu_get(cpu);
986 	if (unlikely(policy)) {
987 		cpufreq_cpu_put(policy);
988 		return 0;
989 	}
990 #endif
991 
992 	if (!down_read_trylock(&cpufreq_rwsem))
993 		return 0;
994 
995 #ifdef CONFIG_HOTPLUG_CPU
996 	/* Check if this cpu was hot-unplugged earlier and has siblings */
997 	read_lock_irqsave(&cpufreq_driver_lock, flags);
998 	list_for_each_entry(tpolicy, &cpufreq_policy_list, policy_list) {
999 		if (cpumask_test_cpu(cpu, tpolicy->related_cpus)) {
1000 			read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1001 			ret = cpufreq_add_policy_cpu(tpolicy, cpu, dev, frozen);
1002 			up_read(&cpufreq_rwsem);
1003 			return ret;
1004 		}
1005 	}
1006 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1007 #endif
1008 
1009 	if (frozen)
1010 		/* Restore the saved policy when doing light-weight init */
1011 		policy = cpufreq_policy_restore(cpu);
1012 	else
1013 		policy = cpufreq_policy_alloc();
1014 
1015 	if (!policy)
1016 		goto nomem_out;
1017 
1018 
1019 	/*
1020 	 * In the resume path, since we restore a saved policy, the assignment
1021 	 * to policy->cpu is like an update of the existing policy, rather than
1022 	 * the creation of a brand new one. So we need to perform this update
1023 	 * by invoking update_policy_cpu().
1024 	 */
1025 	if (frozen && cpu != policy->cpu)
1026 		update_policy_cpu(policy, cpu);
1027 	else
1028 		policy->cpu = cpu;
1029 
1030 	policy->governor = CPUFREQ_DEFAULT_GOVERNOR;
1031 	cpumask_copy(policy->cpus, cpumask_of(cpu));
1032 
1033 	init_completion(&policy->kobj_unregister);
1034 	INIT_WORK(&policy->update, handle_update);
1035 
1036 	/* call driver. From then on the cpufreq must be able
1037 	 * to accept all calls to ->verify and ->setpolicy for this CPU
1038 	 */
1039 	ret = cpufreq_driver->init(policy);
1040 	if (ret) {
1041 		pr_debug("initialization failed\n");
1042 		goto err_set_policy_cpu;
1043 	}
1044 
1045 	/* related cpus should atleast have policy->cpus */
1046 	cpumask_or(policy->related_cpus, policy->related_cpus, policy->cpus);
1047 
1048 	/*
1049 	 * affected cpus must always be the one, which are online. We aren't
1050 	 * managing offline cpus here.
1051 	 */
1052 	cpumask_and(policy->cpus, policy->cpus, cpu_online_mask);
1053 
1054 	policy->user_policy.min = policy->min;
1055 	policy->user_policy.max = policy->max;
1056 
1057 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1058 				     CPUFREQ_START, policy);
1059 
1060 #ifdef CONFIG_HOTPLUG_CPU
1061 	gov = __find_governor(per_cpu(cpufreq_cpu_governor, cpu));
1062 	if (gov) {
1063 		policy->governor = gov;
1064 		pr_debug("Restoring governor %s for cpu %d\n",
1065 		       policy->governor->name, cpu);
1066 	}
1067 #endif
1068 
1069 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1070 	for_each_cpu(j, policy->cpus)
1071 		per_cpu(cpufreq_cpu_data, j) = policy;
1072 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1073 
1074 	if (!frozen) {
1075 		ret = cpufreq_add_dev_interface(policy, dev);
1076 		if (ret)
1077 			goto err_out_unregister;
1078 	}
1079 
1080 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1081 	list_add(&policy->policy_list, &cpufreq_policy_list);
1082 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1083 
1084 	cpufreq_init_policy(policy);
1085 
1086 	kobject_uevent(&policy->kobj, KOBJ_ADD);
1087 	up_read(&cpufreq_rwsem);
1088 
1089 	pr_debug("initialization complete\n");
1090 
1091 	return 0;
1092 
1093 err_out_unregister:
1094 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1095 	for_each_cpu(j, policy->cpus)
1096 		per_cpu(cpufreq_cpu_data, j) = NULL;
1097 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1098 
1099 err_set_policy_cpu:
1100 	cpufreq_policy_free(policy);
1101 nomem_out:
1102 	up_read(&cpufreq_rwsem);
1103 
1104 	return ret;
1105 }
1106 
1107 /**
1108  * cpufreq_add_dev - add a CPU device
1109  *
1110  * Adds the cpufreq interface for a CPU device.
1111  *
1112  * The Oracle says: try running cpufreq registration/unregistration concurrently
1113  * with with cpu hotplugging and all hell will break loose. Tried to clean this
1114  * mess up, but more thorough testing is needed. - Mathieu
1115  */
1116 static int cpufreq_add_dev(struct device *dev, struct subsys_interface *sif)
1117 {
1118 	return __cpufreq_add_dev(dev, sif, false);
1119 }
1120 
1121 static int cpufreq_nominate_new_policy_cpu(struct cpufreq_policy *policy,
1122 					   unsigned int old_cpu, bool frozen)
1123 {
1124 	struct device *cpu_dev;
1125 	int ret;
1126 
1127 	/* first sibling now owns the new sysfs dir */
1128 	cpu_dev = get_cpu_device(cpumask_first(policy->cpus));
1129 
1130 	/* Don't touch sysfs files during light-weight tear-down */
1131 	if (frozen)
1132 		return cpu_dev->id;
1133 
1134 	sysfs_remove_link(&cpu_dev->kobj, "cpufreq");
1135 	ret = kobject_move(&policy->kobj, &cpu_dev->kobj);
1136 	if (ret) {
1137 		pr_err("%s: Failed to move kobj: %d", __func__, ret);
1138 
1139 		WARN_ON(lock_policy_rwsem_write(old_cpu));
1140 		cpumask_set_cpu(old_cpu, policy->cpus);
1141 		unlock_policy_rwsem_write(old_cpu);
1142 
1143 		ret = sysfs_create_link(&cpu_dev->kobj, &policy->kobj,
1144 					"cpufreq");
1145 
1146 		return -EINVAL;
1147 	}
1148 
1149 	return cpu_dev->id;
1150 }
1151 
1152 static int __cpufreq_remove_dev_prepare(struct device *dev,
1153 					struct subsys_interface *sif,
1154 					bool frozen)
1155 {
1156 	unsigned int cpu = dev->id, cpus;
1157 	int new_cpu, ret;
1158 	unsigned long flags;
1159 	struct cpufreq_policy *policy;
1160 
1161 	pr_debug("%s: unregistering CPU %u\n", __func__, cpu);
1162 
1163 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1164 
1165 	policy = per_cpu(cpufreq_cpu_data, cpu);
1166 
1167 	/* Save the policy somewhere when doing a light-weight tear-down */
1168 	if (frozen)
1169 		per_cpu(cpufreq_cpu_data_fallback, cpu) = policy;
1170 
1171 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1172 
1173 	if (!policy) {
1174 		pr_debug("%s: No cpu_data found\n", __func__);
1175 		return -EINVAL;
1176 	}
1177 
1178 	if (cpufreq_driver->target) {
1179 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_STOP);
1180 		if (ret) {
1181 			pr_err("%s: Failed to stop governor\n", __func__);
1182 			return ret;
1183 		}
1184 	}
1185 
1186 #ifdef CONFIG_HOTPLUG_CPU
1187 	if (!cpufreq_driver->setpolicy)
1188 		strncpy(per_cpu(cpufreq_cpu_governor, cpu),
1189 			policy->governor->name, CPUFREQ_NAME_LEN);
1190 #endif
1191 
1192 	WARN_ON(lock_policy_rwsem_write(cpu));
1193 	cpus = cpumask_weight(policy->cpus);
1194 
1195 	if (cpus > 1)
1196 		cpumask_clear_cpu(cpu, policy->cpus);
1197 	unlock_policy_rwsem_write(cpu);
1198 
1199 	if (cpu != policy->cpu) {
1200 		if (!frozen)
1201 			sysfs_remove_link(&dev->kobj, "cpufreq");
1202 	} else if (cpus > 1) {
1203 
1204 		new_cpu = cpufreq_nominate_new_policy_cpu(policy, cpu, frozen);
1205 		if (new_cpu >= 0) {
1206 			WARN_ON(lock_policy_rwsem_write(cpu));
1207 			update_policy_cpu(policy, new_cpu);
1208 			unlock_policy_rwsem_write(cpu);
1209 
1210 			if (!frozen) {
1211 				pr_debug("%s: policy Kobject moved to cpu: %d "
1212 					 "from: %d\n",__func__, new_cpu, cpu);
1213 			}
1214 		}
1215 	}
1216 
1217 	return 0;
1218 }
1219 
1220 static int __cpufreq_remove_dev_finish(struct device *dev,
1221 				       struct subsys_interface *sif,
1222 				       bool frozen)
1223 {
1224 	unsigned int cpu = dev->id, cpus;
1225 	int ret;
1226 	unsigned long flags;
1227 	struct cpufreq_policy *policy;
1228 	struct kobject *kobj;
1229 	struct completion *cmp;
1230 
1231 	read_lock_irqsave(&cpufreq_driver_lock, flags);
1232 	policy = per_cpu(cpufreq_cpu_data, cpu);
1233 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1234 
1235 	if (!policy) {
1236 		pr_debug("%s: No cpu_data found\n", __func__);
1237 		return -EINVAL;
1238 	}
1239 
1240 	lock_policy_rwsem_read(cpu);
1241 	cpus = cpumask_weight(policy->cpus);
1242 	unlock_policy_rwsem_read(cpu);
1243 
1244 	/* If cpu is last user of policy, free policy */
1245 	if (cpus == 1) {
1246 		if (cpufreq_driver->target) {
1247 			ret = __cpufreq_governor(policy,
1248 					CPUFREQ_GOV_POLICY_EXIT);
1249 			if (ret) {
1250 				pr_err("%s: Failed to exit governor\n",
1251 						__func__);
1252 				return ret;
1253 			}
1254 		}
1255 
1256 		if (!frozen) {
1257 			lock_policy_rwsem_read(cpu);
1258 			kobj = &policy->kobj;
1259 			cmp = &policy->kobj_unregister;
1260 			unlock_policy_rwsem_read(cpu);
1261 			kobject_put(kobj);
1262 
1263 			/*
1264 			 * We need to make sure that the underlying kobj is
1265 			 * actually not referenced anymore by anybody before we
1266 			 * proceed with unloading.
1267 			 */
1268 			pr_debug("waiting for dropping of refcount\n");
1269 			wait_for_completion(cmp);
1270 			pr_debug("wait complete\n");
1271 		}
1272 
1273 		/*
1274 		 * Perform the ->exit() even during light-weight tear-down,
1275 		 * since this is a core component, and is essential for the
1276 		 * subsequent light-weight ->init() to succeed.
1277 		 */
1278 		if (cpufreq_driver->exit)
1279 			cpufreq_driver->exit(policy);
1280 
1281 		/* Remove policy from list of active policies */
1282 		write_lock_irqsave(&cpufreq_driver_lock, flags);
1283 		list_del(&policy->policy_list);
1284 		write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1285 
1286 		if (!frozen)
1287 			cpufreq_policy_free(policy);
1288 	} else {
1289 		if (cpufreq_driver->target) {
1290 			if ((ret = __cpufreq_governor(policy, CPUFREQ_GOV_START)) ||
1291 					(ret = __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS))) {
1292 				pr_err("%s: Failed to start governor\n",
1293 						__func__);
1294 				return ret;
1295 			}
1296 		}
1297 	}
1298 
1299 	per_cpu(cpufreq_cpu_data, cpu) = NULL;
1300 	return 0;
1301 }
1302 
1303 /**
1304  * __cpufreq_remove_dev - remove a CPU device
1305  *
1306  * Removes the cpufreq interface for a CPU device.
1307  * Caller should already have policy_rwsem in write mode for this CPU.
1308  * This routine frees the rwsem before returning.
1309  */
1310 static inline int __cpufreq_remove_dev(struct device *dev,
1311 				       struct subsys_interface *sif,
1312 				       bool frozen)
1313 {
1314 	int ret;
1315 
1316 	ret = __cpufreq_remove_dev_prepare(dev, sif, frozen);
1317 
1318 	if (!ret)
1319 		ret = __cpufreq_remove_dev_finish(dev, sif, frozen);
1320 
1321 	return ret;
1322 }
1323 
1324 static int cpufreq_remove_dev(struct device *dev, struct subsys_interface *sif)
1325 {
1326 	unsigned int cpu = dev->id;
1327 	int retval;
1328 
1329 	if (cpu_is_offline(cpu))
1330 		return 0;
1331 
1332 	retval = __cpufreq_remove_dev(dev, sif, false);
1333 	return retval;
1334 }
1335 
1336 static void handle_update(struct work_struct *work)
1337 {
1338 	struct cpufreq_policy *policy =
1339 		container_of(work, struct cpufreq_policy, update);
1340 	unsigned int cpu = policy->cpu;
1341 	pr_debug("handle_update for cpu %u called\n", cpu);
1342 	cpufreq_update_policy(cpu);
1343 }
1344 
1345 /**
1346  *	cpufreq_out_of_sync - If actual and saved CPU frequency differs, we're
1347  *	in deep trouble.
1348  *	@cpu: cpu number
1349  *	@old_freq: CPU frequency the kernel thinks the CPU runs at
1350  *	@new_freq: CPU frequency the CPU actually runs at
1351  *
1352  *	We adjust to current frequency first, and need to clean up later.
1353  *	So either call to cpufreq_update_policy() or schedule handle_update()).
1354  */
1355 static void cpufreq_out_of_sync(unsigned int cpu, unsigned int old_freq,
1356 				unsigned int new_freq)
1357 {
1358 	struct cpufreq_policy *policy;
1359 	struct cpufreq_freqs freqs;
1360 	unsigned long flags;
1361 
1362 	pr_debug("Warning: CPU frequency out of sync: cpufreq and timing "
1363 	       "core thinks of %u, is %u kHz.\n", old_freq, new_freq);
1364 
1365 	freqs.old = old_freq;
1366 	freqs.new = new_freq;
1367 
1368 	read_lock_irqsave(&cpufreq_driver_lock, flags);
1369 	policy = per_cpu(cpufreq_cpu_data, cpu);
1370 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1371 
1372 	cpufreq_notify_transition(policy, &freqs, CPUFREQ_PRECHANGE);
1373 	cpufreq_notify_transition(policy, &freqs, CPUFREQ_POSTCHANGE);
1374 }
1375 
1376 /**
1377  * cpufreq_quick_get - get the CPU frequency (in kHz) from policy->cur
1378  * @cpu: CPU number
1379  *
1380  * This is the last known freq, without actually getting it from the driver.
1381  * Return value will be same as what is shown in scaling_cur_freq in sysfs.
1382  */
1383 unsigned int cpufreq_quick_get(unsigned int cpu)
1384 {
1385 	struct cpufreq_policy *policy;
1386 	unsigned int ret_freq = 0;
1387 
1388 	if (cpufreq_driver && cpufreq_driver->setpolicy && cpufreq_driver->get)
1389 		return cpufreq_driver->get(cpu);
1390 
1391 	policy = cpufreq_cpu_get(cpu);
1392 	if (policy) {
1393 		ret_freq = policy->cur;
1394 		cpufreq_cpu_put(policy);
1395 	}
1396 
1397 	return ret_freq;
1398 }
1399 EXPORT_SYMBOL(cpufreq_quick_get);
1400 
1401 /**
1402  * cpufreq_quick_get_max - get the max reported CPU frequency for this CPU
1403  * @cpu: CPU number
1404  *
1405  * Just return the max possible frequency for a given CPU.
1406  */
1407 unsigned int cpufreq_quick_get_max(unsigned int cpu)
1408 {
1409 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1410 	unsigned int ret_freq = 0;
1411 
1412 	if (policy) {
1413 		ret_freq = policy->max;
1414 		cpufreq_cpu_put(policy);
1415 	}
1416 
1417 	return ret_freq;
1418 }
1419 EXPORT_SYMBOL(cpufreq_quick_get_max);
1420 
1421 static unsigned int __cpufreq_get(unsigned int cpu)
1422 {
1423 	struct cpufreq_policy *policy = per_cpu(cpufreq_cpu_data, cpu);
1424 	unsigned int ret_freq = 0;
1425 
1426 	if (!cpufreq_driver->get)
1427 		return ret_freq;
1428 
1429 	ret_freq = cpufreq_driver->get(cpu);
1430 
1431 	if (ret_freq && policy->cur &&
1432 		!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
1433 		/* verify no discrepancy between actual and
1434 					saved value exists */
1435 		if (unlikely(ret_freq != policy->cur)) {
1436 			cpufreq_out_of_sync(cpu, policy->cur, ret_freq);
1437 			schedule_work(&policy->update);
1438 		}
1439 	}
1440 
1441 	return ret_freq;
1442 }
1443 
1444 /**
1445  * cpufreq_get - get the current CPU frequency (in kHz)
1446  * @cpu: CPU number
1447  *
1448  * Get the CPU current (static) CPU frequency
1449  */
1450 unsigned int cpufreq_get(unsigned int cpu)
1451 {
1452 	unsigned int ret_freq = 0;
1453 
1454 	if (!down_read_trylock(&cpufreq_rwsem))
1455 		return 0;
1456 
1457 	if (unlikely(lock_policy_rwsem_read(cpu)))
1458 		goto out_policy;
1459 
1460 	ret_freq = __cpufreq_get(cpu);
1461 
1462 	unlock_policy_rwsem_read(cpu);
1463 
1464 out_policy:
1465 	up_read(&cpufreq_rwsem);
1466 
1467 	return ret_freq;
1468 }
1469 EXPORT_SYMBOL(cpufreq_get);
1470 
1471 static struct subsys_interface cpufreq_interface = {
1472 	.name		= "cpufreq",
1473 	.subsys		= &cpu_subsys,
1474 	.add_dev	= cpufreq_add_dev,
1475 	.remove_dev	= cpufreq_remove_dev,
1476 };
1477 
1478 /**
1479  * cpufreq_bp_suspend - Prepare the boot CPU for system suspend.
1480  *
1481  * This function is only executed for the boot processor.  The other CPUs
1482  * have been put offline by means of CPU hotplug.
1483  */
1484 static int cpufreq_bp_suspend(void)
1485 {
1486 	int ret = 0;
1487 
1488 	int cpu = smp_processor_id();
1489 	struct cpufreq_policy *policy;
1490 
1491 	pr_debug("suspending cpu %u\n", cpu);
1492 
1493 	/* If there's no policy for the boot CPU, we have nothing to do. */
1494 	policy = cpufreq_cpu_get(cpu);
1495 	if (!policy)
1496 		return 0;
1497 
1498 	if (cpufreq_driver->suspend) {
1499 		ret = cpufreq_driver->suspend(policy);
1500 		if (ret)
1501 			printk(KERN_ERR "cpufreq: suspend failed in ->suspend "
1502 					"step on CPU %u\n", policy->cpu);
1503 	}
1504 
1505 	cpufreq_cpu_put(policy);
1506 	return ret;
1507 }
1508 
1509 /**
1510  * cpufreq_bp_resume - Restore proper frequency handling of the boot CPU.
1511  *
1512  *	1.) resume CPUfreq hardware support (cpufreq_driver->resume())
1513  *	2.) schedule call cpufreq_update_policy() ASAP as interrupts are
1514  *	    restored. It will verify that the current freq is in sync with
1515  *	    what we believe it to be. This is a bit later than when it
1516  *	    should be, but nonethteless it's better than calling
1517  *	    cpufreq_driver->get() here which might re-enable interrupts...
1518  *
1519  * This function is only executed for the boot CPU.  The other CPUs have not
1520  * been turned on yet.
1521  */
1522 static void cpufreq_bp_resume(void)
1523 {
1524 	int ret = 0;
1525 
1526 	int cpu = smp_processor_id();
1527 	struct cpufreq_policy *policy;
1528 
1529 	pr_debug("resuming cpu %u\n", cpu);
1530 
1531 	/* If there's no policy for the boot CPU, we have nothing to do. */
1532 	policy = cpufreq_cpu_get(cpu);
1533 	if (!policy)
1534 		return;
1535 
1536 	if (cpufreq_driver->resume) {
1537 		ret = cpufreq_driver->resume(policy);
1538 		if (ret) {
1539 			printk(KERN_ERR "cpufreq: resume failed in ->resume "
1540 					"step on CPU %u\n", policy->cpu);
1541 			goto fail;
1542 		}
1543 	}
1544 
1545 	schedule_work(&policy->update);
1546 
1547 fail:
1548 	cpufreq_cpu_put(policy);
1549 }
1550 
1551 static struct syscore_ops cpufreq_syscore_ops = {
1552 	.suspend	= cpufreq_bp_suspend,
1553 	.resume		= cpufreq_bp_resume,
1554 };
1555 
1556 /**
1557  *	cpufreq_get_current_driver - return current driver's name
1558  *
1559  *	Return the name string of the currently loaded cpufreq driver
1560  *	or NULL, if none.
1561  */
1562 const char *cpufreq_get_current_driver(void)
1563 {
1564 	if (cpufreq_driver)
1565 		return cpufreq_driver->name;
1566 
1567 	return NULL;
1568 }
1569 EXPORT_SYMBOL_GPL(cpufreq_get_current_driver);
1570 
1571 /*********************************************************************
1572  *                     NOTIFIER LISTS INTERFACE                      *
1573  *********************************************************************/
1574 
1575 /**
1576  *	cpufreq_register_notifier - register a driver with cpufreq
1577  *	@nb: notifier function to register
1578  *      @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1579  *
1580  *	Add a driver to one of two lists: either a list of drivers that
1581  *      are notified about clock rate changes (once before and once after
1582  *      the transition), or a list of drivers that are notified about
1583  *      changes in cpufreq policy.
1584  *
1585  *	This function may sleep, and has the same return conditions as
1586  *	blocking_notifier_chain_register.
1587  */
1588 int cpufreq_register_notifier(struct notifier_block *nb, unsigned int list)
1589 {
1590 	int ret;
1591 
1592 	if (cpufreq_disabled())
1593 		return -EINVAL;
1594 
1595 	WARN_ON(!init_cpufreq_transition_notifier_list_called);
1596 
1597 	switch (list) {
1598 	case CPUFREQ_TRANSITION_NOTIFIER:
1599 		ret = srcu_notifier_chain_register(
1600 				&cpufreq_transition_notifier_list, nb);
1601 		break;
1602 	case CPUFREQ_POLICY_NOTIFIER:
1603 		ret = blocking_notifier_chain_register(
1604 				&cpufreq_policy_notifier_list, nb);
1605 		break;
1606 	default:
1607 		ret = -EINVAL;
1608 	}
1609 
1610 	return ret;
1611 }
1612 EXPORT_SYMBOL(cpufreq_register_notifier);
1613 
1614 /**
1615  *	cpufreq_unregister_notifier - unregister a driver with cpufreq
1616  *	@nb: notifier block to be unregistered
1617  *	@list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1618  *
1619  *	Remove a driver from the CPU frequency notifier list.
1620  *
1621  *	This function may sleep, and has the same return conditions as
1622  *	blocking_notifier_chain_unregister.
1623  */
1624 int cpufreq_unregister_notifier(struct notifier_block *nb, unsigned int list)
1625 {
1626 	int ret;
1627 
1628 	if (cpufreq_disabled())
1629 		return -EINVAL;
1630 
1631 	switch (list) {
1632 	case CPUFREQ_TRANSITION_NOTIFIER:
1633 		ret = srcu_notifier_chain_unregister(
1634 				&cpufreq_transition_notifier_list, nb);
1635 		break;
1636 	case CPUFREQ_POLICY_NOTIFIER:
1637 		ret = blocking_notifier_chain_unregister(
1638 				&cpufreq_policy_notifier_list, nb);
1639 		break;
1640 	default:
1641 		ret = -EINVAL;
1642 	}
1643 
1644 	return ret;
1645 }
1646 EXPORT_SYMBOL(cpufreq_unregister_notifier);
1647 
1648 
1649 /*********************************************************************
1650  *                              GOVERNORS                            *
1651  *********************************************************************/
1652 
1653 int __cpufreq_driver_target(struct cpufreq_policy *policy,
1654 			    unsigned int target_freq,
1655 			    unsigned int relation)
1656 {
1657 	int retval = -EINVAL;
1658 	unsigned int old_target_freq = target_freq;
1659 
1660 	if (cpufreq_disabled())
1661 		return -ENODEV;
1662 
1663 	/* Make sure that target_freq is within supported range */
1664 	if (target_freq > policy->max)
1665 		target_freq = policy->max;
1666 	if (target_freq < policy->min)
1667 		target_freq = policy->min;
1668 
1669 	pr_debug("target for CPU %u: %u kHz, relation %u, requested %u kHz\n",
1670 			policy->cpu, target_freq, relation, old_target_freq);
1671 
1672 	if (target_freq == policy->cur)
1673 		return 0;
1674 
1675 	if (cpufreq_driver->target)
1676 		retval = cpufreq_driver->target(policy, target_freq, relation);
1677 
1678 	return retval;
1679 }
1680 EXPORT_SYMBOL_GPL(__cpufreq_driver_target);
1681 
1682 int cpufreq_driver_target(struct cpufreq_policy *policy,
1683 			  unsigned int target_freq,
1684 			  unsigned int relation)
1685 {
1686 	int ret = -EINVAL;
1687 
1688 	if (unlikely(lock_policy_rwsem_write(policy->cpu)))
1689 		goto fail;
1690 
1691 	ret = __cpufreq_driver_target(policy, target_freq, relation);
1692 
1693 	unlock_policy_rwsem_write(policy->cpu);
1694 
1695 fail:
1696 	return ret;
1697 }
1698 EXPORT_SYMBOL_GPL(cpufreq_driver_target);
1699 
1700 /*
1701  * when "event" is CPUFREQ_GOV_LIMITS
1702  */
1703 
1704 static int __cpufreq_governor(struct cpufreq_policy *policy,
1705 					unsigned int event)
1706 {
1707 	int ret;
1708 
1709 	/* Only must be defined when default governor is known to have latency
1710 	   restrictions, like e.g. conservative or ondemand.
1711 	   That this is the case is already ensured in Kconfig
1712 	*/
1713 #ifdef CONFIG_CPU_FREQ_GOV_PERFORMANCE
1714 	struct cpufreq_governor *gov = &cpufreq_gov_performance;
1715 #else
1716 	struct cpufreq_governor *gov = NULL;
1717 #endif
1718 
1719 	if (policy->governor->max_transition_latency &&
1720 	    policy->cpuinfo.transition_latency >
1721 	    policy->governor->max_transition_latency) {
1722 		if (!gov)
1723 			return -EINVAL;
1724 		else {
1725 			printk(KERN_WARNING "%s governor failed, too long"
1726 			       " transition latency of HW, fallback"
1727 			       " to %s governor\n",
1728 			       policy->governor->name,
1729 			       gov->name);
1730 			policy->governor = gov;
1731 		}
1732 	}
1733 
1734 	if (event == CPUFREQ_GOV_POLICY_INIT)
1735 		if (!try_module_get(policy->governor->owner))
1736 			return -EINVAL;
1737 
1738 	pr_debug("__cpufreq_governor for CPU %u, event %u\n",
1739 						policy->cpu, event);
1740 
1741 	mutex_lock(&cpufreq_governor_lock);
1742 	if ((policy->governor_enabled && event == CPUFREQ_GOV_START)
1743 	    || (!policy->governor_enabled
1744 	    && (event == CPUFREQ_GOV_LIMITS || event == CPUFREQ_GOV_STOP))) {
1745 		mutex_unlock(&cpufreq_governor_lock);
1746 		return -EBUSY;
1747 	}
1748 
1749 	if (event == CPUFREQ_GOV_STOP)
1750 		policy->governor_enabled = false;
1751 	else if (event == CPUFREQ_GOV_START)
1752 		policy->governor_enabled = true;
1753 
1754 	mutex_unlock(&cpufreq_governor_lock);
1755 
1756 	ret = policy->governor->governor(policy, event);
1757 
1758 	if (!ret) {
1759 		if (event == CPUFREQ_GOV_POLICY_INIT)
1760 			policy->governor->initialized++;
1761 		else if (event == CPUFREQ_GOV_POLICY_EXIT)
1762 			policy->governor->initialized--;
1763 	} else {
1764 		/* Restore original values */
1765 		mutex_lock(&cpufreq_governor_lock);
1766 		if (event == CPUFREQ_GOV_STOP)
1767 			policy->governor_enabled = true;
1768 		else if (event == CPUFREQ_GOV_START)
1769 			policy->governor_enabled = false;
1770 		mutex_unlock(&cpufreq_governor_lock);
1771 	}
1772 
1773 	if (((event == CPUFREQ_GOV_POLICY_INIT) && ret) ||
1774 			((event == CPUFREQ_GOV_POLICY_EXIT) && !ret))
1775 		module_put(policy->governor->owner);
1776 
1777 	return ret;
1778 }
1779 
1780 int cpufreq_register_governor(struct cpufreq_governor *governor)
1781 {
1782 	int err;
1783 
1784 	if (!governor)
1785 		return -EINVAL;
1786 
1787 	if (cpufreq_disabled())
1788 		return -ENODEV;
1789 
1790 	mutex_lock(&cpufreq_governor_mutex);
1791 
1792 	governor->initialized = 0;
1793 	err = -EBUSY;
1794 	if (__find_governor(governor->name) == NULL) {
1795 		err = 0;
1796 		list_add(&governor->governor_list, &cpufreq_governor_list);
1797 	}
1798 
1799 	mutex_unlock(&cpufreq_governor_mutex);
1800 	return err;
1801 }
1802 EXPORT_SYMBOL_GPL(cpufreq_register_governor);
1803 
1804 void cpufreq_unregister_governor(struct cpufreq_governor *governor)
1805 {
1806 #ifdef CONFIG_HOTPLUG_CPU
1807 	int cpu;
1808 #endif
1809 
1810 	if (!governor)
1811 		return;
1812 
1813 	if (cpufreq_disabled())
1814 		return;
1815 
1816 #ifdef CONFIG_HOTPLUG_CPU
1817 	for_each_present_cpu(cpu) {
1818 		if (cpu_online(cpu))
1819 			continue;
1820 		if (!strcmp(per_cpu(cpufreq_cpu_governor, cpu), governor->name))
1821 			strcpy(per_cpu(cpufreq_cpu_governor, cpu), "\0");
1822 	}
1823 #endif
1824 
1825 	mutex_lock(&cpufreq_governor_mutex);
1826 	list_del(&governor->governor_list);
1827 	mutex_unlock(&cpufreq_governor_mutex);
1828 	return;
1829 }
1830 EXPORT_SYMBOL_GPL(cpufreq_unregister_governor);
1831 
1832 
1833 /*********************************************************************
1834  *                          POLICY INTERFACE                         *
1835  *********************************************************************/
1836 
1837 /**
1838  * cpufreq_get_policy - get the current cpufreq_policy
1839  * @policy: struct cpufreq_policy into which the current cpufreq_policy
1840  *	is written
1841  *
1842  * Reads the current cpufreq policy.
1843  */
1844 int cpufreq_get_policy(struct cpufreq_policy *policy, unsigned int cpu)
1845 {
1846 	struct cpufreq_policy *cpu_policy;
1847 	if (!policy)
1848 		return -EINVAL;
1849 
1850 	cpu_policy = cpufreq_cpu_get(cpu);
1851 	if (!cpu_policy)
1852 		return -EINVAL;
1853 
1854 	memcpy(policy, cpu_policy, sizeof(*policy));
1855 
1856 	cpufreq_cpu_put(cpu_policy);
1857 	return 0;
1858 }
1859 EXPORT_SYMBOL(cpufreq_get_policy);
1860 
1861 /*
1862  * data   : current policy.
1863  * policy : policy to be set.
1864  */
1865 static int __cpufreq_set_policy(struct cpufreq_policy *policy,
1866 				struct cpufreq_policy *new_policy)
1867 {
1868 	int ret = 0, failed = 1;
1869 
1870 	pr_debug("setting new policy for CPU %u: %u - %u kHz\n", new_policy->cpu,
1871 		new_policy->min, new_policy->max);
1872 
1873 	memcpy(&new_policy->cpuinfo, &policy->cpuinfo, sizeof(policy->cpuinfo));
1874 
1875 	if (new_policy->min > policy->max || new_policy->max < policy->min) {
1876 		ret = -EINVAL;
1877 		goto error_out;
1878 	}
1879 
1880 	/* verify the cpu speed can be set within this limit */
1881 	ret = cpufreq_driver->verify(new_policy);
1882 	if (ret)
1883 		goto error_out;
1884 
1885 	/* adjust if necessary - all reasons */
1886 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1887 			CPUFREQ_ADJUST, new_policy);
1888 
1889 	/* adjust if necessary - hardware incompatibility*/
1890 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1891 			CPUFREQ_INCOMPATIBLE, new_policy);
1892 
1893 	/*
1894 	 * verify the cpu speed can be set within this limit, which might be
1895 	 * different to the first one
1896 	 */
1897 	ret = cpufreq_driver->verify(new_policy);
1898 	if (ret)
1899 		goto error_out;
1900 
1901 	/* notification of the new policy */
1902 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1903 			CPUFREQ_NOTIFY, new_policy);
1904 
1905 	policy->min = new_policy->min;
1906 	policy->max = new_policy->max;
1907 
1908 	pr_debug("new min and max freqs are %u - %u kHz\n",
1909 					policy->min, policy->max);
1910 
1911 	if (cpufreq_driver->setpolicy) {
1912 		policy->policy = new_policy->policy;
1913 		pr_debug("setting range\n");
1914 		ret = cpufreq_driver->setpolicy(new_policy);
1915 	} else {
1916 		if (new_policy->governor != policy->governor) {
1917 			/* save old, working values */
1918 			struct cpufreq_governor *old_gov = policy->governor;
1919 
1920 			pr_debug("governor switch\n");
1921 
1922 			/* end old governor */
1923 			if (policy->governor) {
1924 				__cpufreq_governor(policy, CPUFREQ_GOV_STOP);
1925 				unlock_policy_rwsem_write(new_policy->cpu);
1926 				__cpufreq_governor(policy,
1927 						CPUFREQ_GOV_POLICY_EXIT);
1928 				lock_policy_rwsem_write(new_policy->cpu);
1929 			}
1930 
1931 			/* start new governor */
1932 			policy->governor = new_policy->governor;
1933 			if (!__cpufreq_governor(policy, CPUFREQ_GOV_POLICY_INIT)) {
1934 				if (!__cpufreq_governor(policy, CPUFREQ_GOV_START)) {
1935 					failed = 0;
1936 				} else {
1937 					unlock_policy_rwsem_write(new_policy->cpu);
1938 					__cpufreq_governor(policy,
1939 							CPUFREQ_GOV_POLICY_EXIT);
1940 					lock_policy_rwsem_write(new_policy->cpu);
1941 				}
1942 			}
1943 
1944 			if (failed) {
1945 				/* new governor failed, so re-start old one */
1946 				pr_debug("starting governor %s failed\n",
1947 							policy->governor->name);
1948 				if (old_gov) {
1949 					policy->governor = old_gov;
1950 					__cpufreq_governor(policy,
1951 							CPUFREQ_GOV_POLICY_INIT);
1952 					__cpufreq_governor(policy,
1953 							   CPUFREQ_GOV_START);
1954 				}
1955 				ret = -EINVAL;
1956 				goto error_out;
1957 			}
1958 			/* might be a policy change, too, so fall through */
1959 		}
1960 		pr_debug("governor: change or update limits\n");
1961 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS);
1962 	}
1963 
1964 error_out:
1965 	return ret;
1966 }
1967 
1968 /**
1969  *	cpufreq_update_policy - re-evaluate an existing cpufreq policy
1970  *	@cpu: CPU which shall be re-evaluated
1971  *
1972  *	Useful for policy notifiers which have different necessities
1973  *	at different times.
1974  */
1975 int cpufreq_update_policy(unsigned int cpu)
1976 {
1977 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1978 	struct cpufreq_policy new_policy;
1979 	int ret;
1980 
1981 	if (!policy) {
1982 		ret = -ENODEV;
1983 		goto no_policy;
1984 	}
1985 
1986 	if (unlikely(lock_policy_rwsem_write(cpu))) {
1987 		ret = -EINVAL;
1988 		goto fail;
1989 	}
1990 
1991 	pr_debug("updating policy for CPU %u\n", cpu);
1992 	memcpy(&new_policy, policy, sizeof(*policy));
1993 	new_policy.min = policy->user_policy.min;
1994 	new_policy.max = policy->user_policy.max;
1995 	new_policy.policy = policy->user_policy.policy;
1996 	new_policy.governor = policy->user_policy.governor;
1997 
1998 	/*
1999 	 * BIOS might change freq behind our back
2000 	 * -> ask driver for current freq and notify governors about a change
2001 	 */
2002 	if (cpufreq_driver->get) {
2003 		new_policy.cur = cpufreq_driver->get(cpu);
2004 		if (!policy->cur) {
2005 			pr_debug("Driver did not initialize current freq");
2006 			policy->cur = new_policy.cur;
2007 		} else {
2008 			if (policy->cur != new_policy.cur && cpufreq_driver->target)
2009 				cpufreq_out_of_sync(cpu, policy->cur,
2010 								new_policy.cur);
2011 		}
2012 	}
2013 
2014 	ret = __cpufreq_set_policy(policy, &new_policy);
2015 
2016 	unlock_policy_rwsem_write(cpu);
2017 
2018 fail:
2019 	cpufreq_cpu_put(policy);
2020 no_policy:
2021 	return ret;
2022 }
2023 EXPORT_SYMBOL(cpufreq_update_policy);
2024 
2025 static int cpufreq_cpu_callback(struct notifier_block *nfb,
2026 					unsigned long action, void *hcpu)
2027 {
2028 	unsigned int cpu = (unsigned long)hcpu;
2029 	struct device *dev;
2030 	bool frozen = false;
2031 
2032 	dev = get_cpu_device(cpu);
2033 	if (dev) {
2034 
2035 		if (action & CPU_TASKS_FROZEN)
2036 			frozen = true;
2037 
2038 		switch (action & ~CPU_TASKS_FROZEN) {
2039 		case CPU_ONLINE:
2040 			__cpufreq_add_dev(dev, NULL, frozen);
2041 			cpufreq_update_policy(cpu);
2042 			break;
2043 
2044 		case CPU_DOWN_PREPARE:
2045 			__cpufreq_remove_dev_prepare(dev, NULL, frozen);
2046 			break;
2047 
2048 		case CPU_POST_DEAD:
2049 			__cpufreq_remove_dev_finish(dev, NULL, frozen);
2050 			break;
2051 
2052 		case CPU_DOWN_FAILED:
2053 			__cpufreq_add_dev(dev, NULL, frozen);
2054 			break;
2055 		}
2056 	}
2057 	return NOTIFY_OK;
2058 }
2059 
2060 static struct notifier_block __refdata cpufreq_cpu_notifier = {
2061 	.notifier_call = cpufreq_cpu_callback,
2062 };
2063 
2064 /*********************************************************************
2065  *               REGISTER / UNREGISTER CPUFREQ DRIVER                *
2066  *********************************************************************/
2067 
2068 /**
2069  * cpufreq_register_driver - register a CPU Frequency driver
2070  * @driver_data: A struct cpufreq_driver containing the values#
2071  * submitted by the CPU Frequency driver.
2072  *
2073  * Registers a CPU Frequency driver to this core code. This code
2074  * returns zero on success, -EBUSY when another driver got here first
2075  * (and isn't unregistered in the meantime).
2076  *
2077  */
2078 int cpufreq_register_driver(struct cpufreq_driver *driver_data)
2079 {
2080 	unsigned long flags;
2081 	int ret;
2082 
2083 	if (cpufreq_disabled())
2084 		return -ENODEV;
2085 
2086 	if (!driver_data || !driver_data->verify || !driver_data->init ||
2087 	    ((!driver_data->setpolicy) && (!driver_data->target)))
2088 		return -EINVAL;
2089 
2090 	pr_debug("trying to register driver %s\n", driver_data->name);
2091 
2092 	if (driver_data->setpolicy)
2093 		driver_data->flags |= CPUFREQ_CONST_LOOPS;
2094 
2095 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2096 	if (cpufreq_driver) {
2097 		write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2098 		return -EBUSY;
2099 	}
2100 	cpufreq_driver = driver_data;
2101 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2102 
2103 	ret = subsys_interface_register(&cpufreq_interface);
2104 	if (ret)
2105 		goto err_null_driver;
2106 
2107 	if (!(cpufreq_driver->flags & CPUFREQ_STICKY)) {
2108 		int i;
2109 		ret = -ENODEV;
2110 
2111 		/* check for at least one working CPU */
2112 		for (i = 0; i < nr_cpu_ids; i++)
2113 			if (cpu_possible(i) && per_cpu(cpufreq_cpu_data, i)) {
2114 				ret = 0;
2115 				break;
2116 			}
2117 
2118 		/* if all ->init() calls failed, unregister */
2119 		if (ret) {
2120 			pr_debug("no CPU initialized for driver %s\n",
2121 							driver_data->name);
2122 			goto err_if_unreg;
2123 		}
2124 	}
2125 
2126 	register_hotcpu_notifier(&cpufreq_cpu_notifier);
2127 	pr_debug("driver %s up and running\n", driver_data->name);
2128 
2129 	return 0;
2130 err_if_unreg:
2131 	subsys_interface_unregister(&cpufreq_interface);
2132 err_null_driver:
2133 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2134 	cpufreq_driver = NULL;
2135 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2136 	return ret;
2137 }
2138 EXPORT_SYMBOL_GPL(cpufreq_register_driver);
2139 
2140 /**
2141  * cpufreq_unregister_driver - unregister the current CPUFreq driver
2142  *
2143  * Unregister the current CPUFreq driver. Only call this if you have
2144  * the right to do so, i.e. if you have succeeded in initialising before!
2145  * Returns zero if successful, and -EINVAL if the cpufreq_driver is
2146  * currently not initialised.
2147  */
2148 int cpufreq_unregister_driver(struct cpufreq_driver *driver)
2149 {
2150 	unsigned long flags;
2151 
2152 	if (!cpufreq_driver || (driver != cpufreq_driver))
2153 		return -EINVAL;
2154 
2155 	pr_debug("unregistering driver %s\n", driver->name);
2156 
2157 	subsys_interface_unregister(&cpufreq_interface);
2158 	unregister_hotcpu_notifier(&cpufreq_cpu_notifier);
2159 
2160 	down_write(&cpufreq_rwsem);
2161 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2162 
2163 	cpufreq_driver = NULL;
2164 
2165 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2166 	up_write(&cpufreq_rwsem);
2167 
2168 	return 0;
2169 }
2170 EXPORT_SYMBOL_GPL(cpufreq_unregister_driver);
2171 
2172 static int __init cpufreq_core_init(void)
2173 {
2174 	int cpu;
2175 
2176 	if (cpufreq_disabled())
2177 		return -ENODEV;
2178 
2179 	for_each_possible_cpu(cpu)
2180 		init_rwsem(&per_cpu(cpu_policy_rwsem, cpu));
2181 
2182 	cpufreq_global_kobject = kobject_create();
2183 	BUG_ON(!cpufreq_global_kobject);
2184 	register_syscore_ops(&cpufreq_syscore_ops);
2185 
2186 	return 0;
2187 }
2188 core_initcall(cpufreq_core_init);
2189