xref: /linux/drivers/cpufreq/cpufreq.c (revision 0f29b46d49b0ca50536632c6a33986c3171f5ea1)
1 /*
2  *  linux/drivers/cpufreq/cpufreq.c
3  *
4  *  Copyright (C) 2001 Russell King
5  *            (C) 2002 - 2003 Dominik Brodowski <linux@brodo.de>
6  *            (C) 2013 Viresh Kumar <viresh.kumar@linaro.org>
7  *
8  *  Oct 2005 - Ashok Raj <ashok.raj@intel.com>
9  *	Added handling for CPU hotplug
10  *  Feb 2006 - Jacob Shin <jacob.shin@amd.com>
11  *	Fix handling for CPU hotplug -- affected CPUs
12  *
13  * This program is free software; you can redistribute it and/or modify
14  * it under the terms of the GNU General Public License version 2 as
15  * published by the Free Software Foundation.
16  */
17 
18 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
19 
20 #include <linux/cpu.h>
21 #include <linux/cpufreq.h>
22 #include <linux/delay.h>
23 #include <linux/device.h>
24 #include <linux/init.h>
25 #include <linux/kernel_stat.h>
26 #include <linux/module.h>
27 #include <linux/mutex.h>
28 #include <linux/slab.h>
29 #include <linux/suspend.h>
30 #include <linux/tick.h>
31 #include <trace/events/power.h>
32 
33 /**
34  * The "cpufreq driver" - the arch- or hardware-dependent low
35  * level driver of CPUFreq support, and its spinlock. This lock
36  * also protects the cpufreq_cpu_data array.
37  */
38 static struct cpufreq_driver *cpufreq_driver;
39 static DEFINE_PER_CPU(struct cpufreq_policy *, cpufreq_cpu_data);
40 static DEFINE_PER_CPU(struct cpufreq_policy *, cpufreq_cpu_data_fallback);
41 static DEFINE_RWLOCK(cpufreq_driver_lock);
42 DEFINE_MUTEX(cpufreq_governor_lock);
43 static LIST_HEAD(cpufreq_policy_list);
44 
45 /* This one keeps track of the previously set governor of a removed CPU */
46 static DEFINE_PER_CPU(char[CPUFREQ_NAME_LEN], cpufreq_cpu_governor);
47 
48 /* Flag to suspend/resume CPUFreq governors */
49 static bool cpufreq_suspended;
50 
51 static inline bool has_target(void)
52 {
53 	return cpufreq_driver->target_index || cpufreq_driver->target;
54 }
55 
56 /*
57  * rwsem to guarantee that cpufreq driver module doesn't unload during critical
58  * sections
59  */
60 static DECLARE_RWSEM(cpufreq_rwsem);
61 
62 /* internal prototypes */
63 static int __cpufreq_governor(struct cpufreq_policy *policy,
64 		unsigned int event);
65 static unsigned int __cpufreq_get(unsigned int cpu);
66 static void handle_update(struct work_struct *work);
67 
68 /**
69  * Two notifier lists: the "policy" list is involved in the
70  * validation process for a new CPU frequency policy; the
71  * "transition" list for kernel code that needs to handle
72  * changes to devices when the CPU clock speed changes.
73  * The mutex locks both lists.
74  */
75 static BLOCKING_NOTIFIER_HEAD(cpufreq_policy_notifier_list);
76 static struct srcu_notifier_head cpufreq_transition_notifier_list;
77 
78 static bool init_cpufreq_transition_notifier_list_called;
79 static int __init init_cpufreq_transition_notifier_list(void)
80 {
81 	srcu_init_notifier_head(&cpufreq_transition_notifier_list);
82 	init_cpufreq_transition_notifier_list_called = true;
83 	return 0;
84 }
85 pure_initcall(init_cpufreq_transition_notifier_list);
86 
87 static int off __read_mostly;
88 static int cpufreq_disabled(void)
89 {
90 	return off;
91 }
92 void disable_cpufreq(void)
93 {
94 	off = 1;
95 }
96 static LIST_HEAD(cpufreq_governor_list);
97 static DEFINE_MUTEX(cpufreq_governor_mutex);
98 
99 bool have_governor_per_policy(void)
100 {
101 	return !!(cpufreq_driver->flags & CPUFREQ_HAVE_GOVERNOR_PER_POLICY);
102 }
103 EXPORT_SYMBOL_GPL(have_governor_per_policy);
104 
105 struct kobject *get_governor_parent_kobj(struct cpufreq_policy *policy)
106 {
107 	if (have_governor_per_policy())
108 		return &policy->kobj;
109 	else
110 		return cpufreq_global_kobject;
111 }
112 EXPORT_SYMBOL_GPL(get_governor_parent_kobj);
113 
114 static inline u64 get_cpu_idle_time_jiffy(unsigned int cpu, u64 *wall)
115 {
116 	u64 idle_time;
117 	u64 cur_wall_time;
118 	u64 busy_time;
119 
120 	cur_wall_time = jiffies64_to_cputime64(get_jiffies_64());
121 
122 	busy_time = kcpustat_cpu(cpu).cpustat[CPUTIME_USER];
123 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_SYSTEM];
124 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_IRQ];
125 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_SOFTIRQ];
126 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_STEAL];
127 	busy_time += kcpustat_cpu(cpu).cpustat[CPUTIME_NICE];
128 
129 	idle_time = cur_wall_time - busy_time;
130 	if (wall)
131 		*wall = cputime_to_usecs(cur_wall_time);
132 
133 	return cputime_to_usecs(idle_time);
134 }
135 
136 u64 get_cpu_idle_time(unsigned int cpu, u64 *wall, int io_busy)
137 {
138 	u64 idle_time = get_cpu_idle_time_us(cpu, io_busy ? wall : NULL);
139 
140 	if (idle_time == -1ULL)
141 		return get_cpu_idle_time_jiffy(cpu, wall);
142 	else if (!io_busy)
143 		idle_time += get_cpu_iowait_time_us(cpu, wall);
144 
145 	return idle_time;
146 }
147 EXPORT_SYMBOL_GPL(get_cpu_idle_time);
148 
149 /*
150  * This is a generic cpufreq init() routine which can be used by cpufreq
151  * drivers of SMP systems. It will do following:
152  * - validate & show freq table passed
153  * - set policies transition latency
154  * - policy->cpus with all possible CPUs
155  */
156 int cpufreq_generic_init(struct cpufreq_policy *policy,
157 		struct cpufreq_frequency_table *table,
158 		unsigned int transition_latency)
159 {
160 	int ret;
161 
162 	ret = cpufreq_table_validate_and_show(policy, table);
163 	if (ret) {
164 		pr_err("%s: invalid frequency table: %d\n", __func__, ret);
165 		return ret;
166 	}
167 
168 	policy->cpuinfo.transition_latency = transition_latency;
169 
170 	/*
171 	 * The driver only supports the SMP configuartion where all processors
172 	 * share the clock and voltage and clock.
173 	 */
174 	cpumask_setall(policy->cpus);
175 
176 	return 0;
177 }
178 EXPORT_SYMBOL_GPL(cpufreq_generic_init);
179 
180 unsigned int cpufreq_generic_get(unsigned int cpu)
181 {
182 	struct cpufreq_policy *policy = per_cpu(cpufreq_cpu_data, cpu);
183 
184 	if (!policy || IS_ERR(policy->clk)) {
185 		pr_err("%s: No %s associated to cpu: %d\n",
186 		       __func__, policy ? "clk" : "policy", cpu);
187 		return 0;
188 	}
189 
190 	return clk_get_rate(policy->clk) / 1000;
191 }
192 EXPORT_SYMBOL_GPL(cpufreq_generic_get);
193 
194 /* Only for cpufreq core internal use */
195 struct cpufreq_policy *cpufreq_cpu_get_raw(unsigned int cpu)
196 {
197 	return per_cpu(cpufreq_cpu_data, cpu);
198 }
199 
200 struct cpufreq_policy *cpufreq_cpu_get(unsigned int cpu)
201 {
202 	struct cpufreq_policy *policy = NULL;
203 	unsigned long flags;
204 
205 	if (cpufreq_disabled() || (cpu >= nr_cpu_ids))
206 		return NULL;
207 
208 	if (!down_read_trylock(&cpufreq_rwsem))
209 		return NULL;
210 
211 	/* get the cpufreq driver */
212 	read_lock_irqsave(&cpufreq_driver_lock, flags);
213 
214 	if (cpufreq_driver) {
215 		/* get the CPU */
216 		policy = per_cpu(cpufreq_cpu_data, cpu);
217 		if (policy)
218 			kobject_get(&policy->kobj);
219 	}
220 
221 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
222 
223 	if (!policy)
224 		up_read(&cpufreq_rwsem);
225 
226 	return policy;
227 }
228 EXPORT_SYMBOL_GPL(cpufreq_cpu_get);
229 
230 void cpufreq_cpu_put(struct cpufreq_policy *policy)
231 {
232 	if (cpufreq_disabled())
233 		return;
234 
235 	kobject_put(&policy->kobj);
236 	up_read(&cpufreq_rwsem);
237 }
238 EXPORT_SYMBOL_GPL(cpufreq_cpu_put);
239 
240 /*********************************************************************
241  *            EXTERNALLY AFFECTING FREQUENCY CHANGES                 *
242  *********************************************************************/
243 
244 /**
245  * adjust_jiffies - adjust the system "loops_per_jiffy"
246  *
247  * This function alters the system "loops_per_jiffy" for the clock
248  * speed change. Note that loops_per_jiffy cannot be updated on SMP
249  * systems as each CPU might be scaled differently. So, use the arch
250  * per-CPU loops_per_jiffy value wherever possible.
251  */
252 #ifndef CONFIG_SMP
253 static unsigned long l_p_j_ref;
254 static unsigned int l_p_j_ref_freq;
255 
256 static void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
257 {
258 	if (ci->flags & CPUFREQ_CONST_LOOPS)
259 		return;
260 
261 	if (!l_p_j_ref_freq) {
262 		l_p_j_ref = loops_per_jiffy;
263 		l_p_j_ref_freq = ci->old;
264 		pr_debug("saving %lu as reference value for loops_per_jiffy; freq is %u kHz\n",
265 			 l_p_j_ref, l_p_j_ref_freq);
266 	}
267 	if (val == CPUFREQ_POSTCHANGE && ci->old != ci->new) {
268 		loops_per_jiffy = cpufreq_scale(l_p_j_ref, l_p_j_ref_freq,
269 								ci->new);
270 		pr_debug("scaling loops_per_jiffy to %lu for frequency %u kHz\n",
271 			 loops_per_jiffy, ci->new);
272 	}
273 }
274 #else
275 static inline void adjust_jiffies(unsigned long val, struct cpufreq_freqs *ci)
276 {
277 	return;
278 }
279 #endif
280 
281 static void __cpufreq_notify_transition(struct cpufreq_policy *policy,
282 		struct cpufreq_freqs *freqs, unsigned int state)
283 {
284 	BUG_ON(irqs_disabled());
285 
286 	if (cpufreq_disabled())
287 		return;
288 
289 	freqs->flags = cpufreq_driver->flags;
290 	pr_debug("notification %u of frequency transition to %u kHz\n",
291 		 state, freqs->new);
292 
293 	switch (state) {
294 
295 	case CPUFREQ_PRECHANGE:
296 		/* detect if the driver reported a value as "old frequency"
297 		 * which is not equal to what the cpufreq core thinks is
298 		 * "old frequency".
299 		 */
300 		if (!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
301 			if ((policy) && (policy->cpu == freqs->cpu) &&
302 			    (policy->cur) && (policy->cur != freqs->old)) {
303 				pr_debug("Warning: CPU frequency is %u, cpufreq assumed %u kHz\n",
304 					 freqs->old, policy->cur);
305 				freqs->old = policy->cur;
306 			}
307 		}
308 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
309 				CPUFREQ_PRECHANGE, freqs);
310 		adjust_jiffies(CPUFREQ_PRECHANGE, freqs);
311 		break;
312 
313 	case CPUFREQ_POSTCHANGE:
314 		adjust_jiffies(CPUFREQ_POSTCHANGE, freqs);
315 		pr_debug("FREQ: %lu - CPU: %lu\n",
316 			 (unsigned long)freqs->new, (unsigned long)freqs->cpu);
317 		trace_cpu_frequency(freqs->new, freqs->cpu);
318 		srcu_notifier_call_chain(&cpufreq_transition_notifier_list,
319 				CPUFREQ_POSTCHANGE, freqs);
320 		if (likely(policy) && likely(policy->cpu == freqs->cpu))
321 			policy->cur = freqs->new;
322 		break;
323 	}
324 }
325 
326 /**
327  * cpufreq_notify_transition - call notifier chain and adjust_jiffies
328  * on frequency transition.
329  *
330  * This function calls the transition notifiers and the "adjust_jiffies"
331  * function. It is called twice on all CPU frequency changes that have
332  * external effects.
333  */
334 static void cpufreq_notify_transition(struct cpufreq_policy *policy,
335 		struct cpufreq_freqs *freqs, unsigned int state)
336 {
337 	for_each_cpu(freqs->cpu, policy->cpus)
338 		__cpufreq_notify_transition(policy, freqs, state);
339 }
340 
341 /* Do post notifications when there are chances that transition has failed */
342 static void cpufreq_notify_post_transition(struct cpufreq_policy *policy,
343 		struct cpufreq_freqs *freqs, int transition_failed)
344 {
345 	cpufreq_notify_transition(policy, freqs, CPUFREQ_POSTCHANGE);
346 	if (!transition_failed)
347 		return;
348 
349 	swap(freqs->old, freqs->new);
350 	cpufreq_notify_transition(policy, freqs, CPUFREQ_PRECHANGE);
351 	cpufreq_notify_transition(policy, freqs, CPUFREQ_POSTCHANGE);
352 }
353 
354 void cpufreq_freq_transition_begin(struct cpufreq_policy *policy,
355 		struct cpufreq_freqs *freqs)
356 {
357 
358 	/*
359 	 * Catch double invocations of _begin() which lead to self-deadlock.
360 	 * ASYNC_NOTIFICATION drivers are left out because the cpufreq core
361 	 * doesn't invoke _begin() on their behalf, and hence the chances of
362 	 * double invocations are very low. Moreover, there are scenarios
363 	 * where these checks can emit false-positive warnings in these
364 	 * drivers; so we avoid that by skipping them altogether.
365 	 */
366 	WARN_ON(!(cpufreq_driver->flags & CPUFREQ_ASYNC_NOTIFICATION)
367 				&& current == policy->transition_task);
368 
369 wait:
370 	wait_event(policy->transition_wait, !policy->transition_ongoing);
371 
372 	spin_lock(&policy->transition_lock);
373 
374 	if (unlikely(policy->transition_ongoing)) {
375 		spin_unlock(&policy->transition_lock);
376 		goto wait;
377 	}
378 
379 	policy->transition_ongoing = true;
380 	policy->transition_task = current;
381 
382 	spin_unlock(&policy->transition_lock);
383 
384 	cpufreq_notify_transition(policy, freqs, CPUFREQ_PRECHANGE);
385 }
386 EXPORT_SYMBOL_GPL(cpufreq_freq_transition_begin);
387 
388 void cpufreq_freq_transition_end(struct cpufreq_policy *policy,
389 		struct cpufreq_freqs *freqs, int transition_failed)
390 {
391 	if (unlikely(WARN_ON(!policy->transition_ongoing)))
392 		return;
393 
394 	cpufreq_notify_post_transition(policy, freqs, transition_failed);
395 
396 	policy->transition_ongoing = false;
397 	policy->transition_task = NULL;
398 
399 	wake_up(&policy->transition_wait);
400 }
401 EXPORT_SYMBOL_GPL(cpufreq_freq_transition_end);
402 
403 
404 /*********************************************************************
405  *                          SYSFS INTERFACE                          *
406  *********************************************************************/
407 static ssize_t show_boost(struct kobject *kobj,
408 				 struct attribute *attr, char *buf)
409 {
410 	return sprintf(buf, "%d\n", cpufreq_driver->boost_enabled);
411 }
412 
413 static ssize_t store_boost(struct kobject *kobj, struct attribute *attr,
414 				  const char *buf, size_t count)
415 {
416 	int ret, enable;
417 
418 	ret = sscanf(buf, "%d", &enable);
419 	if (ret != 1 || enable < 0 || enable > 1)
420 		return -EINVAL;
421 
422 	if (cpufreq_boost_trigger_state(enable)) {
423 		pr_err("%s: Cannot %s BOOST!\n",
424 		       __func__, enable ? "enable" : "disable");
425 		return -EINVAL;
426 	}
427 
428 	pr_debug("%s: cpufreq BOOST %s\n",
429 		 __func__, enable ? "enabled" : "disabled");
430 
431 	return count;
432 }
433 define_one_global_rw(boost);
434 
435 static struct cpufreq_governor *__find_governor(const char *str_governor)
436 {
437 	struct cpufreq_governor *t;
438 
439 	list_for_each_entry(t, &cpufreq_governor_list, governor_list)
440 		if (!strnicmp(str_governor, t->name, CPUFREQ_NAME_LEN))
441 			return t;
442 
443 	return NULL;
444 }
445 
446 /**
447  * cpufreq_parse_governor - parse a governor string
448  */
449 static int cpufreq_parse_governor(char *str_governor, unsigned int *policy,
450 				struct cpufreq_governor **governor)
451 {
452 	int err = -EINVAL;
453 
454 	if (!cpufreq_driver)
455 		goto out;
456 
457 	if (cpufreq_driver->setpolicy) {
458 		if (!strnicmp(str_governor, "performance", CPUFREQ_NAME_LEN)) {
459 			*policy = CPUFREQ_POLICY_PERFORMANCE;
460 			err = 0;
461 		} else if (!strnicmp(str_governor, "powersave",
462 						CPUFREQ_NAME_LEN)) {
463 			*policy = CPUFREQ_POLICY_POWERSAVE;
464 			err = 0;
465 		}
466 	} else if (has_target()) {
467 		struct cpufreq_governor *t;
468 
469 		mutex_lock(&cpufreq_governor_mutex);
470 
471 		t = __find_governor(str_governor);
472 
473 		if (t == NULL) {
474 			int ret;
475 
476 			mutex_unlock(&cpufreq_governor_mutex);
477 			ret = request_module("cpufreq_%s", str_governor);
478 			mutex_lock(&cpufreq_governor_mutex);
479 
480 			if (ret == 0)
481 				t = __find_governor(str_governor);
482 		}
483 
484 		if (t != NULL) {
485 			*governor = t;
486 			err = 0;
487 		}
488 
489 		mutex_unlock(&cpufreq_governor_mutex);
490 	}
491 out:
492 	return err;
493 }
494 
495 /**
496  * cpufreq_per_cpu_attr_read() / show_##file_name() -
497  * print out cpufreq information
498  *
499  * Write out information from cpufreq_driver->policy[cpu]; object must be
500  * "unsigned int".
501  */
502 
503 #define show_one(file_name, object)			\
504 static ssize_t show_##file_name				\
505 (struct cpufreq_policy *policy, char *buf)		\
506 {							\
507 	return sprintf(buf, "%u\n", policy->object);	\
508 }
509 
510 show_one(cpuinfo_min_freq, cpuinfo.min_freq);
511 show_one(cpuinfo_max_freq, cpuinfo.max_freq);
512 show_one(cpuinfo_transition_latency, cpuinfo.transition_latency);
513 show_one(scaling_min_freq, min);
514 show_one(scaling_max_freq, max);
515 show_one(scaling_cur_freq, cur);
516 
517 static int cpufreq_set_policy(struct cpufreq_policy *policy,
518 				struct cpufreq_policy *new_policy);
519 
520 /**
521  * cpufreq_per_cpu_attr_write() / store_##file_name() - sysfs write access
522  */
523 #define store_one(file_name, object)			\
524 static ssize_t store_##file_name					\
525 (struct cpufreq_policy *policy, const char *buf, size_t count)		\
526 {									\
527 	int ret;							\
528 	struct cpufreq_policy new_policy;				\
529 									\
530 	ret = cpufreq_get_policy(&new_policy, policy->cpu);		\
531 	if (ret)							\
532 		return -EINVAL;						\
533 									\
534 	ret = sscanf(buf, "%u", &new_policy.object);			\
535 	if (ret != 1)							\
536 		return -EINVAL;						\
537 									\
538 	ret = cpufreq_set_policy(policy, &new_policy);		\
539 	policy->user_policy.object = policy->object;			\
540 									\
541 	return ret ? ret : count;					\
542 }
543 
544 store_one(scaling_min_freq, min);
545 store_one(scaling_max_freq, max);
546 
547 /**
548  * show_cpuinfo_cur_freq - current CPU frequency as detected by hardware
549  */
550 static ssize_t show_cpuinfo_cur_freq(struct cpufreq_policy *policy,
551 					char *buf)
552 {
553 	unsigned int cur_freq = __cpufreq_get(policy->cpu);
554 	if (!cur_freq)
555 		return sprintf(buf, "<unknown>");
556 	return sprintf(buf, "%u\n", cur_freq);
557 }
558 
559 /**
560  * show_scaling_governor - show the current policy for the specified CPU
561  */
562 static ssize_t show_scaling_governor(struct cpufreq_policy *policy, char *buf)
563 {
564 	if (policy->policy == CPUFREQ_POLICY_POWERSAVE)
565 		return sprintf(buf, "powersave\n");
566 	else if (policy->policy == CPUFREQ_POLICY_PERFORMANCE)
567 		return sprintf(buf, "performance\n");
568 	else if (policy->governor)
569 		return scnprintf(buf, CPUFREQ_NAME_PLEN, "%s\n",
570 				policy->governor->name);
571 	return -EINVAL;
572 }
573 
574 /**
575  * store_scaling_governor - store policy for the specified CPU
576  */
577 static ssize_t store_scaling_governor(struct cpufreq_policy *policy,
578 					const char *buf, size_t count)
579 {
580 	int ret;
581 	char	str_governor[16];
582 	struct cpufreq_policy new_policy;
583 
584 	ret = cpufreq_get_policy(&new_policy, policy->cpu);
585 	if (ret)
586 		return ret;
587 
588 	ret = sscanf(buf, "%15s", str_governor);
589 	if (ret != 1)
590 		return -EINVAL;
591 
592 	if (cpufreq_parse_governor(str_governor, &new_policy.policy,
593 						&new_policy.governor))
594 		return -EINVAL;
595 
596 	ret = cpufreq_set_policy(policy, &new_policy);
597 
598 	policy->user_policy.policy = policy->policy;
599 	policy->user_policy.governor = policy->governor;
600 
601 	if (ret)
602 		return ret;
603 	else
604 		return count;
605 }
606 
607 /**
608  * show_scaling_driver - show the cpufreq driver currently loaded
609  */
610 static ssize_t show_scaling_driver(struct cpufreq_policy *policy, char *buf)
611 {
612 	return scnprintf(buf, CPUFREQ_NAME_PLEN, "%s\n", cpufreq_driver->name);
613 }
614 
615 /**
616  * show_scaling_available_governors - show the available CPUfreq governors
617  */
618 static ssize_t show_scaling_available_governors(struct cpufreq_policy *policy,
619 						char *buf)
620 {
621 	ssize_t i = 0;
622 	struct cpufreq_governor *t;
623 
624 	if (!has_target()) {
625 		i += sprintf(buf, "performance powersave");
626 		goto out;
627 	}
628 
629 	list_for_each_entry(t, &cpufreq_governor_list, governor_list) {
630 		if (i >= (ssize_t) ((PAGE_SIZE / sizeof(char))
631 		    - (CPUFREQ_NAME_LEN + 2)))
632 			goto out;
633 		i += scnprintf(&buf[i], CPUFREQ_NAME_PLEN, "%s ", t->name);
634 	}
635 out:
636 	i += sprintf(&buf[i], "\n");
637 	return i;
638 }
639 
640 ssize_t cpufreq_show_cpus(const struct cpumask *mask, char *buf)
641 {
642 	ssize_t i = 0;
643 	unsigned int cpu;
644 
645 	for_each_cpu(cpu, mask) {
646 		if (i)
647 			i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), " ");
648 		i += scnprintf(&buf[i], (PAGE_SIZE - i - 2), "%u", cpu);
649 		if (i >= (PAGE_SIZE - 5))
650 			break;
651 	}
652 	i += sprintf(&buf[i], "\n");
653 	return i;
654 }
655 EXPORT_SYMBOL_GPL(cpufreq_show_cpus);
656 
657 /**
658  * show_related_cpus - show the CPUs affected by each transition even if
659  * hw coordination is in use
660  */
661 static ssize_t show_related_cpus(struct cpufreq_policy *policy, char *buf)
662 {
663 	return cpufreq_show_cpus(policy->related_cpus, buf);
664 }
665 
666 /**
667  * show_affected_cpus - show the CPUs affected by each transition
668  */
669 static ssize_t show_affected_cpus(struct cpufreq_policy *policy, char *buf)
670 {
671 	return cpufreq_show_cpus(policy->cpus, buf);
672 }
673 
674 static ssize_t store_scaling_setspeed(struct cpufreq_policy *policy,
675 					const char *buf, size_t count)
676 {
677 	unsigned int freq = 0;
678 	unsigned int ret;
679 
680 	if (!policy->governor || !policy->governor->store_setspeed)
681 		return -EINVAL;
682 
683 	ret = sscanf(buf, "%u", &freq);
684 	if (ret != 1)
685 		return -EINVAL;
686 
687 	policy->governor->store_setspeed(policy, freq);
688 
689 	return count;
690 }
691 
692 static ssize_t show_scaling_setspeed(struct cpufreq_policy *policy, char *buf)
693 {
694 	if (!policy->governor || !policy->governor->show_setspeed)
695 		return sprintf(buf, "<unsupported>\n");
696 
697 	return policy->governor->show_setspeed(policy, buf);
698 }
699 
700 /**
701  * show_bios_limit - show the current cpufreq HW/BIOS limitation
702  */
703 static ssize_t show_bios_limit(struct cpufreq_policy *policy, char *buf)
704 {
705 	unsigned int limit;
706 	int ret;
707 	if (cpufreq_driver->bios_limit) {
708 		ret = cpufreq_driver->bios_limit(policy->cpu, &limit);
709 		if (!ret)
710 			return sprintf(buf, "%u\n", limit);
711 	}
712 	return sprintf(buf, "%u\n", policy->cpuinfo.max_freq);
713 }
714 
715 cpufreq_freq_attr_ro_perm(cpuinfo_cur_freq, 0400);
716 cpufreq_freq_attr_ro(cpuinfo_min_freq);
717 cpufreq_freq_attr_ro(cpuinfo_max_freq);
718 cpufreq_freq_attr_ro(cpuinfo_transition_latency);
719 cpufreq_freq_attr_ro(scaling_available_governors);
720 cpufreq_freq_attr_ro(scaling_driver);
721 cpufreq_freq_attr_ro(scaling_cur_freq);
722 cpufreq_freq_attr_ro(bios_limit);
723 cpufreq_freq_attr_ro(related_cpus);
724 cpufreq_freq_attr_ro(affected_cpus);
725 cpufreq_freq_attr_rw(scaling_min_freq);
726 cpufreq_freq_attr_rw(scaling_max_freq);
727 cpufreq_freq_attr_rw(scaling_governor);
728 cpufreq_freq_attr_rw(scaling_setspeed);
729 
730 static struct attribute *default_attrs[] = {
731 	&cpuinfo_min_freq.attr,
732 	&cpuinfo_max_freq.attr,
733 	&cpuinfo_transition_latency.attr,
734 	&scaling_min_freq.attr,
735 	&scaling_max_freq.attr,
736 	&affected_cpus.attr,
737 	&related_cpus.attr,
738 	&scaling_governor.attr,
739 	&scaling_driver.attr,
740 	&scaling_available_governors.attr,
741 	&scaling_setspeed.attr,
742 	NULL
743 };
744 
745 #define to_policy(k) container_of(k, struct cpufreq_policy, kobj)
746 #define to_attr(a) container_of(a, struct freq_attr, attr)
747 
748 static ssize_t show(struct kobject *kobj, struct attribute *attr, char *buf)
749 {
750 	struct cpufreq_policy *policy = to_policy(kobj);
751 	struct freq_attr *fattr = to_attr(attr);
752 	ssize_t ret;
753 
754 	if (!down_read_trylock(&cpufreq_rwsem))
755 		return -EINVAL;
756 
757 	down_read(&policy->rwsem);
758 
759 	if (fattr->show)
760 		ret = fattr->show(policy, buf);
761 	else
762 		ret = -EIO;
763 
764 	up_read(&policy->rwsem);
765 	up_read(&cpufreq_rwsem);
766 
767 	return ret;
768 }
769 
770 static ssize_t store(struct kobject *kobj, struct attribute *attr,
771 		     const char *buf, size_t count)
772 {
773 	struct cpufreq_policy *policy = to_policy(kobj);
774 	struct freq_attr *fattr = to_attr(attr);
775 	ssize_t ret = -EINVAL;
776 
777 	get_online_cpus();
778 
779 	if (!cpu_online(policy->cpu))
780 		goto unlock;
781 
782 	if (!down_read_trylock(&cpufreq_rwsem))
783 		goto unlock;
784 
785 	down_write(&policy->rwsem);
786 
787 	if (fattr->store)
788 		ret = fattr->store(policy, buf, count);
789 	else
790 		ret = -EIO;
791 
792 	up_write(&policy->rwsem);
793 
794 	up_read(&cpufreq_rwsem);
795 unlock:
796 	put_online_cpus();
797 
798 	return ret;
799 }
800 
801 static void cpufreq_sysfs_release(struct kobject *kobj)
802 {
803 	struct cpufreq_policy *policy = to_policy(kobj);
804 	pr_debug("last reference is dropped\n");
805 	complete(&policy->kobj_unregister);
806 }
807 
808 static const struct sysfs_ops sysfs_ops = {
809 	.show	= show,
810 	.store	= store,
811 };
812 
813 static struct kobj_type ktype_cpufreq = {
814 	.sysfs_ops	= &sysfs_ops,
815 	.default_attrs	= default_attrs,
816 	.release	= cpufreq_sysfs_release,
817 };
818 
819 struct kobject *cpufreq_global_kobject;
820 EXPORT_SYMBOL(cpufreq_global_kobject);
821 
822 static int cpufreq_global_kobject_usage;
823 
824 int cpufreq_get_global_kobject(void)
825 {
826 	if (!cpufreq_global_kobject_usage++)
827 		return kobject_add(cpufreq_global_kobject,
828 				&cpu_subsys.dev_root->kobj, "%s", "cpufreq");
829 
830 	return 0;
831 }
832 EXPORT_SYMBOL(cpufreq_get_global_kobject);
833 
834 void cpufreq_put_global_kobject(void)
835 {
836 	if (!--cpufreq_global_kobject_usage)
837 		kobject_del(cpufreq_global_kobject);
838 }
839 EXPORT_SYMBOL(cpufreq_put_global_kobject);
840 
841 int cpufreq_sysfs_create_file(const struct attribute *attr)
842 {
843 	int ret = cpufreq_get_global_kobject();
844 
845 	if (!ret) {
846 		ret = sysfs_create_file(cpufreq_global_kobject, attr);
847 		if (ret)
848 			cpufreq_put_global_kobject();
849 	}
850 
851 	return ret;
852 }
853 EXPORT_SYMBOL(cpufreq_sysfs_create_file);
854 
855 void cpufreq_sysfs_remove_file(const struct attribute *attr)
856 {
857 	sysfs_remove_file(cpufreq_global_kobject, attr);
858 	cpufreq_put_global_kobject();
859 }
860 EXPORT_SYMBOL(cpufreq_sysfs_remove_file);
861 
862 /* symlink affected CPUs */
863 static int cpufreq_add_dev_symlink(struct cpufreq_policy *policy)
864 {
865 	unsigned int j;
866 	int ret = 0;
867 
868 	for_each_cpu(j, policy->cpus) {
869 		struct device *cpu_dev;
870 
871 		if (j == policy->cpu)
872 			continue;
873 
874 		pr_debug("Adding link for CPU: %u\n", j);
875 		cpu_dev = get_cpu_device(j);
876 		ret = sysfs_create_link(&cpu_dev->kobj, &policy->kobj,
877 					"cpufreq");
878 		if (ret)
879 			break;
880 	}
881 	return ret;
882 }
883 
884 static int cpufreq_add_dev_interface(struct cpufreq_policy *policy,
885 				     struct device *dev)
886 {
887 	struct freq_attr **drv_attr;
888 	int ret = 0;
889 
890 	/* prepare interface data */
891 	ret = kobject_init_and_add(&policy->kobj, &ktype_cpufreq,
892 				   &dev->kobj, "cpufreq");
893 	if (ret)
894 		return ret;
895 
896 	/* set up files for this cpu device */
897 	drv_attr = cpufreq_driver->attr;
898 	while ((drv_attr) && (*drv_attr)) {
899 		ret = sysfs_create_file(&policy->kobj, &((*drv_attr)->attr));
900 		if (ret)
901 			goto err_out_kobj_put;
902 		drv_attr++;
903 	}
904 	if (cpufreq_driver->get) {
905 		ret = sysfs_create_file(&policy->kobj, &cpuinfo_cur_freq.attr);
906 		if (ret)
907 			goto err_out_kobj_put;
908 	}
909 	if (has_target()) {
910 		ret = sysfs_create_file(&policy->kobj, &scaling_cur_freq.attr);
911 		if (ret)
912 			goto err_out_kobj_put;
913 	}
914 	if (cpufreq_driver->bios_limit) {
915 		ret = sysfs_create_file(&policy->kobj, &bios_limit.attr);
916 		if (ret)
917 			goto err_out_kobj_put;
918 	}
919 
920 	ret = cpufreq_add_dev_symlink(policy);
921 	if (ret)
922 		goto err_out_kobj_put;
923 
924 	return ret;
925 
926 err_out_kobj_put:
927 	kobject_put(&policy->kobj);
928 	wait_for_completion(&policy->kobj_unregister);
929 	return ret;
930 }
931 
932 static void cpufreq_init_policy(struct cpufreq_policy *policy)
933 {
934 	struct cpufreq_governor *gov = NULL;
935 	struct cpufreq_policy new_policy;
936 	int ret = 0;
937 
938 	memcpy(&new_policy, policy, sizeof(*policy));
939 
940 	/* Update governor of new_policy to the governor used before hotplug */
941 	gov = __find_governor(per_cpu(cpufreq_cpu_governor, policy->cpu));
942 	if (gov)
943 		pr_debug("Restoring governor %s for cpu %d\n",
944 				policy->governor->name, policy->cpu);
945 	else
946 		gov = CPUFREQ_DEFAULT_GOVERNOR;
947 
948 	new_policy.governor = gov;
949 
950 	/* Use the default policy if its valid. */
951 	if (cpufreq_driver->setpolicy)
952 		cpufreq_parse_governor(gov->name, &new_policy.policy, NULL);
953 
954 	/* set default policy */
955 	ret = cpufreq_set_policy(policy, &new_policy);
956 	if (ret) {
957 		pr_debug("setting policy failed\n");
958 		if (cpufreq_driver->exit)
959 			cpufreq_driver->exit(policy);
960 	}
961 }
962 
963 #ifdef CONFIG_HOTPLUG_CPU
964 static int cpufreq_add_policy_cpu(struct cpufreq_policy *policy,
965 				  unsigned int cpu, struct device *dev)
966 {
967 	int ret = 0;
968 	unsigned long flags;
969 
970 	if (has_target()) {
971 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_STOP);
972 		if (ret) {
973 			pr_err("%s: Failed to stop governor\n", __func__);
974 			return ret;
975 		}
976 	}
977 
978 	down_write(&policy->rwsem);
979 
980 	write_lock_irqsave(&cpufreq_driver_lock, flags);
981 
982 	cpumask_set_cpu(cpu, policy->cpus);
983 	per_cpu(cpufreq_cpu_data, cpu) = policy;
984 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
985 
986 	up_write(&policy->rwsem);
987 
988 	if (has_target()) {
989 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_START);
990 		if (!ret)
991 			ret = __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS);
992 
993 		if (ret) {
994 			pr_err("%s: Failed to start governor\n", __func__);
995 			return ret;
996 		}
997 	}
998 
999 	return sysfs_create_link(&dev->kobj, &policy->kobj, "cpufreq");
1000 }
1001 #endif
1002 
1003 static struct cpufreq_policy *cpufreq_policy_restore(unsigned int cpu)
1004 {
1005 	struct cpufreq_policy *policy;
1006 	unsigned long flags;
1007 
1008 	read_lock_irqsave(&cpufreq_driver_lock, flags);
1009 
1010 	policy = per_cpu(cpufreq_cpu_data_fallback, cpu);
1011 
1012 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1013 
1014 	policy->governor = NULL;
1015 
1016 	return policy;
1017 }
1018 
1019 static struct cpufreq_policy *cpufreq_policy_alloc(void)
1020 {
1021 	struct cpufreq_policy *policy;
1022 
1023 	policy = kzalloc(sizeof(*policy), GFP_KERNEL);
1024 	if (!policy)
1025 		return NULL;
1026 
1027 	if (!alloc_cpumask_var(&policy->cpus, GFP_KERNEL))
1028 		goto err_free_policy;
1029 
1030 	if (!zalloc_cpumask_var(&policy->related_cpus, GFP_KERNEL))
1031 		goto err_free_cpumask;
1032 
1033 	INIT_LIST_HEAD(&policy->policy_list);
1034 	init_rwsem(&policy->rwsem);
1035 	spin_lock_init(&policy->transition_lock);
1036 	init_waitqueue_head(&policy->transition_wait);
1037 
1038 	return policy;
1039 
1040 err_free_cpumask:
1041 	free_cpumask_var(policy->cpus);
1042 err_free_policy:
1043 	kfree(policy);
1044 
1045 	return NULL;
1046 }
1047 
1048 static void cpufreq_policy_put_kobj(struct cpufreq_policy *policy)
1049 {
1050 	struct kobject *kobj;
1051 	struct completion *cmp;
1052 
1053 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1054 			CPUFREQ_REMOVE_POLICY, policy);
1055 
1056 	down_read(&policy->rwsem);
1057 	kobj = &policy->kobj;
1058 	cmp = &policy->kobj_unregister;
1059 	up_read(&policy->rwsem);
1060 	kobject_put(kobj);
1061 
1062 	/*
1063 	 * We need to make sure that the underlying kobj is
1064 	 * actually not referenced anymore by anybody before we
1065 	 * proceed with unloading.
1066 	 */
1067 	pr_debug("waiting for dropping of refcount\n");
1068 	wait_for_completion(cmp);
1069 	pr_debug("wait complete\n");
1070 }
1071 
1072 static void cpufreq_policy_free(struct cpufreq_policy *policy)
1073 {
1074 	free_cpumask_var(policy->related_cpus);
1075 	free_cpumask_var(policy->cpus);
1076 	kfree(policy);
1077 }
1078 
1079 static void update_policy_cpu(struct cpufreq_policy *policy, unsigned int cpu)
1080 {
1081 	if (WARN_ON(cpu == policy->cpu))
1082 		return;
1083 
1084 	down_write(&policy->rwsem);
1085 
1086 	policy->last_cpu = policy->cpu;
1087 	policy->cpu = cpu;
1088 
1089 	up_write(&policy->rwsem);
1090 
1091 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1092 			CPUFREQ_UPDATE_POLICY_CPU, policy);
1093 }
1094 
1095 static int __cpufreq_add_dev(struct device *dev, struct subsys_interface *sif)
1096 {
1097 	unsigned int j, cpu = dev->id;
1098 	int ret = -ENOMEM;
1099 	struct cpufreq_policy *policy;
1100 	unsigned long flags;
1101 	bool recover_policy = cpufreq_suspended;
1102 #ifdef CONFIG_HOTPLUG_CPU
1103 	struct cpufreq_policy *tpolicy;
1104 #endif
1105 
1106 	if (cpu_is_offline(cpu))
1107 		return 0;
1108 
1109 	pr_debug("adding CPU %u\n", cpu);
1110 
1111 #ifdef CONFIG_SMP
1112 	/* check whether a different CPU already registered this
1113 	 * CPU because it is in the same boat. */
1114 	policy = cpufreq_cpu_get(cpu);
1115 	if (unlikely(policy)) {
1116 		cpufreq_cpu_put(policy);
1117 		return 0;
1118 	}
1119 #endif
1120 
1121 	if (!down_read_trylock(&cpufreq_rwsem))
1122 		return 0;
1123 
1124 #ifdef CONFIG_HOTPLUG_CPU
1125 	/* Check if this cpu was hot-unplugged earlier and has siblings */
1126 	read_lock_irqsave(&cpufreq_driver_lock, flags);
1127 	list_for_each_entry(tpolicy, &cpufreq_policy_list, policy_list) {
1128 		if (cpumask_test_cpu(cpu, tpolicy->related_cpus)) {
1129 			read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1130 			ret = cpufreq_add_policy_cpu(tpolicy, cpu, dev);
1131 			up_read(&cpufreq_rwsem);
1132 			return ret;
1133 		}
1134 	}
1135 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1136 #endif
1137 
1138 	/*
1139 	 * Restore the saved policy when doing light-weight init and fall back
1140 	 * to the full init if that fails.
1141 	 */
1142 	policy = recover_policy ? cpufreq_policy_restore(cpu) : NULL;
1143 	if (!policy) {
1144 		recover_policy = false;
1145 		policy = cpufreq_policy_alloc();
1146 		if (!policy)
1147 			goto nomem_out;
1148 	}
1149 
1150 	/*
1151 	 * In the resume path, since we restore a saved policy, the assignment
1152 	 * to policy->cpu is like an update of the existing policy, rather than
1153 	 * the creation of a brand new one. So we need to perform this update
1154 	 * by invoking update_policy_cpu().
1155 	 */
1156 	if (recover_policy && cpu != policy->cpu) {
1157 		update_policy_cpu(policy, cpu);
1158 		WARN_ON(kobject_move(&policy->kobj, &dev->kobj));
1159 	} else {
1160 		policy->cpu = cpu;
1161 	}
1162 
1163 	cpumask_copy(policy->cpus, cpumask_of(cpu));
1164 
1165 	init_completion(&policy->kobj_unregister);
1166 	INIT_WORK(&policy->update, handle_update);
1167 
1168 	/* call driver. From then on the cpufreq must be able
1169 	 * to accept all calls to ->verify and ->setpolicy for this CPU
1170 	 */
1171 	ret = cpufreq_driver->init(policy);
1172 	if (ret) {
1173 		pr_debug("initialization failed\n");
1174 		goto err_set_policy_cpu;
1175 	}
1176 
1177 	/* related cpus should atleast have policy->cpus */
1178 	cpumask_or(policy->related_cpus, policy->related_cpus, policy->cpus);
1179 
1180 	/*
1181 	 * affected cpus must always be the one, which are online. We aren't
1182 	 * managing offline cpus here.
1183 	 */
1184 	cpumask_and(policy->cpus, policy->cpus, cpu_online_mask);
1185 
1186 	if (!recover_policy) {
1187 		policy->user_policy.min = policy->min;
1188 		policy->user_policy.max = policy->max;
1189 	}
1190 
1191 	down_write(&policy->rwsem);
1192 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1193 	for_each_cpu(j, policy->cpus)
1194 		per_cpu(cpufreq_cpu_data, j) = policy;
1195 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1196 
1197 	if (cpufreq_driver->get && !cpufreq_driver->setpolicy) {
1198 		policy->cur = cpufreq_driver->get(policy->cpu);
1199 		if (!policy->cur) {
1200 			pr_err("%s: ->get() failed\n", __func__);
1201 			goto err_get_freq;
1202 		}
1203 	}
1204 
1205 	/*
1206 	 * Sometimes boot loaders set CPU frequency to a value outside of
1207 	 * frequency table present with cpufreq core. In such cases CPU might be
1208 	 * unstable if it has to run on that frequency for long duration of time
1209 	 * and so its better to set it to a frequency which is specified in
1210 	 * freq-table. This also makes cpufreq stats inconsistent as
1211 	 * cpufreq-stats would fail to register because current frequency of CPU
1212 	 * isn't found in freq-table.
1213 	 *
1214 	 * Because we don't want this change to effect boot process badly, we go
1215 	 * for the next freq which is >= policy->cur ('cur' must be set by now,
1216 	 * otherwise we will end up setting freq to lowest of the table as 'cur'
1217 	 * is initialized to zero).
1218 	 *
1219 	 * We are passing target-freq as "policy->cur - 1" otherwise
1220 	 * __cpufreq_driver_target() would simply fail, as policy->cur will be
1221 	 * equal to target-freq.
1222 	 */
1223 	if ((cpufreq_driver->flags & CPUFREQ_NEED_INITIAL_FREQ_CHECK)
1224 	    && has_target()) {
1225 		/* Are we running at unknown frequency ? */
1226 		ret = cpufreq_frequency_table_get_index(policy, policy->cur);
1227 		if (ret == -EINVAL) {
1228 			/* Warn user and fix it */
1229 			pr_warn("%s: CPU%d: Running at unlisted freq: %u KHz\n",
1230 				__func__, policy->cpu, policy->cur);
1231 			ret = __cpufreq_driver_target(policy, policy->cur - 1,
1232 				CPUFREQ_RELATION_L);
1233 
1234 			/*
1235 			 * Reaching here after boot in a few seconds may not
1236 			 * mean that system will remain stable at "unknown"
1237 			 * frequency for longer duration. Hence, a BUG_ON().
1238 			 */
1239 			BUG_ON(ret);
1240 			pr_warn("%s: CPU%d: Unlisted initial frequency changed to: %u KHz\n",
1241 				__func__, policy->cpu, policy->cur);
1242 		}
1243 	}
1244 
1245 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1246 				     CPUFREQ_START, policy);
1247 
1248 	if (!recover_policy) {
1249 		ret = cpufreq_add_dev_interface(policy, dev);
1250 		if (ret)
1251 			goto err_out_unregister;
1252 		blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
1253 				CPUFREQ_CREATE_POLICY, policy);
1254 	}
1255 
1256 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1257 	list_add(&policy->policy_list, &cpufreq_policy_list);
1258 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1259 
1260 	cpufreq_init_policy(policy);
1261 
1262 	if (!recover_policy) {
1263 		policy->user_policy.policy = policy->policy;
1264 		policy->user_policy.governor = policy->governor;
1265 	}
1266 	up_write(&policy->rwsem);
1267 
1268 	kobject_uevent(&policy->kobj, KOBJ_ADD);
1269 	up_read(&cpufreq_rwsem);
1270 
1271 	pr_debug("initialization complete\n");
1272 
1273 	return 0;
1274 
1275 err_out_unregister:
1276 err_get_freq:
1277 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1278 	for_each_cpu(j, policy->cpus)
1279 		per_cpu(cpufreq_cpu_data, j) = NULL;
1280 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1281 
1282 	if (cpufreq_driver->exit)
1283 		cpufreq_driver->exit(policy);
1284 err_set_policy_cpu:
1285 	if (recover_policy) {
1286 		/* Do not leave stale fallback data behind. */
1287 		per_cpu(cpufreq_cpu_data_fallback, cpu) = NULL;
1288 		cpufreq_policy_put_kobj(policy);
1289 	}
1290 	cpufreq_policy_free(policy);
1291 
1292 nomem_out:
1293 	up_read(&cpufreq_rwsem);
1294 
1295 	return ret;
1296 }
1297 
1298 /**
1299  * cpufreq_add_dev - add a CPU device
1300  *
1301  * Adds the cpufreq interface for a CPU device.
1302  *
1303  * The Oracle says: try running cpufreq registration/unregistration concurrently
1304  * with with cpu hotplugging and all hell will break loose. Tried to clean this
1305  * mess up, but more thorough testing is needed. - Mathieu
1306  */
1307 static int cpufreq_add_dev(struct device *dev, struct subsys_interface *sif)
1308 {
1309 	return __cpufreq_add_dev(dev, sif);
1310 }
1311 
1312 static int cpufreq_nominate_new_policy_cpu(struct cpufreq_policy *policy,
1313 					   unsigned int old_cpu)
1314 {
1315 	struct device *cpu_dev;
1316 	int ret;
1317 
1318 	/* first sibling now owns the new sysfs dir */
1319 	cpu_dev = get_cpu_device(cpumask_any_but(policy->cpus, old_cpu));
1320 
1321 	sysfs_remove_link(&cpu_dev->kobj, "cpufreq");
1322 	ret = kobject_move(&policy->kobj, &cpu_dev->kobj);
1323 	if (ret) {
1324 		pr_err("%s: Failed to move kobj: %d\n", __func__, ret);
1325 
1326 		down_write(&policy->rwsem);
1327 		cpumask_set_cpu(old_cpu, policy->cpus);
1328 		up_write(&policy->rwsem);
1329 
1330 		ret = sysfs_create_link(&cpu_dev->kobj, &policy->kobj,
1331 					"cpufreq");
1332 
1333 		return -EINVAL;
1334 	}
1335 
1336 	return cpu_dev->id;
1337 }
1338 
1339 static int __cpufreq_remove_dev_prepare(struct device *dev,
1340 					struct subsys_interface *sif)
1341 {
1342 	unsigned int cpu = dev->id, cpus;
1343 	int new_cpu, ret;
1344 	unsigned long flags;
1345 	struct cpufreq_policy *policy;
1346 
1347 	pr_debug("%s: unregistering CPU %u\n", __func__, cpu);
1348 
1349 	write_lock_irqsave(&cpufreq_driver_lock, flags);
1350 
1351 	policy = per_cpu(cpufreq_cpu_data, cpu);
1352 
1353 	/* Save the policy somewhere when doing a light-weight tear-down */
1354 	if (cpufreq_suspended)
1355 		per_cpu(cpufreq_cpu_data_fallback, cpu) = policy;
1356 
1357 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1358 
1359 	if (!policy) {
1360 		pr_debug("%s: No cpu_data found\n", __func__);
1361 		return -EINVAL;
1362 	}
1363 
1364 	if (has_target()) {
1365 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_STOP);
1366 		if (ret) {
1367 			pr_err("%s: Failed to stop governor\n", __func__);
1368 			return ret;
1369 		}
1370 	}
1371 
1372 	if (!cpufreq_driver->setpolicy)
1373 		strncpy(per_cpu(cpufreq_cpu_governor, cpu),
1374 			policy->governor->name, CPUFREQ_NAME_LEN);
1375 
1376 	down_read(&policy->rwsem);
1377 	cpus = cpumask_weight(policy->cpus);
1378 	up_read(&policy->rwsem);
1379 
1380 	if (cpu != policy->cpu) {
1381 		sysfs_remove_link(&dev->kobj, "cpufreq");
1382 	} else if (cpus > 1) {
1383 		new_cpu = cpufreq_nominate_new_policy_cpu(policy, cpu);
1384 		if (new_cpu >= 0) {
1385 			update_policy_cpu(policy, new_cpu);
1386 
1387 			if (!cpufreq_suspended)
1388 				pr_debug("%s: policy Kobject moved to cpu: %d from: %d\n",
1389 					 __func__, new_cpu, cpu);
1390 		}
1391 	} else if (cpufreq_driver->stop_cpu && cpufreq_driver->setpolicy) {
1392 		cpufreq_driver->stop_cpu(policy);
1393 	}
1394 
1395 	return 0;
1396 }
1397 
1398 static int __cpufreq_remove_dev_finish(struct device *dev,
1399 				       struct subsys_interface *sif)
1400 {
1401 	unsigned int cpu = dev->id, cpus;
1402 	int ret;
1403 	unsigned long flags;
1404 	struct cpufreq_policy *policy;
1405 
1406 	read_lock_irqsave(&cpufreq_driver_lock, flags);
1407 	policy = per_cpu(cpufreq_cpu_data, cpu);
1408 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1409 
1410 	if (!policy) {
1411 		pr_debug("%s: No cpu_data found\n", __func__);
1412 		return -EINVAL;
1413 	}
1414 
1415 	down_write(&policy->rwsem);
1416 	cpus = cpumask_weight(policy->cpus);
1417 
1418 	if (cpus > 1)
1419 		cpumask_clear_cpu(cpu, policy->cpus);
1420 	up_write(&policy->rwsem);
1421 
1422 	/* If cpu is last user of policy, free policy */
1423 	if (cpus == 1) {
1424 		if (has_target()) {
1425 			ret = __cpufreq_governor(policy,
1426 					CPUFREQ_GOV_POLICY_EXIT);
1427 			if (ret) {
1428 				pr_err("%s: Failed to exit governor\n",
1429 				       __func__);
1430 				return ret;
1431 			}
1432 		}
1433 
1434 		if (!cpufreq_suspended)
1435 			cpufreq_policy_put_kobj(policy);
1436 
1437 		/*
1438 		 * Perform the ->exit() even during light-weight tear-down,
1439 		 * since this is a core component, and is essential for the
1440 		 * subsequent light-weight ->init() to succeed.
1441 		 */
1442 		if (cpufreq_driver->exit)
1443 			cpufreq_driver->exit(policy);
1444 
1445 		/* Remove policy from list of active policies */
1446 		write_lock_irqsave(&cpufreq_driver_lock, flags);
1447 		list_del(&policy->policy_list);
1448 		write_unlock_irqrestore(&cpufreq_driver_lock, flags);
1449 
1450 		if (!cpufreq_suspended)
1451 			cpufreq_policy_free(policy);
1452 	} else if (has_target()) {
1453 		ret = __cpufreq_governor(policy, CPUFREQ_GOV_START);
1454 		if (!ret)
1455 			ret = __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS);
1456 
1457 		if (ret) {
1458 			pr_err("%s: Failed to start governor\n", __func__);
1459 			return ret;
1460 		}
1461 	}
1462 
1463 	per_cpu(cpufreq_cpu_data, cpu) = NULL;
1464 	return 0;
1465 }
1466 
1467 /**
1468  * cpufreq_remove_dev - remove a CPU device
1469  *
1470  * Removes the cpufreq interface for a CPU device.
1471  */
1472 static int cpufreq_remove_dev(struct device *dev, struct subsys_interface *sif)
1473 {
1474 	unsigned int cpu = dev->id;
1475 	int ret;
1476 
1477 	if (cpu_is_offline(cpu))
1478 		return 0;
1479 
1480 	ret = __cpufreq_remove_dev_prepare(dev, sif);
1481 
1482 	if (!ret)
1483 		ret = __cpufreq_remove_dev_finish(dev, sif);
1484 
1485 	return ret;
1486 }
1487 
1488 static void handle_update(struct work_struct *work)
1489 {
1490 	struct cpufreq_policy *policy =
1491 		container_of(work, struct cpufreq_policy, update);
1492 	unsigned int cpu = policy->cpu;
1493 	pr_debug("handle_update for cpu %u called\n", cpu);
1494 	cpufreq_update_policy(cpu);
1495 }
1496 
1497 /**
1498  *	cpufreq_out_of_sync - If actual and saved CPU frequency differs, we're
1499  *	in deep trouble.
1500  *	@cpu: cpu number
1501  *	@old_freq: CPU frequency the kernel thinks the CPU runs at
1502  *	@new_freq: CPU frequency the CPU actually runs at
1503  *
1504  *	We adjust to current frequency first, and need to clean up later.
1505  *	So either call to cpufreq_update_policy() or schedule handle_update()).
1506  */
1507 static void cpufreq_out_of_sync(unsigned int cpu, unsigned int old_freq,
1508 				unsigned int new_freq)
1509 {
1510 	struct cpufreq_policy *policy;
1511 	struct cpufreq_freqs freqs;
1512 	unsigned long flags;
1513 
1514 	pr_debug("Warning: CPU frequency out of sync: cpufreq and timing core thinks of %u, is %u kHz\n",
1515 		 old_freq, new_freq);
1516 
1517 	freqs.old = old_freq;
1518 	freqs.new = new_freq;
1519 
1520 	read_lock_irqsave(&cpufreq_driver_lock, flags);
1521 	policy = per_cpu(cpufreq_cpu_data, cpu);
1522 	read_unlock_irqrestore(&cpufreq_driver_lock, flags);
1523 
1524 	cpufreq_freq_transition_begin(policy, &freqs);
1525 	cpufreq_freq_transition_end(policy, &freqs, 0);
1526 }
1527 
1528 /**
1529  * cpufreq_quick_get - get the CPU frequency (in kHz) from policy->cur
1530  * @cpu: CPU number
1531  *
1532  * This is the last known freq, without actually getting it from the driver.
1533  * Return value will be same as what is shown in scaling_cur_freq in sysfs.
1534  */
1535 unsigned int cpufreq_quick_get(unsigned int cpu)
1536 {
1537 	struct cpufreq_policy *policy;
1538 	unsigned int ret_freq = 0;
1539 
1540 	if (cpufreq_driver && cpufreq_driver->setpolicy && cpufreq_driver->get)
1541 		return cpufreq_driver->get(cpu);
1542 
1543 	policy = cpufreq_cpu_get(cpu);
1544 	if (policy) {
1545 		ret_freq = policy->cur;
1546 		cpufreq_cpu_put(policy);
1547 	}
1548 
1549 	return ret_freq;
1550 }
1551 EXPORT_SYMBOL(cpufreq_quick_get);
1552 
1553 /**
1554  * cpufreq_quick_get_max - get the max reported CPU frequency for this CPU
1555  * @cpu: CPU number
1556  *
1557  * Just return the max possible frequency for a given CPU.
1558  */
1559 unsigned int cpufreq_quick_get_max(unsigned int cpu)
1560 {
1561 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1562 	unsigned int ret_freq = 0;
1563 
1564 	if (policy) {
1565 		ret_freq = policy->max;
1566 		cpufreq_cpu_put(policy);
1567 	}
1568 
1569 	return ret_freq;
1570 }
1571 EXPORT_SYMBOL(cpufreq_quick_get_max);
1572 
1573 static unsigned int __cpufreq_get(unsigned int cpu)
1574 {
1575 	struct cpufreq_policy *policy = per_cpu(cpufreq_cpu_data, cpu);
1576 	unsigned int ret_freq = 0;
1577 
1578 	if (!cpufreq_driver->get)
1579 		return ret_freq;
1580 
1581 	ret_freq = cpufreq_driver->get(cpu);
1582 
1583 	if (ret_freq && policy->cur &&
1584 		!(cpufreq_driver->flags & CPUFREQ_CONST_LOOPS)) {
1585 		/* verify no discrepancy between actual and
1586 					saved value exists */
1587 		if (unlikely(ret_freq != policy->cur)) {
1588 			cpufreq_out_of_sync(cpu, policy->cur, ret_freq);
1589 			schedule_work(&policy->update);
1590 		}
1591 	}
1592 
1593 	return ret_freq;
1594 }
1595 
1596 /**
1597  * cpufreq_get - get the current CPU frequency (in kHz)
1598  * @cpu: CPU number
1599  *
1600  * Get the CPU current (static) CPU frequency
1601  */
1602 unsigned int cpufreq_get(unsigned int cpu)
1603 {
1604 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
1605 	unsigned int ret_freq = 0;
1606 
1607 	if (policy) {
1608 		down_read(&policy->rwsem);
1609 		ret_freq = __cpufreq_get(cpu);
1610 		up_read(&policy->rwsem);
1611 
1612 		cpufreq_cpu_put(policy);
1613 	}
1614 
1615 	return ret_freq;
1616 }
1617 EXPORT_SYMBOL(cpufreq_get);
1618 
1619 static struct subsys_interface cpufreq_interface = {
1620 	.name		= "cpufreq",
1621 	.subsys		= &cpu_subsys,
1622 	.add_dev	= cpufreq_add_dev,
1623 	.remove_dev	= cpufreq_remove_dev,
1624 };
1625 
1626 /*
1627  * In case platform wants some specific frequency to be configured
1628  * during suspend..
1629  */
1630 int cpufreq_generic_suspend(struct cpufreq_policy *policy)
1631 {
1632 	int ret;
1633 
1634 	if (!policy->suspend_freq) {
1635 		pr_err("%s: suspend_freq can't be zero\n", __func__);
1636 		return -EINVAL;
1637 	}
1638 
1639 	pr_debug("%s: Setting suspend-freq: %u\n", __func__,
1640 			policy->suspend_freq);
1641 
1642 	ret = __cpufreq_driver_target(policy, policy->suspend_freq,
1643 			CPUFREQ_RELATION_H);
1644 	if (ret)
1645 		pr_err("%s: unable to set suspend-freq: %u. err: %d\n",
1646 				__func__, policy->suspend_freq, ret);
1647 
1648 	return ret;
1649 }
1650 EXPORT_SYMBOL(cpufreq_generic_suspend);
1651 
1652 /**
1653  * cpufreq_suspend() - Suspend CPUFreq governors
1654  *
1655  * Called during system wide Suspend/Hibernate cycles for suspending governors
1656  * as some platforms can't change frequency after this point in suspend cycle.
1657  * Because some of the devices (like: i2c, regulators, etc) they use for
1658  * changing frequency are suspended quickly after this point.
1659  */
1660 void cpufreq_suspend(void)
1661 {
1662 	struct cpufreq_policy *policy;
1663 
1664 	if (!cpufreq_driver)
1665 		return;
1666 
1667 	if (!has_target())
1668 		return;
1669 
1670 	pr_debug("%s: Suspending Governors\n", __func__);
1671 
1672 	list_for_each_entry(policy, &cpufreq_policy_list, policy_list) {
1673 		if (__cpufreq_governor(policy, CPUFREQ_GOV_STOP))
1674 			pr_err("%s: Failed to stop governor for policy: %p\n",
1675 				__func__, policy);
1676 		else if (cpufreq_driver->suspend
1677 		    && cpufreq_driver->suspend(policy))
1678 			pr_err("%s: Failed to suspend driver: %p\n", __func__,
1679 				policy);
1680 	}
1681 
1682 	cpufreq_suspended = true;
1683 }
1684 
1685 /**
1686  * cpufreq_resume() - Resume CPUFreq governors
1687  *
1688  * Called during system wide Suspend/Hibernate cycle for resuming governors that
1689  * are suspended with cpufreq_suspend().
1690  */
1691 void cpufreq_resume(void)
1692 {
1693 	struct cpufreq_policy *policy;
1694 
1695 	if (!cpufreq_driver)
1696 		return;
1697 
1698 	if (!has_target())
1699 		return;
1700 
1701 	pr_debug("%s: Resuming Governors\n", __func__);
1702 
1703 	cpufreq_suspended = false;
1704 
1705 	list_for_each_entry(policy, &cpufreq_policy_list, policy_list) {
1706 		if (cpufreq_driver->resume && cpufreq_driver->resume(policy))
1707 			pr_err("%s: Failed to resume driver: %p\n", __func__,
1708 				policy);
1709 		else if (__cpufreq_governor(policy, CPUFREQ_GOV_START)
1710 		    || __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS))
1711 			pr_err("%s: Failed to start governor for policy: %p\n",
1712 				__func__, policy);
1713 
1714 		/*
1715 		 * schedule call cpufreq_update_policy() for boot CPU, i.e. last
1716 		 * policy in list. It will verify that the current freq is in
1717 		 * sync with what we believe it to be.
1718 		 */
1719 		if (list_is_last(&policy->policy_list, &cpufreq_policy_list))
1720 			schedule_work(&policy->update);
1721 	}
1722 }
1723 
1724 /**
1725  *	cpufreq_get_current_driver - return current driver's name
1726  *
1727  *	Return the name string of the currently loaded cpufreq driver
1728  *	or NULL, if none.
1729  */
1730 const char *cpufreq_get_current_driver(void)
1731 {
1732 	if (cpufreq_driver)
1733 		return cpufreq_driver->name;
1734 
1735 	return NULL;
1736 }
1737 EXPORT_SYMBOL_GPL(cpufreq_get_current_driver);
1738 
1739 /*********************************************************************
1740  *                     NOTIFIER LISTS INTERFACE                      *
1741  *********************************************************************/
1742 
1743 /**
1744  *	cpufreq_register_notifier - register a driver with cpufreq
1745  *	@nb: notifier function to register
1746  *      @list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1747  *
1748  *	Add a driver to one of two lists: either a list of drivers that
1749  *      are notified about clock rate changes (once before and once after
1750  *      the transition), or a list of drivers that are notified about
1751  *      changes in cpufreq policy.
1752  *
1753  *	This function may sleep, and has the same return conditions as
1754  *	blocking_notifier_chain_register.
1755  */
1756 int cpufreq_register_notifier(struct notifier_block *nb, unsigned int list)
1757 {
1758 	int ret;
1759 
1760 	if (cpufreq_disabled())
1761 		return -EINVAL;
1762 
1763 	WARN_ON(!init_cpufreq_transition_notifier_list_called);
1764 
1765 	switch (list) {
1766 	case CPUFREQ_TRANSITION_NOTIFIER:
1767 		ret = srcu_notifier_chain_register(
1768 				&cpufreq_transition_notifier_list, nb);
1769 		break;
1770 	case CPUFREQ_POLICY_NOTIFIER:
1771 		ret = blocking_notifier_chain_register(
1772 				&cpufreq_policy_notifier_list, nb);
1773 		break;
1774 	default:
1775 		ret = -EINVAL;
1776 	}
1777 
1778 	return ret;
1779 }
1780 EXPORT_SYMBOL(cpufreq_register_notifier);
1781 
1782 /**
1783  *	cpufreq_unregister_notifier - unregister a driver with cpufreq
1784  *	@nb: notifier block to be unregistered
1785  *	@list: CPUFREQ_TRANSITION_NOTIFIER or CPUFREQ_POLICY_NOTIFIER
1786  *
1787  *	Remove a driver from the CPU frequency notifier list.
1788  *
1789  *	This function may sleep, and has the same return conditions as
1790  *	blocking_notifier_chain_unregister.
1791  */
1792 int cpufreq_unregister_notifier(struct notifier_block *nb, unsigned int list)
1793 {
1794 	int ret;
1795 
1796 	if (cpufreq_disabled())
1797 		return -EINVAL;
1798 
1799 	switch (list) {
1800 	case CPUFREQ_TRANSITION_NOTIFIER:
1801 		ret = srcu_notifier_chain_unregister(
1802 				&cpufreq_transition_notifier_list, nb);
1803 		break;
1804 	case CPUFREQ_POLICY_NOTIFIER:
1805 		ret = blocking_notifier_chain_unregister(
1806 				&cpufreq_policy_notifier_list, nb);
1807 		break;
1808 	default:
1809 		ret = -EINVAL;
1810 	}
1811 
1812 	return ret;
1813 }
1814 EXPORT_SYMBOL(cpufreq_unregister_notifier);
1815 
1816 
1817 /*********************************************************************
1818  *                              GOVERNORS                            *
1819  *********************************************************************/
1820 
1821 /* Must set freqs->new to intermediate frequency */
1822 static int __target_intermediate(struct cpufreq_policy *policy,
1823 				 struct cpufreq_freqs *freqs, int index)
1824 {
1825 	int ret;
1826 
1827 	freqs->new = cpufreq_driver->get_intermediate(policy, index);
1828 
1829 	/* We don't need to switch to intermediate freq */
1830 	if (!freqs->new)
1831 		return 0;
1832 
1833 	pr_debug("%s: cpu: %d, switching to intermediate freq: oldfreq: %u, intermediate freq: %u\n",
1834 		 __func__, policy->cpu, freqs->old, freqs->new);
1835 
1836 	cpufreq_freq_transition_begin(policy, freqs);
1837 	ret = cpufreq_driver->target_intermediate(policy, index);
1838 	cpufreq_freq_transition_end(policy, freqs, ret);
1839 
1840 	if (ret)
1841 		pr_err("%s: Failed to change to intermediate frequency: %d\n",
1842 		       __func__, ret);
1843 
1844 	return ret;
1845 }
1846 
1847 static int __target_index(struct cpufreq_policy *policy,
1848 			  struct cpufreq_frequency_table *freq_table, int index)
1849 {
1850 	struct cpufreq_freqs freqs = {.old = policy->cur, .flags = 0};
1851 	unsigned int intermediate_freq = 0;
1852 	int retval = -EINVAL;
1853 	bool notify;
1854 
1855 	notify = !(cpufreq_driver->flags & CPUFREQ_ASYNC_NOTIFICATION);
1856 	if (notify) {
1857 		/* Handle switching to intermediate frequency */
1858 		if (cpufreq_driver->get_intermediate) {
1859 			retval = __target_intermediate(policy, &freqs, index);
1860 			if (retval)
1861 				return retval;
1862 
1863 			intermediate_freq = freqs.new;
1864 			/* Set old freq to intermediate */
1865 			if (intermediate_freq)
1866 				freqs.old = freqs.new;
1867 		}
1868 
1869 		freqs.new = freq_table[index].frequency;
1870 		pr_debug("%s: cpu: %d, oldfreq: %u, new freq: %u\n",
1871 			 __func__, policy->cpu, freqs.old, freqs.new);
1872 
1873 		cpufreq_freq_transition_begin(policy, &freqs);
1874 	}
1875 
1876 	retval = cpufreq_driver->target_index(policy, index);
1877 	if (retval)
1878 		pr_err("%s: Failed to change cpu frequency: %d\n", __func__,
1879 		       retval);
1880 
1881 	if (notify) {
1882 		cpufreq_freq_transition_end(policy, &freqs, retval);
1883 
1884 		/*
1885 		 * Failed after setting to intermediate freq? Driver should have
1886 		 * reverted back to initial frequency and so should we. Check
1887 		 * here for intermediate_freq instead of get_intermediate, in
1888 		 * case we have't switched to intermediate freq at all.
1889 		 */
1890 		if (unlikely(retval && intermediate_freq)) {
1891 			freqs.old = intermediate_freq;
1892 			freqs.new = policy->restore_freq;
1893 			cpufreq_freq_transition_begin(policy, &freqs);
1894 			cpufreq_freq_transition_end(policy, &freqs, 0);
1895 		}
1896 	}
1897 
1898 	return retval;
1899 }
1900 
1901 int __cpufreq_driver_target(struct cpufreq_policy *policy,
1902 			    unsigned int target_freq,
1903 			    unsigned int relation)
1904 {
1905 	unsigned int old_target_freq = target_freq;
1906 	int retval = -EINVAL;
1907 
1908 	if (cpufreq_disabled())
1909 		return -ENODEV;
1910 
1911 	/* Make sure that target_freq is within supported range */
1912 	if (target_freq > policy->max)
1913 		target_freq = policy->max;
1914 	if (target_freq < policy->min)
1915 		target_freq = policy->min;
1916 
1917 	pr_debug("target for CPU %u: %u kHz, relation %u, requested %u kHz\n",
1918 		 policy->cpu, target_freq, relation, old_target_freq);
1919 
1920 	/*
1921 	 * This might look like a redundant call as we are checking it again
1922 	 * after finding index. But it is left intentionally for cases where
1923 	 * exactly same freq is called again and so we can save on few function
1924 	 * calls.
1925 	 */
1926 	if (target_freq == policy->cur)
1927 		return 0;
1928 
1929 	/* Save last value to restore later on errors */
1930 	policy->restore_freq = policy->cur;
1931 
1932 	if (cpufreq_driver->target)
1933 		retval = cpufreq_driver->target(policy, target_freq, relation);
1934 	else if (cpufreq_driver->target_index) {
1935 		struct cpufreq_frequency_table *freq_table;
1936 		int index;
1937 
1938 		freq_table = cpufreq_frequency_get_table(policy->cpu);
1939 		if (unlikely(!freq_table)) {
1940 			pr_err("%s: Unable to find freq_table\n", __func__);
1941 			goto out;
1942 		}
1943 
1944 		retval = cpufreq_frequency_table_target(policy, freq_table,
1945 				target_freq, relation, &index);
1946 		if (unlikely(retval)) {
1947 			pr_err("%s: Unable to find matching freq\n", __func__);
1948 			goto out;
1949 		}
1950 
1951 		if (freq_table[index].frequency == policy->cur) {
1952 			retval = 0;
1953 			goto out;
1954 		}
1955 
1956 		retval = __target_index(policy, freq_table, index);
1957 	}
1958 
1959 out:
1960 	return retval;
1961 }
1962 EXPORT_SYMBOL_GPL(__cpufreq_driver_target);
1963 
1964 int cpufreq_driver_target(struct cpufreq_policy *policy,
1965 			  unsigned int target_freq,
1966 			  unsigned int relation)
1967 {
1968 	int ret = -EINVAL;
1969 
1970 	down_write(&policy->rwsem);
1971 
1972 	ret = __cpufreq_driver_target(policy, target_freq, relation);
1973 
1974 	up_write(&policy->rwsem);
1975 
1976 	return ret;
1977 }
1978 EXPORT_SYMBOL_GPL(cpufreq_driver_target);
1979 
1980 /*
1981  * when "event" is CPUFREQ_GOV_LIMITS
1982  */
1983 
1984 static int __cpufreq_governor(struct cpufreq_policy *policy,
1985 					unsigned int event)
1986 {
1987 	int ret;
1988 
1989 	/* Only must be defined when default governor is known to have latency
1990 	   restrictions, like e.g. conservative or ondemand.
1991 	   That this is the case is already ensured in Kconfig
1992 	*/
1993 #ifdef CONFIG_CPU_FREQ_GOV_PERFORMANCE
1994 	struct cpufreq_governor *gov = &cpufreq_gov_performance;
1995 #else
1996 	struct cpufreq_governor *gov = NULL;
1997 #endif
1998 
1999 	/* Don't start any governor operations if we are entering suspend */
2000 	if (cpufreq_suspended)
2001 		return 0;
2002 
2003 	if (policy->governor->max_transition_latency &&
2004 	    policy->cpuinfo.transition_latency >
2005 	    policy->governor->max_transition_latency) {
2006 		if (!gov)
2007 			return -EINVAL;
2008 		else {
2009 			pr_warn("%s governor failed, too long transition latency of HW, fallback to %s governor\n",
2010 				policy->governor->name, gov->name);
2011 			policy->governor = gov;
2012 		}
2013 	}
2014 
2015 	if (event == CPUFREQ_GOV_POLICY_INIT)
2016 		if (!try_module_get(policy->governor->owner))
2017 			return -EINVAL;
2018 
2019 	pr_debug("__cpufreq_governor for CPU %u, event %u\n",
2020 		 policy->cpu, event);
2021 
2022 	mutex_lock(&cpufreq_governor_lock);
2023 	if ((policy->governor_enabled && event == CPUFREQ_GOV_START)
2024 	    || (!policy->governor_enabled
2025 	    && (event == CPUFREQ_GOV_LIMITS || event == CPUFREQ_GOV_STOP))) {
2026 		mutex_unlock(&cpufreq_governor_lock);
2027 		return -EBUSY;
2028 	}
2029 
2030 	if (event == CPUFREQ_GOV_STOP)
2031 		policy->governor_enabled = false;
2032 	else if (event == CPUFREQ_GOV_START)
2033 		policy->governor_enabled = true;
2034 
2035 	mutex_unlock(&cpufreq_governor_lock);
2036 
2037 	ret = policy->governor->governor(policy, event);
2038 
2039 	if (!ret) {
2040 		if (event == CPUFREQ_GOV_POLICY_INIT)
2041 			policy->governor->initialized++;
2042 		else if (event == CPUFREQ_GOV_POLICY_EXIT)
2043 			policy->governor->initialized--;
2044 	} else {
2045 		/* Restore original values */
2046 		mutex_lock(&cpufreq_governor_lock);
2047 		if (event == CPUFREQ_GOV_STOP)
2048 			policy->governor_enabled = true;
2049 		else if (event == CPUFREQ_GOV_START)
2050 			policy->governor_enabled = false;
2051 		mutex_unlock(&cpufreq_governor_lock);
2052 	}
2053 
2054 	if (((event == CPUFREQ_GOV_POLICY_INIT) && ret) ||
2055 			((event == CPUFREQ_GOV_POLICY_EXIT) && !ret))
2056 		module_put(policy->governor->owner);
2057 
2058 	return ret;
2059 }
2060 
2061 int cpufreq_register_governor(struct cpufreq_governor *governor)
2062 {
2063 	int err;
2064 
2065 	if (!governor)
2066 		return -EINVAL;
2067 
2068 	if (cpufreq_disabled())
2069 		return -ENODEV;
2070 
2071 	mutex_lock(&cpufreq_governor_mutex);
2072 
2073 	governor->initialized = 0;
2074 	err = -EBUSY;
2075 	if (__find_governor(governor->name) == NULL) {
2076 		err = 0;
2077 		list_add(&governor->governor_list, &cpufreq_governor_list);
2078 	}
2079 
2080 	mutex_unlock(&cpufreq_governor_mutex);
2081 	return err;
2082 }
2083 EXPORT_SYMBOL_GPL(cpufreq_register_governor);
2084 
2085 void cpufreq_unregister_governor(struct cpufreq_governor *governor)
2086 {
2087 	int cpu;
2088 
2089 	if (!governor)
2090 		return;
2091 
2092 	if (cpufreq_disabled())
2093 		return;
2094 
2095 	for_each_present_cpu(cpu) {
2096 		if (cpu_online(cpu))
2097 			continue;
2098 		if (!strcmp(per_cpu(cpufreq_cpu_governor, cpu), governor->name))
2099 			strcpy(per_cpu(cpufreq_cpu_governor, cpu), "\0");
2100 	}
2101 
2102 	mutex_lock(&cpufreq_governor_mutex);
2103 	list_del(&governor->governor_list);
2104 	mutex_unlock(&cpufreq_governor_mutex);
2105 	return;
2106 }
2107 EXPORT_SYMBOL_GPL(cpufreq_unregister_governor);
2108 
2109 
2110 /*********************************************************************
2111  *                          POLICY INTERFACE                         *
2112  *********************************************************************/
2113 
2114 /**
2115  * cpufreq_get_policy - get the current cpufreq_policy
2116  * @policy: struct cpufreq_policy into which the current cpufreq_policy
2117  *	is written
2118  *
2119  * Reads the current cpufreq policy.
2120  */
2121 int cpufreq_get_policy(struct cpufreq_policy *policy, unsigned int cpu)
2122 {
2123 	struct cpufreq_policy *cpu_policy;
2124 	if (!policy)
2125 		return -EINVAL;
2126 
2127 	cpu_policy = cpufreq_cpu_get(cpu);
2128 	if (!cpu_policy)
2129 		return -EINVAL;
2130 
2131 	memcpy(policy, cpu_policy, sizeof(*policy));
2132 
2133 	cpufreq_cpu_put(cpu_policy);
2134 	return 0;
2135 }
2136 EXPORT_SYMBOL(cpufreq_get_policy);
2137 
2138 /*
2139  * policy : current policy.
2140  * new_policy: policy to be set.
2141  */
2142 static int cpufreq_set_policy(struct cpufreq_policy *policy,
2143 				struct cpufreq_policy *new_policy)
2144 {
2145 	struct cpufreq_governor *old_gov;
2146 	int ret;
2147 
2148 	pr_debug("setting new policy for CPU %u: %u - %u kHz\n",
2149 		 new_policy->cpu, new_policy->min, new_policy->max);
2150 
2151 	memcpy(&new_policy->cpuinfo, &policy->cpuinfo, sizeof(policy->cpuinfo));
2152 
2153 	if (new_policy->min > policy->max || new_policy->max < policy->min)
2154 		return -EINVAL;
2155 
2156 	/* verify the cpu speed can be set within this limit */
2157 	ret = cpufreq_driver->verify(new_policy);
2158 	if (ret)
2159 		return ret;
2160 
2161 	/* adjust if necessary - all reasons */
2162 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
2163 			CPUFREQ_ADJUST, new_policy);
2164 
2165 	/* adjust if necessary - hardware incompatibility*/
2166 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
2167 			CPUFREQ_INCOMPATIBLE, new_policy);
2168 
2169 	/*
2170 	 * verify the cpu speed can be set within this limit, which might be
2171 	 * different to the first one
2172 	 */
2173 	ret = cpufreq_driver->verify(new_policy);
2174 	if (ret)
2175 		return ret;
2176 
2177 	/* notification of the new policy */
2178 	blocking_notifier_call_chain(&cpufreq_policy_notifier_list,
2179 			CPUFREQ_NOTIFY, new_policy);
2180 
2181 	policy->min = new_policy->min;
2182 	policy->max = new_policy->max;
2183 
2184 	pr_debug("new min and max freqs are %u - %u kHz\n",
2185 		 policy->min, policy->max);
2186 
2187 	if (cpufreq_driver->setpolicy) {
2188 		policy->policy = new_policy->policy;
2189 		pr_debug("setting range\n");
2190 		return cpufreq_driver->setpolicy(new_policy);
2191 	}
2192 
2193 	if (new_policy->governor == policy->governor)
2194 		goto out;
2195 
2196 	pr_debug("governor switch\n");
2197 
2198 	/* save old, working values */
2199 	old_gov = policy->governor;
2200 	/* end old governor */
2201 	if (old_gov) {
2202 		__cpufreq_governor(policy, CPUFREQ_GOV_STOP);
2203 		up_write(&policy->rwsem);
2204 		__cpufreq_governor(policy, CPUFREQ_GOV_POLICY_EXIT);
2205 		down_write(&policy->rwsem);
2206 	}
2207 
2208 	/* start new governor */
2209 	policy->governor = new_policy->governor;
2210 	if (!__cpufreq_governor(policy, CPUFREQ_GOV_POLICY_INIT)) {
2211 		if (!__cpufreq_governor(policy, CPUFREQ_GOV_START))
2212 			goto out;
2213 
2214 		up_write(&policy->rwsem);
2215 		__cpufreq_governor(policy, CPUFREQ_GOV_POLICY_EXIT);
2216 		down_write(&policy->rwsem);
2217 	}
2218 
2219 	/* new governor failed, so re-start old one */
2220 	pr_debug("starting governor %s failed\n", policy->governor->name);
2221 	if (old_gov) {
2222 		policy->governor = old_gov;
2223 		__cpufreq_governor(policy, CPUFREQ_GOV_POLICY_INIT);
2224 		__cpufreq_governor(policy, CPUFREQ_GOV_START);
2225 	}
2226 
2227 	return -EINVAL;
2228 
2229  out:
2230 	pr_debug("governor: change or update limits\n");
2231 	return __cpufreq_governor(policy, CPUFREQ_GOV_LIMITS);
2232 }
2233 
2234 /**
2235  *	cpufreq_update_policy - re-evaluate an existing cpufreq policy
2236  *	@cpu: CPU which shall be re-evaluated
2237  *
2238  *	Useful for policy notifiers which have different necessities
2239  *	at different times.
2240  */
2241 int cpufreq_update_policy(unsigned int cpu)
2242 {
2243 	struct cpufreq_policy *policy = cpufreq_cpu_get(cpu);
2244 	struct cpufreq_policy new_policy;
2245 	int ret;
2246 
2247 	if (!policy)
2248 		return -ENODEV;
2249 
2250 	down_write(&policy->rwsem);
2251 
2252 	pr_debug("updating policy for CPU %u\n", cpu);
2253 	memcpy(&new_policy, policy, sizeof(*policy));
2254 	new_policy.min = policy->user_policy.min;
2255 	new_policy.max = policy->user_policy.max;
2256 	new_policy.policy = policy->user_policy.policy;
2257 	new_policy.governor = policy->user_policy.governor;
2258 
2259 	/*
2260 	 * BIOS might change freq behind our back
2261 	 * -> ask driver for current freq and notify governors about a change
2262 	 */
2263 	if (cpufreq_driver->get && !cpufreq_driver->setpolicy) {
2264 		new_policy.cur = cpufreq_driver->get(cpu);
2265 		if (WARN_ON(!new_policy.cur)) {
2266 			ret = -EIO;
2267 			goto unlock;
2268 		}
2269 
2270 		if (!policy->cur) {
2271 			pr_debug("Driver did not initialize current freq\n");
2272 			policy->cur = new_policy.cur;
2273 		} else {
2274 			if (policy->cur != new_policy.cur && has_target())
2275 				cpufreq_out_of_sync(cpu, policy->cur,
2276 								new_policy.cur);
2277 		}
2278 	}
2279 
2280 	ret = cpufreq_set_policy(policy, &new_policy);
2281 
2282 unlock:
2283 	up_write(&policy->rwsem);
2284 
2285 	cpufreq_cpu_put(policy);
2286 	return ret;
2287 }
2288 EXPORT_SYMBOL(cpufreq_update_policy);
2289 
2290 static int cpufreq_cpu_callback(struct notifier_block *nfb,
2291 					unsigned long action, void *hcpu)
2292 {
2293 	unsigned int cpu = (unsigned long)hcpu;
2294 	struct device *dev;
2295 
2296 	dev = get_cpu_device(cpu);
2297 	if (dev) {
2298 		switch (action & ~CPU_TASKS_FROZEN) {
2299 		case CPU_ONLINE:
2300 			__cpufreq_add_dev(dev, NULL);
2301 			break;
2302 
2303 		case CPU_DOWN_PREPARE:
2304 			__cpufreq_remove_dev_prepare(dev, NULL);
2305 			break;
2306 
2307 		case CPU_POST_DEAD:
2308 			__cpufreq_remove_dev_finish(dev, NULL);
2309 			break;
2310 
2311 		case CPU_DOWN_FAILED:
2312 			__cpufreq_add_dev(dev, NULL);
2313 			break;
2314 		}
2315 	}
2316 	return NOTIFY_OK;
2317 }
2318 
2319 static struct notifier_block __refdata cpufreq_cpu_notifier = {
2320 	.notifier_call = cpufreq_cpu_callback,
2321 };
2322 
2323 /*********************************************************************
2324  *               BOOST						     *
2325  *********************************************************************/
2326 static int cpufreq_boost_set_sw(int state)
2327 {
2328 	struct cpufreq_frequency_table *freq_table;
2329 	struct cpufreq_policy *policy;
2330 	int ret = -EINVAL;
2331 
2332 	list_for_each_entry(policy, &cpufreq_policy_list, policy_list) {
2333 		freq_table = cpufreq_frequency_get_table(policy->cpu);
2334 		if (freq_table) {
2335 			ret = cpufreq_frequency_table_cpuinfo(policy,
2336 							freq_table);
2337 			if (ret) {
2338 				pr_err("%s: Policy frequency update failed\n",
2339 				       __func__);
2340 				break;
2341 			}
2342 			policy->user_policy.max = policy->max;
2343 			__cpufreq_governor(policy, CPUFREQ_GOV_LIMITS);
2344 		}
2345 	}
2346 
2347 	return ret;
2348 }
2349 
2350 int cpufreq_boost_trigger_state(int state)
2351 {
2352 	unsigned long flags;
2353 	int ret = 0;
2354 
2355 	if (cpufreq_driver->boost_enabled == state)
2356 		return 0;
2357 
2358 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2359 	cpufreq_driver->boost_enabled = state;
2360 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2361 
2362 	ret = cpufreq_driver->set_boost(state);
2363 	if (ret) {
2364 		write_lock_irqsave(&cpufreq_driver_lock, flags);
2365 		cpufreq_driver->boost_enabled = !state;
2366 		write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2367 
2368 		pr_err("%s: Cannot %s BOOST\n",
2369 		       __func__, state ? "enable" : "disable");
2370 	}
2371 
2372 	return ret;
2373 }
2374 
2375 int cpufreq_boost_supported(void)
2376 {
2377 	if (likely(cpufreq_driver))
2378 		return cpufreq_driver->boost_supported;
2379 
2380 	return 0;
2381 }
2382 EXPORT_SYMBOL_GPL(cpufreq_boost_supported);
2383 
2384 int cpufreq_boost_enabled(void)
2385 {
2386 	return cpufreq_driver->boost_enabled;
2387 }
2388 EXPORT_SYMBOL_GPL(cpufreq_boost_enabled);
2389 
2390 /*********************************************************************
2391  *               REGISTER / UNREGISTER CPUFREQ DRIVER                *
2392  *********************************************************************/
2393 
2394 /**
2395  * cpufreq_register_driver - register a CPU Frequency driver
2396  * @driver_data: A struct cpufreq_driver containing the values#
2397  * submitted by the CPU Frequency driver.
2398  *
2399  * Registers a CPU Frequency driver to this core code. This code
2400  * returns zero on success, -EBUSY when another driver got here first
2401  * (and isn't unregistered in the meantime).
2402  *
2403  */
2404 int cpufreq_register_driver(struct cpufreq_driver *driver_data)
2405 {
2406 	unsigned long flags;
2407 	int ret;
2408 
2409 	if (cpufreq_disabled())
2410 		return -ENODEV;
2411 
2412 	if (!driver_data || !driver_data->verify || !driver_data->init ||
2413 	    !(driver_data->setpolicy || driver_data->target_index ||
2414 		    driver_data->target) ||
2415 	     (driver_data->setpolicy && (driver_data->target_index ||
2416 		    driver_data->target)) ||
2417 	     (!!driver_data->get_intermediate != !!driver_data->target_intermediate))
2418 		return -EINVAL;
2419 
2420 	pr_debug("trying to register driver %s\n", driver_data->name);
2421 
2422 	if (driver_data->setpolicy)
2423 		driver_data->flags |= CPUFREQ_CONST_LOOPS;
2424 
2425 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2426 	if (cpufreq_driver) {
2427 		write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2428 		return -EEXIST;
2429 	}
2430 	cpufreq_driver = driver_data;
2431 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2432 
2433 	if (cpufreq_boost_supported()) {
2434 		/*
2435 		 * Check if driver provides function to enable boost -
2436 		 * if not, use cpufreq_boost_set_sw as default
2437 		 */
2438 		if (!cpufreq_driver->set_boost)
2439 			cpufreq_driver->set_boost = cpufreq_boost_set_sw;
2440 
2441 		ret = cpufreq_sysfs_create_file(&boost.attr);
2442 		if (ret) {
2443 			pr_err("%s: cannot register global BOOST sysfs file\n",
2444 			       __func__);
2445 			goto err_null_driver;
2446 		}
2447 	}
2448 
2449 	ret = subsys_interface_register(&cpufreq_interface);
2450 	if (ret)
2451 		goto err_boost_unreg;
2452 
2453 	if (!(cpufreq_driver->flags & CPUFREQ_STICKY)) {
2454 		int i;
2455 		ret = -ENODEV;
2456 
2457 		/* check for at least one working CPU */
2458 		for (i = 0; i < nr_cpu_ids; i++)
2459 			if (cpu_possible(i) && per_cpu(cpufreq_cpu_data, i)) {
2460 				ret = 0;
2461 				break;
2462 			}
2463 
2464 		/* if all ->init() calls failed, unregister */
2465 		if (ret) {
2466 			pr_debug("no CPU initialized for driver %s\n",
2467 				 driver_data->name);
2468 			goto err_if_unreg;
2469 		}
2470 	}
2471 
2472 	register_hotcpu_notifier(&cpufreq_cpu_notifier);
2473 	pr_debug("driver %s up and running\n", driver_data->name);
2474 
2475 	return 0;
2476 err_if_unreg:
2477 	subsys_interface_unregister(&cpufreq_interface);
2478 err_boost_unreg:
2479 	if (cpufreq_boost_supported())
2480 		cpufreq_sysfs_remove_file(&boost.attr);
2481 err_null_driver:
2482 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2483 	cpufreq_driver = NULL;
2484 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2485 	return ret;
2486 }
2487 EXPORT_SYMBOL_GPL(cpufreq_register_driver);
2488 
2489 /**
2490  * cpufreq_unregister_driver - unregister the current CPUFreq driver
2491  *
2492  * Unregister the current CPUFreq driver. Only call this if you have
2493  * the right to do so, i.e. if you have succeeded in initialising before!
2494  * Returns zero if successful, and -EINVAL if the cpufreq_driver is
2495  * currently not initialised.
2496  */
2497 int cpufreq_unregister_driver(struct cpufreq_driver *driver)
2498 {
2499 	unsigned long flags;
2500 
2501 	if (!cpufreq_driver || (driver != cpufreq_driver))
2502 		return -EINVAL;
2503 
2504 	pr_debug("unregistering driver %s\n", driver->name);
2505 
2506 	subsys_interface_unregister(&cpufreq_interface);
2507 	if (cpufreq_boost_supported())
2508 		cpufreq_sysfs_remove_file(&boost.attr);
2509 
2510 	unregister_hotcpu_notifier(&cpufreq_cpu_notifier);
2511 
2512 	down_write(&cpufreq_rwsem);
2513 	write_lock_irqsave(&cpufreq_driver_lock, flags);
2514 
2515 	cpufreq_driver = NULL;
2516 
2517 	write_unlock_irqrestore(&cpufreq_driver_lock, flags);
2518 	up_write(&cpufreq_rwsem);
2519 
2520 	return 0;
2521 }
2522 EXPORT_SYMBOL_GPL(cpufreq_unregister_driver);
2523 
2524 static int __init cpufreq_core_init(void)
2525 {
2526 	if (cpufreq_disabled())
2527 		return -ENODEV;
2528 
2529 	cpufreq_global_kobject = kobject_create();
2530 	BUG_ON(!cpufreq_global_kobject);
2531 
2532 	return 0;
2533 }
2534 core_initcall(cpufreq_core_init);
2535