xref: /linux/drivers/thermal/thermal_core.c (revision 7f71507851fc7764b36a3221839607d3a45c2025)
1 // SPDX-License-Identifier: GPL-2.0
2 /*
3  *  thermal.c - Generic Thermal Management Sysfs support.
4  *
5  *  Copyright (C) 2008 Intel Corp
6  *  Copyright (C) 2008 Zhang Rui <rui.zhang@intel.com>
7  *  Copyright (C) 2008 Sujith Thomas <sujith.thomas@intel.com>
8  */
9 
10 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
11 
12 #include <linux/device.h>
13 #include <linux/err.h>
14 #include <linux/export.h>
15 #include <linux/slab.h>
16 #include <linux/kdev_t.h>
17 #include <linux/idr.h>
18 #include <linux/thermal.h>
19 #include <linux/reboot.h>
20 #include <linux/string.h>
21 #include <linux/of.h>
22 #include <linux/suspend.h>
23 
24 #define CREATE_TRACE_POINTS
25 #include "thermal_trace.h"
26 
27 #include "thermal_core.h"
28 #include "thermal_hwmon.h"
29 
30 static DEFINE_IDA(thermal_tz_ida);
31 static DEFINE_IDA(thermal_cdev_ida);
32 
33 static LIST_HEAD(thermal_tz_list);
34 static LIST_HEAD(thermal_cdev_list);
35 static LIST_HEAD(thermal_governor_list);
36 
37 static DEFINE_MUTEX(thermal_list_lock);
38 static DEFINE_MUTEX(thermal_governor_lock);
39 
40 static struct thermal_governor *def_governor;
41 
42 static bool thermal_pm_suspended;
43 
44 /*
45  * Governor section: set of functions to handle thermal governors
46  *
47  * Functions to help in the life cycle of thermal governors within
48  * the thermal core and by the thermal governor code.
49  */
50 
51 static struct thermal_governor *__find_governor(const char *name)
52 {
53 	struct thermal_governor *pos;
54 
55 	if (!name || !name[0])
56 		return def_governor;
57 
58 	list_for_each_entry(pos, &thermal_governor_list, governor_list)
59 		if (!strncasecmp(name, pos->name, THERMAL_NAME_LENGTH))
60 			return pos;
61 
62 	return NULL;
63 }
64 
65 /**
66  * bind_previous_governor() - bind the previous governor of the thermal zone
67  * @tz:		a valid pointer to a struct thermal_zone_device
68  * @failed_gov_name:	the name of the governor that failed to register
69  *
70  * Register the previous governor of the thermal zone after a new
71  * governor has failed to be bound.
72  */
73 static void bind_previous_governor(struct thermal_zone_device *tz,
74 				   const char *failed_gov_name)
75 {
76 	if (tz->governor && tz->governor->bind_to_tz) {
77 		if (tz->governor->bind_to_tz(tz)) {
78 			dev_err(&tz->device,
79 				"governor %s failed to bind and the previous one (%s) failed to bind again, thermal zone %s has no governor\n",
80 				failed_gov_name, tz->governor->name, tz->type);
81 			tz->governor = NULL;
82 		}
83 	}
84 }
85 
86 /**
87  * thermal_set_governor() - Switch to another governor
88  * @tz:		a valid pointer to a struct thermal_zone_device
89  * @new_gov:	pointer to the new governor
90  *
91  * Change the governor of thermal zone @tz.
92  *
93  * Return: 0 on success, an error if the new governor's bind_to_tz() failed.
94  */
95 static int thermal_set_governor(struct thermal_zone_device *tz,
96 				struct thermal_governor *new_gov)
97 {
98 	int ret = 0;
99 
100 	if (tz->governor && tz->governor->unbind_from_tz)
101 		tz->governor->unbind_from_tz(tz);
102 
103 	if (new_gov && new_gov->bind_to_tz) {
104 		ret = new_gov->bind_to_tz(tz);
105 		if (ret) {
106 			bind_previous_governor(tz, new_gov->name);
107 
108 			return ret;
109 		}
110 	}
111 
112 	tz->governor = new_gov;
113 
114 	return ret;
115 }
116 
117 int thermal_register_governor(struct thermal_governor *governor)
118 {
119 	int err;
120 	const char *name;
121 	struct thermal_zone_device *pos;
122 
123 	if (!governor)
124 		return -EINVAL;
125 
126 	guard(mutex)(&thermal_governor_lock);
127 
128 	err = -EBUSY;
129 	if (!__find_governor(governor->name)) {
130 		bool match_default;
131 
132 		err = 0;
133 		list_add(&governor->governor_list, &thermal_governor_list);
134 		match_default = !strncmp(governor->name,
135 					 DEFAULT_THERMAL_GOVERNOR,
136 					 THERMAL_NAME_LENGTH);
137 
138 		if (!def_governor && match_default)
139 			def_governor = governor;
140 	}
141 
142 	guard(mutex)(&thermal_list_lock);
143 
144 	list_for_each_entry(pos, &thermal_tz_list, node) {
145 		/*
146 		 * only thermal zones with specified tz->tzp->governor_name
147 		 * may run with tz->govenor unset
148 		 */
149 		if (pos->governor)
150 			continue;
151 
152 		name = pos->tzp->governor_name;
153 
154 		if (!strncasecmp(name, governor->name, THERMAL_NAME_LENGTH)) {
155 			int ret;
156 
157 			ret = thermal_set_governor(pos, governor);
158 			if (ret)
159 				dev_err(&pos->device,
160 					"Failed to set governor %s for thermal zone %s: %d\n",
161 					governor->name, pos->type, ret);
162 		}
163 	}
164 
165 	return err;
166 }
167 
168 void thermal_unregister_governor(struct thermal_governor *governor)
169 {
170 	struct thermal_zone_device *pos;
171 
172 	if (!governor)
173 		return;
174 
175 	guard(mutex)(&thermal_governor_lock);
176 
177 	if (!__find_governor(governor->name))
178 		return;
179 
180 	list_del(&governor->governor_list);
181 
182 	guard(mutex)(&thermal_list_lock);
183 
184 	list_for_each_entry(pos, &thermal_tz_list, node) {
185 		if (!strncasecmp(pos->governor->name, governor->name,
186 				 THERMAL_NAME_LENGTH))
187 			thermal_set_governor(pos, NULL);
188 	}
189 }
190 
191 int thermal_zone_device_set_policy(struct thermal_zone_device *tz,
192 				   char *policy)
193 {
194 	struct thermal_governor *gov;
195 	int ret = -EINVAL;
196 
197 	guard(mutex)(&thermal_governor_lock);
198 	guard(thermal_zone)(tz);
199 
200 	gov = __find_governor(strim(policy));
201 	if (gov)
202 		ret = thermal_set_governor(tz, gov);
203 
204 	thermal_notify_tz_gov_change(tz, policy);
205 
206 	return ret;
207 }
208 
209 int thermal_build_list_of_policies(char *buf)
210 {
211 	struct thermal_governor *pos;
212 	ssize_t count = 0;
213 
214 	guard(mutex)(&thermal_governor_lock);
215 
216 	list_for_each_entry(pos, &thermal_governor_list, governor_list) {
217 		count += sysfs_emit_at(buf, count, "%s ", pos->name);
218 	}
219 	count += sysfs_emit_at(buf, count, "\n");
220 
221 	return count;
222 }
223 
224 static void __init thermal_unregister_governors(void)
225 {
226 	struct thermal_governor **governor;
227 
228 	for_each_governor_table(governor)
229 		thermal_unregister_governor(*governor);
230 }
231 
232 static int __init thermal_register_governors(void)
233 {
234 	int ret = 0;
235 	struct thermal_governor **governor;
236 
237 	for_each_governor_table(governor) {
238 		ret = thermal_register_governor(*governor);
239 		if (ret) {
240 			pr_err("Failed to register governor: '%s'",
241 			       (*governor)->name);
242 			break;
243 		}
244 
245 		pr_info("Registered thermal governor '%s'",
246 			(*governor)->name);
247 	}
248 
249 	if (ret) {
250 		struct thermal_governor **gov;
251 
252 		for_each_governor_table(gov) {
253 			if (gov == governor)
254 				break;
255 			thermal_unregister_governor(*gov);
256 		}
257 	}
258 
259 	return ret;
260 }
261 
262 static int __thermal_zone_device_set_mode(struct thermal_zone_device *tz,
263 					  enum thermal_device_mode mode)
264 {
265 	if (tz->ops.change_mode) {
266 		int ret;
267 
268 		ret = tz->ops.change_mode(tz, mode);
269 		if (ret)
270 			return ret;
271 	}
272 
273 	tz->mode = mode;
274 
275 	return 0;
276 }
277 
278 static void thermal_zone_broken_disable(struct thermal_zone_device *tz)
279 {
280 	struct thermal_trip_desc *td;
281 
282 	dev_err(&tz->device, "Unable to get temperature, disabling!\n");
283 	/*
284 	 * This function only runs for enabled thermal zones, so no need to
285 	 * check for the current mode.
286 	 */
287 	__thermal_zone_device_set_mode(tz, THERMAL_DEVICE_DISABLED);
288 	thermal_notify_tz_disable(tz);
289 
290 	for_each_trip_desc(tz, td) {
291 		if (td->trip.type == THERMAL_TRIP_CRITICAL &&
292 		    td->trip.temperature > THERMAL_TEMP_INVALID) {
293 			dev_crit(&tz->device,
294 				 "Disabled thermal zone with critical trip point\n");
295 			return;
296 		}
297 	}
298 }
299 
300 /*
301  * Zone update section: main control loop applied to each zone while monitoring
302  * in polling mode. The monitoring is done using a workqueue.
303  * Same update may be done on a zone by calling thermal_zone_device_update().
304  *
305  * An update means:
306  * - Non-critical trips will invoke the governor responsible for that zone;
307  * - Hot trips will produce a notification to userspace;
308  * - Critical trip point will cause a system shutdown.
309  */
310 static void thermal_zone_device_set_polling(struct thermal_zone_device *tz,
311 					    unsigned long delay)
312 {
313 	if (delay > HZ)
314 		delay = round_jiffies_relative(delay);
315 
316 	mod_delayed_work(system_freezable_power_efficient_wq, &tz->poll_queue, delay);
317 }
318 
319 static void thermal_zone_recheck(struct thermal_zone_device *tz, int error)
320 {
321 	if (error == -EAGAIN) {
322 		thermal_zone_device_set_polling(tz, THERMAL_RECHECK_DELAY);
323 		return;
324 	}
325 
326 	/*
327 	 * Print the message once to reduce log noise.  It will be followed by
328 	 * another one if the temperature cannot be determined after multiple
329 	 * attempts.
330 	 */
331 	if (tz->recheck_delay_jiffies == THERMAL_RECHECK_DELAY)
332 		dev_info(&tz->device, "Temperature check failed (%d)\n", error);
333 
334 	thermal_zone_device_set_polling(tz, tz->recheck_delay_jiffies);
335 
336 	tz->recheck_delay_jiffies += max(tz->recheck_delay_jiffies >> 1, 1ULL);
337 	if (tz->recheck_delay_jiffies > THERMAL_MAX_RECHECK_DELAY) {
338 		thermal_zone_broken_disable(tz);
339 		/*
340 		 * Restore the original recheck delay value to allow the thermal
341 		 * zone to try to recover when it is reenabled by user space.
342 		 */
343 		tz->recheck_delay_jiffies = THERMAL_RECHECK_DELAY;
344 	}
345 }
346 
347 static void monitor_thermal_zone(struct thermal_zone_device *tz)
348 {
349 	if (tz->passive > 0 && tz->passive_delay_jiffies)
350 		thermal_zone_device_set_polling(tz, tz->passive_delay_jiffies);
351 	else if (tz->polling_delay_jiffies)
352 		thermal_zone_device_set_polling(tz, tz->polling_delay_jiffies);
353 }
354 
355 static struct thermal_governor *thermal_get_tz_governor(struct thermal_zone_device *tz)
356 {
357 	if (tz->governor)
358 		return tz->governor;
359 
360 	return def_governor;
361 }
362 
363 void thermal_governor_update_tz(struct thermal_zone_device *tz,
364 				enum thermal_notify_event reason)
365 {
366 	if (!tz->governor || !tz->governor->update_tz)
367 		return;
368 
369 	tz->governor->update_tz(tz, reason);
370 }
371 
372 static void thermal_zone_device_halt(struct thermal_zone_device *tz, bool shutdown)
373 {
374 	/*
375 	 * poweroff_delay_ms must be a carefully profiled positive value.
376 	 * Its a must for forced_emergency_poweroff_work to be scheduled.
377 	 */
378 	int poweroff_delay_ms = CONFIG_THERMAL_EMERGENCY_POWEROFF_DELAY_MS;
379 	const char *msg = "Temperature too high";
380 
381 	dev_emerg(&tz->device, "%s: critical temperature reached\n", tz->type);
382 
383 	if (shutdown)
384 		hw_protection_shutdown(msg, poweroff_delay_ms);
385 	else
386 		hw_protection_reboot(msg, poweroff_delay_ms);
387 }
388 
389 void thermal_zone_device_critical(struct thermal_zone_device *tz)
390 {
391 	thermal_zone_device_halt(tz, true);
392 }
393 EXPORT_SYMBOL(thermal_zone_device_critical);
394 
395 void thermal_zone_device_critical_reboot(struct thermal_zone_device *tz)
396 {
397 	thermal_zone_device_halt(tz, false);
398 }
399 
400 static void handle_critical_trips(struct thermal_zone_device *tz,
401 				  const struct thermal_trip *trip)
402 {
403 	trace_thermal_zone_trip(tz, thermal_zone_trip_id(tz, trip), trip->type);
404 
405 	if (trip->type == THERMAL_TRIP_CRITICAL)
406 		tz->ops.critical(tz);
407 	else if (tz->ops.hot)
408 		tz->ops.hot(tz);
409 }
410 
411 static void move_trip_to_sorted_list(struct thermal_trip_desc *td,
412 				     struct list_head *list)
413 {
414 	struct thermal_trip_desc *entry;
415 
416 	/*
417 	 * Delete upfront and then add to make relocation within the same list
418 	 * work.
419 	 */
420 	list_del(&td->list_node);
421 
422 	/* Assume that the new entry is likely to be the last one. */
423 	list_for_each_entry_reverse(entry, list, list_node) {
424 		if (entry->threshold <= td->threshold) {
425 			list_add(&td->list_node, &entry->list_node);
426 			return;
427 		}
428 	}
429 	list_add(&td->list_node, list);
430 }
431 
432 static void move_to_trips_high(struct thermal_zone_device *tz,
433 			       struct thermal_trip_desc *td)
434 {
435 	td->threshold = td->trip.temperature;
436 	move_trip_to_sorted_list(td, &tz->trips_high);
437 }
438 
439 static void move_to_trips_reached(struct thermal_zone_device *tz,
440 				  struct thermal_trip_desc *td)
441 {
442 	td->threshold = td->trip.temperature - td->trip.hysteresis;
443 	move_trip_to_sorted_list(td, &tz->trips_reached);
444 }
445 
446 static void move_to_trips_invalid(struct thermal_zone_device *tz,
447 				  struct thermal_trip_desc *td)
448 {
449 	td->threshold = INT_MAX;
450 	list_move(&td->list_node, &tz->trips_invalid);
451 }
452 
453 static void thermal_governor_trip_crossed(struct thermal_governor *governor,
454 					  struct thermal_zone_device *tz,
455 					  const struct thermal_trip *trip,
456 					  bool crossed_up)
457 {
458 	if (trip->type == THERMAL_TRIP_HOT || trip->type == THERMAL_TRIP_CRITICAL)
459 		return;
460 
461 	if (governor->trip_crossed)
462 		governor->trip_crossed(tz, trip, crossed_up);
463 }
464 
465 static void thermal_trip_crossed(struct thermal_zone_device *tz,
466 				 struct thermal_trip_desc *td,
467 				 struct thermal_governor *governor,
468 				 bool crossed_up)
469 {
470 	const struct thermal_trip *trip = &td->trip;
471 
472 	if (crossed_up) {
473 		if (trip->type == THERMAL_TRIP_PASSIVE)
474 			tz->passive++;
475 		else if (trip->type == THERMAL_TRIP_CRITICAL ||
476 			 trip->type == THERMAL_TRIP_HOT)
477 			handle_critical_trips(tz, trip);
478 
479 		thermal_notify_tz_trip_up(tz, trip);
480 		thermal_debug_tz_trip_up(tz, trip);
481 	} else {
482 		if (trip->type == THERMAL_TRIP_PASSIVE) {
483 			tz->passive--;
484 			WARN_ON(tz->passive < 0);
485 		}
486 		thermal_notify_tz_trip_down(tz, trip);
487 		thermal_debug_tz_trip_down(tz, trip);
488 	}
489 	thermal_governor_trip_crossed(governor, tz, trip, crossed_up);
490 }
491 
492 void thermal_zone_set_trip_hyst(struct thermal_zone_device *tz,
493 				struct thermal_trip *trip, int hyst)
494 {
495 	struct thermal_trip_desc *td = trip_to_trip_desc(trip);
496 
497 	WRITE_ONCE(trip->hysteresis, hyst);
498 	thermal_notify_tz_trip_change(tz, trip);
499 	/*
500 	 * If the zone temperature is above or at the trip tmperature, the trip
501 	 * is in the trips_reached list and its threshold is equal to its low
502 	 * temperature.  It needs to stay in that list, but its threshold needs
503 	 * to be updated and the list ordering may need to be restored.
504 	 */
505 	if (tz->temperature >= td->threshold)
506 		move_to_trips_reached(tz, td);
507 }
508 
509 void thermal_zone_set_trip_temp(struct thermal_zone_device *tz,
510 				struct thermal_trip *trip, int temp)
511 {
512 	struct thermal_trip_desc *td = trip_to_trip_desc(trip);
513 	int old_temp = trip->temperature;
514 
515 	if (old_temp == temp)
516 		return;
517 
518 	WRITE_ONCE(trip->temperature, temp);
519 	thermal_notify_tz_trip_change(tz, trip);
520 
521 	if (old_temp == THERMAL_TEMP_INVALID) {
522 		/*
523 		 * The trip was invalid before the change, so move it to the
524 		 * trips_high list regardless of the new temperature value
525 		 * because there is no mitigation under way for it.  If a
526 		 * mitigation needs to be started, the trip will be moved to the
527 		 * trips_reached list later.
528 		 */
529 		move_to_trips_high(tz, td);
530 		return;
531 	}
532 
533 	if (temp == THERMAL_TEMP_INVALID) {
534 		/*
535 		 * If the trip is in the trips_reached list, mitigation is under
536 		 * way for it and it needs to be stopped because the trip is
537 		 * effectively going away.
538 		 */
539 		if (tz->temperature >= td->threshold)
540 			thermal_trip_crossed(tz, td, thermal_get_tz_governor(tz), false);
541 
542 		move_to_trips_invalid(tz, td);
543 		return;
544 	}
545 
546 	/*
547 	 * The trip stays on its current list, but its threshold needs to be
548 	 * updated due to the temperature change and the list ordering may need
549 	 * to be restored.
550 	 */
551 	if (tz->temperature >= td->threshold)
552 		move_to_trips_reached(tz, td);
553 	else
554 		move_to_trips_high(tz, td);
555 }
556 EXPORT_SYMBOL_GPL(thermal_zone_set_trip_temp);
557 
558 static void thermal_zone_handle_trips(struct thermal_zone_device *tz,
559 				      struct thermal_governor *governor,
560 				      int *low, int *high)
561 {
562 	struct thermal_trip_desc *td, *next;
563 	LIST_HEAD(way_down_list);
564 
565 	/* Check the trips that were below or at the zone temperature. */
566 	list_for_each_entry_safe_reverse(td, next, &tz->trips_reached, list_node) {
567 		if (td->threshold <= tz->temperature)
568 			break;
569 
570 		thermal_trip_crossed(tz, td, governor, false);
571 		/*
572 		 * The current trips_high list needs to be processed before
573 		 * adding new entries to it, so put them on a temporary list.
574 		 */
575 		list_move(&td->list_node, &way_down_list);
576 	}
577 	/* Check the trips that were previously above the zone temperature. */
578 	list_for_each_entry_safe(td, next, &tz->trips_high, list_node) {
579 		if (td->threshold > tz->temperature)
580 			break;
581 
582 		thermal_trip_crossed(tz, td, governor, true);
583 		move_to_trips_reached(tz, td);
584 	}
585 	/* Move all of the trips from the temporary list to trips_high. */
586 	list_for_each_entry_safe(td, next, &way_down_list, list_node)
587 		move_to_trips_high(tz, td);
588 
589 	if (!list_empty(&tz->trips_reached)) {
590 		td = list_last_entry(&tz->trips_reached,
591 				     struct thermal_trip_desc, list_node);
592 		/*
593 		 * Set the "low" value below the current trip threshold in case
594 		 * the zone temperature is at that threshold and stays there,
595 		 * which would trigger a new interrupt immediately in vain.
596 		 */
597 		*low = td->threshold - 1;
598 	}
599 	if (!list_empty(&tz->trips_high)) {
600 		td = list_first_entry(&tz->trips_high,
601 				      struct thermal_trip_desc, list_node);
602 		*high = td->threshold;
603 	}
604 }
605 
606 void __thermal_zone_device_update(struct thermal_zone_device *tz,
607 				  enum thermal_notify_event event)
608 {
609 	struct thermal_governor *governor = thermal_get_tz_governor(tz);
610 	int low = -INT_MAX, high = INT_MAX;
611 	int temp, ret;
612 
613 	if (tz->state != TZ_STATE_READY || tz->mode != THERMAL_DEVICE_ENABLED)
614 		return;
615 
616 	ret = __thermal_zone_get_temp(tz, &temp);
617 	if (ret) {
618 		thermal_zone_recheck(tz, ret);
619 		return;
620 	} else if (temp <= THERMAL_TEMP_INVALID) {
621 		/*
622 		 * Special case: No valid temperature value is available, but
623 		 * the zone owner does not want the core to do anything about
624 		 * it.  Continue regular zone polling if needed, so that this
625 		 * function can be called again, but skip everything else.
626 		 */
627 		goto monitor;
628 	}
629 
630 	tz->recheck_delay_jiffies = THERMAL_RECHECK_DELAY;
631 
632 	tz->last_temperature = tz->temperature;
633 	tz->temperature = temp;
634 
635 	trace_thermal_temperature(tz);
636 
637 	thermal_genl_sampling_temp(tz->id, temp);
638 
639 	tz->notify_event = event;
640 
641 	thermal_zone_handle_trips(tz, governor, &low, &high);
642 
643 	thermal_thresholds_handle(tz, &low, &high);
644 
645 	thermal_zone_set_trips(tz, low, high);
646 
647 	if (governor->manage)
648 		governor->manage(tz);
649 
650 	thermal_debug_update_trip_stats(tz);
651 
652 monitor:
653 	monitor_thermal_zone(tz);
654 }
655 
656 static int thermal_zone_device_set_mode(struct thermal_zone_device *tz,
657 					enum thermal_device_mode mode)
658 {
659 	int ret;
660 
661 	guard(thermal_zone)(tz);
662 
663 	/* do nothing if mode isn't changing */
664 	if (mode == tz->mode)
665 		return 0;
666 
667 	ret = __thermal_zone_device_set_mode(tz, mode);
668 	if (ret)
669 		return ret;
670 
671 	__thermal_zone_device_update(tz, THERMAL_EVENT_UNSPECIFIED);
672 
673 	if (mode == THERMAL_DEVICE_ENABLED)
674 		thermal_notify_tz_enable(tz);
675 	else
676 		thermal_notify_tz_disable(tz);
677 
678 	return 0;
679 }
680 
681 int thermal_zone_device_enable(struct thermal_zone_device *tz)
682 {
683 	return thermal_zone_device_set_mode(tz, THERMAL_DEVICE_ENABLED);
684 }
685 EXPORT_SYMBOL_GPL(thermal_zone_device_enable);
686 
687 int thermal_zone_device_disable(struct thermal_zone_device *tz)
688 {
689 	return thermal_zone_device_set_mode(tz, THERMAL_DEVICE_DISABLED);
690 }
691 EXPORT_SYMBOL_GPL(thermal_zone_device_disable);
692 
693 static bool thermal_zone_is_present(struct thermal_zone_device *tz)
694 {
695 	return !list_empty(&tz->node);
696 }
697 
698 void thermal_zone_device_update(struct thermal_zone_device *tz,
699 				enum thermal_notify_event event)
700 {
701 	guard(thermal_zone)(tz);
702 
703 	if (thermal_zone_is_present(tz))
704 		__thermal_zone_device_update(tz, event);
705 }
706 EXPORT_SYMBOL_GPL(thermal_zone_device_update);
707 
708 int for_each_thermal_governor(int (*cb)(struct thermal_governor *, void *),
709 			      void *data)
710 {
711 	struct thermal_governor *gov;
712 
713 	guard(mutex)(&thermal_governor_lock);
714 
715 	list_for_each_entry(gov, &thermal_governor_list, governor_list) {
716 		int ret;
717 
718 		ret = cb(gov, data);
719 		if (ret)
720 			return ret;
721 	}
722 
723 	return 0;
724 }
725 
726 int for_each_thermal_cooling_device(int (*cb)(struct thermal_cooling_device *,
727 					      void *), void *data)
728 {
729 	struct thermal_cooling_device *cdev;
730 
731 	guard(mutex)(&thermal_list_lock);
732 
733 	list_for_each_entry(cdev, &thermal_cdev_list, node) {
734 		int ret;
735 
736 		ret = cb(cdev, data);
737 		if (ret)
738 			return ret;
739 	}
740 
741 	return 0;
742 }
743 
744 int for_each_thermal_zone(int (*cb)(struct thermal_zone_device *, void *),
745 			  void *data)
746 {
747 	struct thermal_zone_device *tz;
748 
749 	guard(mutex)(&thermal_list_lock);
750 
751 	list_for_each_entry(tz, &thermal_tz_list, node) {
752 		int ret;
753 
754 		ret = cb(tz, data);
755 		if (ret)
756 			return ret;
757 	}
758 
759 	return 0;
760 }
761 
762 struct thermal_zone_device *thermal_zone_get_by_id(int id)
763 {
764 	struct thermal_zone_device *tz;
765 
766 	guard(mutex)(&thermal_list_lock);
767 
768 	list_for_each_entry(tz, &thermal_tz_list, node) {
769 		if (tz->id == id) {
770 			get_device(&tz->device);
771 			return tz;
772 		}
773 	}
774 
775 	return NULL;
776 }
777 
778 /*
779  * Device management section: cooling devices, zones devices, and binding
780  *
781  * Set of functions provided by the thermal core for:
782  * - cooling devices lifecycle: registration, unregistration,
783  *				binding, and unbinding.
784  * - thermal zone devices lifecycle: registration, unregistration,
785  *				     binding, and unbinding.
786  */
787 
788 static int thermal_instance_add(struct thermal_instance *new_instance,
789 				struct thermal_cooling_device *cdev,
790 				struct thermal_trip_desc *td)
791 {
792 	struct thermal_instance *instance;
793 
794 	list_for_each_entry(instance, &td->thermal_instances, trip_node) {
795 		if (instance->cdev == cdev)
796 			return -EEXIST;
797 	}
798 
799 	list_add_tail(&new_instance->trip_node, &td->thermal_instances);
800 
801 	guard(cooling_dev)(cdev);
802 
803 	list_add_tail(&new_instance->cdev_node, &cdev->thermal_instances);
804 
805 	return 0;
806 }
807 
808 /**
809  * thermal_bind_cdev_to_trip - bind a cooling device to a thermal zone
810  * @tz:		pointer to struct thermal_zone_device
811  * @td:		descriptor of the trip point to bind @cdev to
812  * @cdev:	pointer to struct thermal_cooling_device
813  * @cool_spec:	cooling specification for the trip point and @cdev
814  *
815  * This interface function bind a thermal cooling device to the certain trip
816  * point of a thermal zone device.
817  * This function is usually called in the thermal zone device .bind callback.
818  *
819  * Return: 0 on success, the proper error value otherwise.
820  */
821 static int thermal_bind_cdev_to_trip(struct thermal_zone_device *tz,
822 				     struct thermal_trip_desc *td,
823 				     struct thermal_cooling_device *cdev,
824 				     struct cooling_spec *cool_spec)
825 {
826 	struct thermal_instance *dev;
827 	bool upper_no_limit;
828 	int result;
829 
830 	/* lower default 0, upper default max_state */
831 	if (cool_spec->lower == THERMAL_NO_LIMIT)
832 		cool_spec->lower = 0;
833 
834 	if (cool_spec->upper == THERMAL_NO_LIMIT) {
835 		cool_spec->upper = cdev->max_state;
836 		upper_no_limit = true;
837 	} else {
838 		upper_no_limit = false;
839 	}
840 
841 	if (cool_spec->lower > cool_spec->upper || cool_spec->upper > cdev->max_state)
842 		return -EINVAL;
843 
844 	dev = kzalloc(sizeof(*dev), GFP_KERNEL);
845 	if (!dev)
846 		return -ENOMEM;
847 
848 	dev->cdev = cdev;
849 	dev->trip = &td->trip;
850 	dev->upper = cool_spec->upper;
851 	dev->upper_no_limit = upper_no_limit;
852 	dev->lower = cool_spec->lower;
853 	dev->target = THERMAL_NO_TARGET;
854 	dev->weight = cool_spec->weight;
855 
856 	result = ida_alloc(&tz->ida, GFP_KERNEL);
857 	if (result < 0)
858 		goto free_mem;
859 
860 	dev->id = result;
861 	sprintf(dev->name, "cdev%d", dev->id);
862 	result =
863 	    sysfs_create_link(&tz->device.kobj, &cdev->device.kobj, dev->name);
864 	if (result)
865 		goto release_ida;
866 
867 	snprintf(dev->attr_name, sizeof(dev->attr_name), "cdev%d_trip_point",
868 		 dev->id);
869 	sysfs_attr_init(&dev->attr.attr);
870 	dev->attr.attr.name = dev->attr_name;
871 	dev->attr.attr.mode = 0444;
872 	dev->attr.show = trip_point_show;
873 	result = device_create_file(&tz->device, &dev->attr);
874 	if (result)
875 		goto remove_symbol_link;
876 
877 	snprintf(dev->weight_attr_name, sizeof(dev->weight_attr_name),
878 		 "cdev%d_weight", dev->id);
879 	sysfs_attr_init(&dev->weight_attr.attr);
880 	dev->weight_attr.attr.name = dev->weight_attr_name;
881 	dev->weight_attr.attr.mode = S_IWUSR | S_IRUGO;
882 	dev->weight_attr.show = weight_show;
883 	dev->weight_attr.store = weight_store;
884 	result = device_create_file(&tz->device, &dev->weight_attr);
885 	if (result)
886 		goto remove_trip_file;
887 
888 	result = thermal_instance_add(dev, cdev, td);
889 	if (result)
890 		goto remove_weight_file;
891 
892 	thermal_governor_update_tz(tz, THERMAL_TZ_BIND_CDEV);
893 
894 	return 0;
895 
896 remove_weight_file:
897 	device_remove_file(&tz->device, &dev->weight_attr);
898 remove_trip_file:
899 	device_remove_file(&tz->device, &dev->attr);
900 remove_symbol_link:
901 	sysfs_remove_link(&tz->device.kobj, dev->name);
902 release_ida:
903 	ida_free(&tz->ida, dev->id);
904 free_mem:
905 	kfree(dev);
906 	return result;
907 }
908 
909 static void thermal_instance_delete(struct thermal_instance *instance)
910 {
911 	list_del(&instance->trip_node);
912 
913 	guard(cooling_dev)(instance->cdev);
914 
915 	list_del(&instance->cdev_node);
916 }
917 
918 /**
919  * thermal_unbind_cdev_from_trip - unbind a cooling device from a thermal zone.
920  * @tz:		pointer to a struct thermal_zone_device.
921  * @td:		descriptor of the trip point to unbind @cdev from
922  * @cdev:	pointer to a struct thermal_cooling_device.
923  *
924  * This interface function unbind a thermal cooling device from the certain
925  * trip point of a thermal zone device.
926  * This function is usually called in the thermal zone device .unbind callback.
927  */
928 static void thermal_unbind_cdev_from_trip(struct thermal_zone_device *tz,
929 					  struct thermal_trip_desc *td,
930 					  struct thermal_cooling_device *cdev)
931 {
932 	struct thermal_instance *pos, *next;
933 
934 	list_for_each_entry_safe(pos, next, &td->thermal_instances, trip_node) {
935 		if (pos->cdev == cdev) {
936 			thermal_instance_delete(pos);
937 			goto unbind;
938 		}
939 	}
940 
941 	return;
942 
943 unbind:
944 	thermal_governor_update_tz(tz, THERMAL_TZ_UNBIND_CDEV);
945 
946 	device_remove_file(&tz->device, &pos->weight_attr);
947 	device_remove_file(&tz->device, &pos->attr);
948 	sysfs_remove_link(&tz->device.kobj, pos->name);
949 	ida_free(&tz->ida, pos->id);
950 	kfree(pos);
951 }
952 
953 static void thermal_release(struct device *dev)
954 {
955 	struct thermal_zone_device *tz;
956 	struct thermal_cooling_device *cdev;
957 
958 	if (!strncmp(dev_name(dev), "thermal_zone",
959 		     sizeof("thermal_zone") - 1)) {
960 		tz = to_thermal_zone(dev);
961 		thermal_zone_destroy_device_groups(tz);
962 		mutex_destroy(&tz->lock);
963 		complete(&tz->removal);
964 	} else if (!strncmp(dev_name(dev), "cooling_device",
965 			    sizeof("cooling_device") - 1)) {
966 		cdev = to_cooling_device(dev);
967 		thermal_cooling_device_destroy_sysfs(cdev);
968 		kfree_const(cdev->type);
969 		ida_free(&thermal_cdev_ida, cdev->id);
970 		kfree(cdev);
971 	}
972 }
973 
974 static struct class *thermal_class;
975 
976 static inline
977 void print_bind_err_msg(struct thermal_zone_device *tz,
978 			const struct thermal_trip_desc *td,
979 			struct thermal_cooling_device *cdev, int ret)
980 {
981 	dev_err(&tz->device, "binding cdev %s to trip %d failed: %d\n",
982 		cdev->type, thermal_zone_trip_id(tz, &td->trip), ret);
983 }
984 
985 static bool __thermal_zone_cdev_bind(struct thermal_zone_device *tz,
986 				     struct thermal_cooling_device *cdev)
987 {
988 	struct thermal_trip_desc *td;
989 	bool update_tz = false;
990 
991 	if (!tz->ops.should_bind)
992 		return false;
993 
994 	for_each_trip_desc(tz, td) {
995 		struct cooling_spec c = {
996 			.upper = THERMAL_NO_LIMIT,
997 			.lower = THERMAL_NO_LIMIT,
998 			.weight = THERMAL_WEIGHT_DEFAULT
999 		};
1000 		int ret;
1001 
1002 		if (!tz->ops.should_bind(tz, &td->trip, cdev, &c))
1003 			continue;
1004 
1005 		ret = thermal_bind_cdev_to_trip(tz, td, cdev, &c);
1006 		if (ret) {
1007 			print_bind_err_msg(tz, td, cdev, ret);
1008 			continue;
1009 		}
1010 
1011 		update_tz = true;
1012 	}
1013 
1014 	return update_tz;
1015 }
1016 
1017 static void thermal_zone_cdev_bind(struct thermal_zone_device *tz,
1018 				   struct thermal_cooling_device *cdev)
1019 {
1020 	guard(thermal_zone)(tz);
1021 
1022 	if (__thermal_zone_cdev_bind(tz, cdev))
1023 		__thermal_zone_device_update(tz, THERMAL_EVENT_UNSPECIFIED);
1024 }
1025 
1026 static void thermal_cooling_device_init_complete(struct thermal_cooling_device *cdev)
1027 {
1028 	struct thermal_zone_device *tz;
1029 
1030 	guard(mutex)(&thermal_list_lock);
1031 
1032 	list_add(&cdev->node, &thermal_cdev_list);
1033 
1034 	list_for_each_entry(tz, &thermal_tz_list, node)
1035 		thermal_zone_cdev_bind(tz, cdev);
1036 }
1037 
1038 /**
1039  * __thermal_cooling_device_register() - register a new thermal cooling device
1040  * @np:		a pointer to a device tree node.
1041  * @type:	the thermal cooling device type.
1042  * @devdata:	device private data.
1043  * @ops:		standard thermal cooling devices callbacks.
1044  *
1045  * This interface function adds a new thermal cooling device (fan/processor/...)
1046  * to /sys/class/thermal/ folder as cooling_device[0-*]. It tries to bind itself
1047  * to all the thermal zone devices registered at the same time.
1048  * It also gives the opportunity to link the cooling device to a device tree
1049  * node, so that it can be bound to a thermal zone created out of device tree.
1050  *
1051  * Return: a pointer to the created struct thermal_cooling_device or an
1052  * ERR_PTR. Caller must check return value with IS_ERR*() helpers.
1053  */
1054 static struct thermal_cooling_device *
1055 __thermal_cooling_device_register(struct device_node *np,
1056 				  const char *type, void *devdata,
1057 				  const struct thermal_cooling_device_ops *ops)
1058 {
1059 	struct thermal_cooling_device *cdev;
1060 	unsigned long current_state;
1061 	int id, ret;
1062 
1063 	if (!ops || !ops->get_max_state || !ops->get_cur_state ||
1064 	    !ops->set_cur_state)
1065 		return ERR_PTR(-EINVAL);
1066 
1067 	if (!thermal_class)
1068 		return ERR_PTR(-ENODEV);
1069 
1070 	cdev = kzalloc(sizeof(*cdev), GFP_KERNEL);
1071 	if (!cdev)
1072 		return ERR_PTR(-ENOMEM);
1073 
1074 	ret = ida_alloc(&thermal_cdev_ida, GFP_KERNEL);
1075 	if (ret < 0)
1076 		goto out_kfree_cdev;
1077 	cdev->id = ret;
1078 	id = ret;
1079 
1080 	cdev->type = kstrdup_const(type ? type : "", GFP_KERNEL);
1081 	if (!cdev->type) {
1082 		ret = -ENOMEM;
1083 		goto out_ida_remove;
1084 	}
1085 
1086 	mutex_init(&cdev->lock);
1087 	INIT_LIST_HEAD(&cdev->thermal_instances);
1088 	cdev->np = np;
1089 	cdev->ops = ops;
1090 	cdev->updated = false;
1091 	cdev->device.class = thermal_class;
1092 	cdev->devdata = devdata;
1093 
1094 	ret = cdev->ops->get_max_state(cdev, &cdev->max_state);
1095 	if (ret)
1096 		goto out_cdev_type;
1097 
1098 	/*
1099 	 * The cooling device's current state is only needed for debug
1100 	 * initialization below, so a failure to get it does not cause
1101 	 * the entire cooling device initialization to fail.  However,
1102 	 * the debug will not work for the device if its initial state
1103 	 * cannot be determined and drivers are responsible for ensuring
1104 	 * that this will not happen.
1105 	 */
1106 	ret = cdev->ops->get_cur_state(cdev, &current_state);
1107 	if (ret)
1108 		current_state = ULONG_MAX;
1109 
1110 	thermal_cooling_device_setup_sysfs(cdev);
1111 
1112 	ret = dev_set_name(&cdev->device, "cooling_device%d", cdev->id);
1113 	if (ret)
1114 		goto out_cooling_dev;
1115 
1116 	ret = device_register(&cdev->device);
1117 	if (ret) {
1118 		/* thermal_release() handles rest of the cleanup */
1119 		put_device(&cdev->device);
1120 		return ERR_PTR(ret);
1121 	}
1122 
1123 	if (current_state <= cdev->max_state)
1124 		thermal_debug_cdev_add(cdev, current_state);
1125 
1126 	thermal_cooling_device_init_complete(cdev);
1127 
1128 	return cdev;
1129 
1130 out_cooling_dev:
1131 	thermal_cooling_device_destroy_sysfs(cdev);
1132 out_cdev_type:
1133 	kfree_const(cdev->type);
1134 out_ida_remove:
1135 	ida_free(&thermal_cdev_ida, id);
1136 out_kfree_cdev:
1137 	kfree(cdev);
1138 	return ERR_PTR(ret);
1139 }
1140 
1141 /**
1142  * thermal_cooling_device_register() - register a new thermal cooling device
1143  * @type:	the thermal cooling device type.
1144  * @devdata:	device private data.
1145  * @ops:		standard thermal cooling devices callbacks.
1146  *
1147  * This interface function adds a new thermal cooling device (fan/processor/...)
1148  * to /sys/class/thermal/ folder as cooling_device[0-*]. It tries to bind itself
1149  * to all the thermal zone devices registered at the same time.
1150  *
1151  * Return: a pointer to the created struct thermal_cooling_device or an
1152  * ERR_PTR. Caller must check return value with IS_ERR*() helpers.
1153  */
1154 struct thermal_cooling_device *
1155 thermal_cooling_device_register(const char *type, void *devdata,
1156 				const struct thermal_cooling_device_ops *ops)
1157 {
1158 	return __thermal_cooling_device_register(NULL, type, devdata, ops);
1159 }
1160 EXPORT_SYMBOL_GPL(thermal_cooling_device_register);
1161 
1162 /**
1163  * thermal_of_cooling_device_register() - register an OF thermal cooling device
1164  * @np:		a pointer to a device tree node.
1165  * @type:	the thermal cooling device type.
1166  * @devdata:	device private data.
1167  * @ops:		standard thermal cooling devices callbacks.
1168  *
1169  * This function will register a cooling device with device tree node reference.
1170  * This interface function adds a new thermal cooling device (fan/processor/...)
1171  * to /sys/class/thermal/ folder as cooling_device[0-*]. It tries to bind itself
1172  * to all the thermal zone devices registered at the same time.
1173  *
1174  * Return: a pointer to the created struct thermal_cooling_device or an
1175  * ERR_PTR. Caller must check return value with IS_ERR*() helpers.
1176  */
1177 struct thermal_cooling_device *
1178 thermal_of_cooling_device_register(struct device_node *np,
1179 				   const char *type, void *devdata,
1180 				   const struct thermal_cooling_device_ops *ops)
1181 {
1182 	return __thermal_cooling_device_register(np, type, devdata, ops);
1183 }
1184 EXPORT_SYMBOL_GPL(thermal_of_cooling_device_register);
1185 
1186 static void thermal_cooling_device_release(struct device *dev, void *res)
1187 {
1188 	thermal_cooling_device_unregister(
1189 				*(struct thermal_cooling_device **)res);
1190 }
1191 
1192 /**
1193  * devm_thermal_of_cooling_device_register() - register an OF thermal cooling
1194  *					       device
1195  * @dev:	a valid struct device pointer of a sensor device.
1196  * @np:		a pointer to a device tree node.
1197  * @type:	the thermal cooling device type.
1198  * @devdata:	device private data.
1199  * @ops:	standard thermal cooling devices callbacks.
1200  *
1201  * This function will register a cooling device with device tree node reference.
1202  * This interface function adds a new thermal cooling device (fan/processor/...)
1203  * to /sys/class/thermal/ folder as cooling_device[0-*]. It tries to bind itself
1204  * to all the thermal zone devices registered at the same time.
1205  *
1206  * Return: a pointer to the created struct thermal_cooling_device or an
1207  * ERR_PTR. Caller must check return value with IS_ERR*() helpers.
1208  */
1209 struct thermal_cooling_device *
1210 devm_thermal_of_cooling_device_register(struct device *dev,
1211 				struct device_node *np,
1212 				const char *type, void *devdata,
1213 				const struct thermal_cooling_device_ops *ops)
1214 {
1215 	struct thermal_cooling_device **ptr, *tcd;
1216 
1217 	ptr = devres_alloc(thermal_cooling_device_release, sizeof(*ptr),
1218 			   GFP_KERNEL);
1219 	if (!ptr)
1220 		return ERR_PTR(-ENOMEM);
1221 
1222 	tcd = __thermal_cooling_device_register(np, type, devdata, ops);
1223 	if (IS_ERR(tcd)) {
1224 		devres_free(ptr);
1225 		return tcd;
1226 	}
1227 
1228 	*ptr = tcd;
1229 	devres_add(dev, ptr);
1230 
1231 	return tcd;
1232 }
1233 EXPORT_SYMBOL_GPL(devm_thermal_of_cooling_device_register);
1234 
1235 static bool thermal_cooling_device_present(struct thermal_cooling_device *cdev)
1236 {
1237 	struct thermal_cooling_device *pos = NULL;
1238 
1239 	list_for_each_entry(pos, &thermal_cdev_list, node) {
1240 		if (pos == cdev)
1241 			return true;
1242 	}
1243 
1244 	return false;
1245 }
1246 
1247 /**
1248  * thermal_cooling_device_update - Update a cooling device object
1249  * @cdev: Target cooling device.
1250  *
1251  * Update @cdev to reflect a change of the underlying hardware or platform.
1252  *
1253  * Must be called when the maximum cooling state of @cdev becomes invalid and so
1254  * its .get_max_state() callback needs to be run to produce the new maximum
1255  * cooling state value.
1256  */
1257 void thermal_cooling_device_update(struct thermal_cooling_device *cdev)
1258 {
1259 	struct thermal_instance *ti;
1260 	unsigned long state;
1261 
1262 	if (IS_ERR_OR_NULL(cdev))
1263 		return;
1264 
1265 	/*
1266 	 * Hold thermal_list_lock throughout the update to prevent the device
1267 	 * from going away while being updated.
1268 	 */
1269 	guard(mutex)(&thermal_list_lock);
1270 
1271 	if (!thermal_cooling_device_present(cdev))
1272 		return;
1273 
1274 	/*
1275 	 * Update under the cdev lock to prevent the state from being set beyond
1276 	 * the new limit concurrently.
1277 	 */
1278 	guard(cooling_dev)(cdev);
1279 
1280 	if (cdev->ops->get_max_state(cdev, &cdev->max_state))
1281 		return;
1282 
1283 	thermal_cooling_device_stats_reinit(cdev);
1284 
1285 	list_for_each_entry(ti, &cdev->thermal_instances, cdev_node) {
1286 		if (ti->upper == cdev->max_state)
1287 			continue;
1288 
1289 		if (ti->upper < cdev->max_state) {
1290 			if (ti->upper_no_limit)
1291 				ti->upper = cdev->max_state;
1292 
1293 			continue;
1294 		}
1295 
1296 		ti->upper = cdev->max_state;
1297 		if (ti->lower > ti->upper)
1298 			ti->lower = ti->upper;
1299 
1300 		if (ti->target == THERMAL_NO_TARGET)
1301 			continue;
1302 
1303 		if (ti->target > ti->upper)
1304 			ti->target = ti->upper;
1305 	}
1306 
1307 	if (cdev->ops->get_cur_state(cdev, &state) || state > cdev->max_state)
1308 		return;
1309 
1310 	thermal_cooling_device_stats_update(cdev, state);
1311 }
1312 EXPORT_SYMBOL_GPL(thermal_cooling_device_update);
1313 
1314 static void __thermal_zone_cdev_unbind(struct thermal_zone_device *tz,
1315 				       struct thermal_cooling_device *cdev)
1316 {
1317 	struct thermal_trip_desc *td;
1318 
1319 	for_each_trip_desc(tz, td)
1320 		thermal_unbind_cdev_from_trip(tz, td, cdev);
1321 }
1322 
1323 static void thermal_zone_cdev_unbind(struct thermal_zone_device *tz,
1324 				     struct thermal_cooling_device *cdev)
1325 {
1326 	guard(thermal_zone)(tz);
1327 
1328 	__thermal_zone_cdev_unbind(tz, cdev);
1329 }
1330 
1331 static bool thermal_cooling_device_exit(struct thermal_cooling_device *cdev)
1332 {
1333 	struct thermal_zone_device *tz;
1334 
1335 	guard(mutex)(&thermal_list_lock);
1336 
1337 	if (!thermal_cooling_device_present(cdev))
1338 		return false;
1339 
1340 	list_del(&cdev->node);
1341 
1342 	list_for_each_entry(tz, &thermal_tz_list, node)
1343 		thermal_zone_cdev_unbind(tz, cdev);
1344 
1345 	return true;
1346 }
1347 
1348 /**
1349  * thermal_cooling_device_unregister() - removes a thermal cooling device
1350  * @cdev: Thermal cooling device to remove.
1351  */
1352 void thermal_cooling_device_unregister(struct thermal_cooling_device *cdev)
1353 {
1354 	if (!cdev)
1355 		return;
1356 
1357 	thermal_debug_cdev_remove(cdev);
1358 
1359 	if (thermal_cooling_device_exit(cdev))
1360 		device_unregister(&cdev->device);
1361 }
1362 EXPORT_SYMBOL_GPL(thermal_cooling_device_unregister);
1363 
1364 int thermal_zone_get_crit_temp(struct thermal_zone_device *tz, int *temp)
1365 {
1366 	const struct thermal_trip_desc *td;
1367 	int ret = -EINVAL;
1368 
1369 	if (tz->ops.get_crit_temp)
1370 		return tz->ops.get_crit_temp(tz, temp);
1371 
1372 	guard(thermal_zone)(tz);
1373 
1374 	for_each_trip_desc(tz, td) {
1375 		const struct thermal_trip *trip = &td->trip;
1376 
1377 		if (trip->type == THERMAL_TRIP_CRITICAL) {
1378 			*temp = trip->temperature;
1379 			ret = 0;
1380 			break;
1381 		}
1382 	}
1383 
1384 	return ret;
1385 }
1386 EXPORT_SYMBOL_GPL(thermal_zone_get_crit_temp);
1387 
1388 static void thermal_zone_device_check(struct work_struct *work)
1389 {
1390 	struct thermal_zone_device *tz = container_of(work, struct
1391 						      thermal_zone_device,
1392 						      poll_queue.work);
1393 	thermal_zone_device_update(tz, THERMAL_EVENT_UNSPECIFIED);
1394 }
1395 
1396 static void thermal_zone_device_init(struct thermal_zone_device *tz)
1397 {
1398 	struct thermal_trip_desc *td, *next;
1399 
1400 	INIT_DELAYED_WORK(&tz->poll_queue, thermal_zone_device_check);
1401 
1402 	tz->temperature = THERMAL_TEMP_INIT;
1403 	tz->passive = 0;
1404 	tz->prev_low_trip = -INT_MAX;
1405 	tz->prev_high_trip = INT_MAX;
1406 	for_each_trip_desc(tz, td) {
1407 		struct thermal_instance *instance;
1408 
1409 		list_for_each_entry(instance, &td->thermal_instances, trip_node)
1410 			instance->initialized = false;
1411 	}
1412 	/*
1413 	 * At this point, all valid trips need to be moved to trips_high so that
1414 	 * mitigation can be started if the zone temperature is above them.
1415 	 */
1416 	list_for_each_entry_safe(td, next, &tz->trips_invalid, list_node) {
1417 		if (td->trip.temperature != THERMAL_TEMP_INVALID)
1418 			move_to_trips_high(tz, td);
1419 	}
1420 	/* The trips_reached list may not be empty during system resume. */
1421 	list_for_each_entry_safe(td, next, &tz->trips_reached, list_node) {
1422 		if (td->trip.temperature == THERMAL_TEMP_INVALID)
1423 			move_to_trips_invalid(tz, td);
1424 		else
1425 			move_to_trips_high(tz, td);
1426 	}
1427 }
1428 
1429 static int thermal_zone_init_governor(struct thermal_zone_device *tz)
1430 {
1431 	struct thermal_governor *governor;
1432 
1433 	guard(mutex)(&thermal_governor_lock);
1434 
1435 	if (tz->tzp)
1436 		governor = __find_governor(tz->tzp->governor_name);
1437 	else
1438 		governor = def_governor;
1439 
1440 	return thermal_set_governor(tz, governor);
1441 }
1442 
1443 static void thermal_zone_init_complete(struct thermal_zone_device *tz)
1444 {
1445 	struct thermal_cooling_device *cdev;
1446 
1447 	guard(mutex)(&thermal_list_lock);
1448 
1449 	list_add_tail(&tz->node, &thermal_tz_list);
1450 
1451 	guard(thermal_zone)(tz);
1452 
1453 	/* Bind cooling devices for this zone. */
1454 	list_for_each_entry(cdev, &thermal_cdev_list, node)
1455 		__thermal_zone_cdev_bind(tz, cdev);
1456 
1457 	tz->state &= ~TZ_STATE_FLAG_INIT;
1458 	/*
1459 	 * If system suspend or resume is in progress at this point, the
1460 	 * new thermal zone needs to be marked as suspended because
1461 	 * thermal_pm_notify() has run already.
1462 	 */
1463 	if (thermal_pm_suspended)
1464 		tz->state |= TZ_STATE_FLAG_SUSPENDED;
1465 
1466 	__thermal_zone_device_update(tz, THERMAL_EVENT_UNSPECIFIED);
1467 }
1468 
1469 /**
1470  * thermal_zone_device_register_with_trips() - register a new thermal zone device
1471  * @type:	the thermal zone device type
1472  * @trips:	a pointer to an array of thermal trips
1473  * @num_trips:	the number of trip points the thermal zone support
1474  * @devdata:	private device data
1475  * @ops:	standard thermal zone device callbacks
1476  * @tzp:	thermal zone platform parameters
1477  * @passive_delay: number of milliseconds to wait between polls when
1478  *		   performing passive cooling
1479  * @polling_delay: number of milliseconds to wait between polls when checking
1480  *		   whether trip points have been crossed (0 for interrupt
1481  *		   driven systems)
1482  *
1483  * This interface function adds a new thermal zone device (sensor) to
1484  * /sys/class/thermal folder as thermal_zone[0-*]. It tries to bind all the
1485  * thermal cooling devices registered at the same time.
1486  * thermal_zone_device_unregister() must be called when the device is no
1487  * longer needed. The passive cooling depends on the .get_trend() return value.
1488  *
1489  * Return: a pointer to the created struct thermal_zone_device or an
1490  * in case of error, an ERR_PTR. Caller must check return value with
1491  * IS_ERR*() helpers.
1492  */
1493 struct thermal_zone_device *
1494 thermal_zone_device_register_with_trips(const char *type,
1495 					const struct thermal_trip *trips,
1496 					int num_trips, void *devdata,
1497 					const struct thermal_zone_device_ops *ops,
1498 					const struct thermal_zone_params *tzp,
1499 					unsigned int passive_delay,
1500 					unsigned int polling_delay)
1501 {
1502 	const struct thermal_trip *trip = trips;
1503 	struct thermal_zone_device *tz;
1504 	struct thermal_trip_desc *td;
1505 	int id;
1506 	int result;
1507 
1508 	if (!type || strlen(type) == 0) {
1509 		pr_err("No thermal zone type defined\n");
1510 		return ERR_PTR(-EINVAL);
1511 	}
1512 
1513 	if (strlen(type) >= THERMAL_NAME_LENGTH) {
1514 		pr_err("Thermal zone name (%s) too long, should be under %d chars\n",
1515 		       type, THERMAL_NAME_LENGTH);
1516 		return ERR_PTR(-EINVAL);
1517 	}
1518 
1519 	if (num_trips < 0) {
1520 		pr_err("Incorrect number of thermal trips\n");
1521 		return ERR_PTR(-EINVAL);
1522 	}
1523 
1524 	if (!ops || !ops->get_temp) {
1525 		pr_err("Thermal zone device ops not defined or invalid\n");
1526 		return ERR_PTR(-EINVAL);
1527 	}
1528 
1529 	if (num_trips > 0 && !trips)
1530 		return ERR_PTR(-EINVAL);
1531 
1532 	if (polling_delay && passive_delay > polling_delay)
1533 		return ERR_PTR(-EINVAL);
1534 
1535 	if (!thermal_class)
1536 		return ERR_PTR(-ENODEV);
1537 
1538 	tz = kzalloc(struct_size(tz, trips, num_trips), GFP_KERNEL);
1539 	if (!tz)
1540 		return ERR_PTR(-ENOMEM);
1541 
1542 	if (tzp) {
1543 		tz->tzp = kmemdup(tzp, sizeof(*tzp), GFP_KERNEL);
1544 		if (!tz->tzp) {
1545 			result = -ENOMEM;
1546 			goto free_tz;
1547 		}
1548 	}
1549 
1550 	INIT_LIST_HEAD(&tz->node);
1551 	INIT_LIST_HEAD(&tz->trips_high);
1552 	INIT_LIST_HEAD(&tz->trips_reached);
1553 	INIT_LIST_HEAD(&tz->trips_invalid);
1554 	ida_init(&tz->ida);
1555 	mutex_init(&tz->lock);
1556 	init_completion(&tz->removal);
1557 	init_completion(&tz->resume);
1558 	id = ida_alloc(&thermal_tz_ida, GFP_KERNEL);
1559 	if (id < 0) {
1560 		result = id;
1561 		goto free_tzp;
1562 	}
1563 
1564 	tz->id = id;
1565 	strscpy(tz->type, type, sizeof(tz->type));
1566 
1567 	tz->ops = *ops;
1568 	if (!tz->ops.critical)
1569 		tz->ops.critical = thermal_zone_device_critical;
1570 
1571 	tz->device.class = thermal_class;
1572 	tz->devdata = devdata;
1573 	tz->num_trips = num_trips;
1574 	for_each_trip_desc(tz, td) {
1575 		td->trip = *trip++;
1576 		INIT_LIST_HEAD(&td->thermal_instances);
1577 		INIT_LIST_HEAD(&td->list_node);
1578 		/*
1579 		 * Mark all thresholds as invalid to start with even though
1580 		 * this only matters for the trips that start as invalid and
1581 		 * become valid later.
1582 		 */
1583 		move_to_trips_invalid(tz, td);
1584 	}
1585 
1586 	tz->polling_delay_jiffies = msecs_to_jiffies(polling_delay);
1587 	tz->passive_delay_jiffies = msecs_to_jiffies(passive_delay);
1588 	tz->recheck_delay_jiffies = THERMAL_RECHECK_DELAY;
1589 
1590 	tz->state = TZ_STATE_FLAG_INIT;
1591 
1592 	/* sys I/F */
1593 	/* Add nodes that are always present via .groups */
1594 	result = thermal_zone_create_device_groups(tz);
1595 	if (result)
1596 		goto remove_id;
1597 
1598 	result = dev_set_name(&tz->device, "thermal_zone%d", tz->id);
1599 	if (result) {
1600 		thermal_zone_destroy_device_groups(tz);
1601 		goto remove_id;
1602 	}
1603 	thermal_zone_device_init(tz);
1604 	result = device_register(&tz->device);
1605 	if (result)
1606 		goto release_device;
1607 
1608 	result = thermal_zone_init_governor(tz);
1609 	if (result)
1610 		goto unregister;
1611 
1612 	if (!tz->tzp || !tz->tzp->no_hwmon) {
1613 		result = thermal_add_hwmon_sysfs(tz);
1614 		if (result)
1615 			goto unregister;
1616 	}
1617 
1618 	result = thermal_thresholds_init(tz);
1619 	if (result)
1620 		goto remove_hwmon;
1621 
1622 	thermal_zone_init_complete(tz);
1623 
1624 	thermal_notify_tz_create(tz);
1625 
1626 	thermal_debug_tz_add(tz);
1627 
1628 	return tz;
1629 
1630 remove_hwmon:
1631 	thermal_remove_hwmon_sysfs(tz);
1632 unregister:
1633 	device_del(&tz->device);
1634 release_device:
1635 	put_device(&tz->device);
1636 remove_id:
1637 	ida_free(&thermal_tz_ida, id);
1638 free_tzp:
1639 	kfree(tz->tzp);
1640 free_tz:
1641 	kfree(tz);
1642 	return ERR_PTR(result);
1643 }
1644 EXPORT_SYMBOL_GPL(thermal_zone_device_register_with_trips);
1645 
1646 struct thermal_zone_device *thermal_tripless_zone_device_register(
1647 					const char *type,
1648 					void *devdata,
1649 					const struct thermal_zone_device_ops *ops,
1650 					const struct thermal_zone_params *tzp)
1651 {
1652 	return thermal_zone_device_register_with_trips(type, NULL, 0, devdata,
1653 						       ops, tzp, 0, 0);
1654 }
1655 EXPORT_SYMBOL_GPL(thermal_tripless_zone_device_register);
1656 
1657 void *thermal_zone_device_priv(struct thermal_zone_device *tzd)
1658 {
1659 	return tzd->devdata;
1660 }
1661 EXPORT_SYMBOL_GPL(thermal_zone_device_priv);
1662 
1663 const char *thermal_zone_device_type(struct thermal_zone_device *tzd)
1664 {
1665 	return tzd->type;
1666 }
1667 EXPORT_SYMBOL_GPL(thermal_zone_device_type);
1668 
1669 int thermal_zone_device_id(struct thermal_zone_device *tzd)
1670 {
1671 	return tzd->id;
1672 }
1673 EXPORT_SYMBOL_GPL(thermal_zone_device_id);
1674 
1675 struct device *thermal_zone_device(struct thermal_zone_device *tzd)
1676 {
1677 	return &tzd->device;
1678 }
1679 EXPORT_SYMBOL_GPL(thermal_zone_device);
1680 
1681 static bool thermal_zone_exit(struct thermal_zone_device *tz)
1682 {
1683 	struct thermal_cooling_device *cdev;
1684 
1685 	guard(mutex)(&thermal_list_lock);
1686 
1687 	if (list_empty(&tz->node))
1688 		return false;
1689 
1690 	guard(thermal_zone)(tz);
1691 
1692 	tz->state |= TZ_STATE_FLAG_EXIT;
1693 	list_del_init(&tz->node);
1694 
1695 	/* Unbind all cdevs associated with this thermal zone. */
1696 	list_for_each_entry(cdev, &thermal_cdev_list, node)
1697 		__thermal_zone_cdev_unbind(tz, cdev);
1698 
1699 	return true;
1700 }
1701 
1702 /**
1703  * thermal_zone_device_unregister - removes the registered thermal zone device
1704  * @tz: the thermal zone device to remove
1705  */
1706 void thermal_zone_device_unregister(struct thermal_zone_device *tz)
1707 {
1708 	if (!tz)
1709 		return;
1710 
1711 	thermal_debug_tz_remove(tz);
1712 
1713 	if (!thermal_zone_exit(tz))
1714 		return;
1715 
1716 	cancel_delayed_work_sync(&tz->poll_queue);
1717 
1718 	thermal_set_governor(tz, NULL);
1719 
1720 	thermal_thresholds_exit(tz);
1721 	thermal_remove_hwmon_sysfs(tz);
1722 	ida_free(&thermal_tz_ida, tz->id);
1723 	ida_destroy(&tz->ida);
1724 
1725 	device_del(&tz->device);
1726 	put_device(&tz->device);
1727 
1728 	thermal_notify_tz_delete(tz);
1729 
1730 	wait_for_completion(&tz->removal);
1731 	kfree(tz->tzp);
1732 	kfree(tz);
1733 }
1734 EXPORT_SYMBOL_GPL(thermal_zone_device_unregister);
1735 
1736 /**
1737  * thermal_zone_get_zone_by_name() - search for a zone and returns its ref
1738  * @name: thermal zone name to fetch the temperature
1739  *
1740  * When only one zone is found with the passed name, returns a reference to it.
1741  *
1742  * Return: On success returns a reference to an unique thermal zone with
1743  * matching name equals to @name, an ERR_PTR otherwise (-EINVAL for invalid
1744  * paramenters, -ENODEV for not found and -EEXIST for multiple matches).
1745  */
1746 struct thermal_zone_device *thermal_zone_get_zone_by_name(const char *name)
1747 {
1748 	struct thermal_zone_device *pos = NULL, *ref = ERR_PTR(-EINVAL);
1749 	unsigned int found = 0;
1750 
1751 	if (!name)
1752 		return ERR_PTR(-EINVAL);
1753 
1754 	guard(mutex)(&thermal_list_lock);
1755 
1756 	list_for_each_entry(pos, &thermal_tz_list, node)
1757 		if (!strncasecmp(name, pos->type, THERMAL_NAME_LENGTH)) {
1758 			found++;
1759 			ref = pos;
1760 		}
1761 
1762 	if (!found)
1763 		return ERR_PTR(-ENODEV);
1764 
1765 	/* Success only when one zone is found. */
1766 	if (found > 1)
1767 		return ERR_PTR(-EEXIST);
1768 
1769 	return ref;
1770 }
1771 EXPORT_SYMBOL_GPL(thermal_zone_get_zone_by_name);
1772 
1773 static void thermal_zone_device_resume(struct work_struct *work)
1774 {
1775 	struct thermal_zone_device *tz;
1776 
1777 	tz = container_of(work, struct thermal_zone_device, poll_queue.work);
1778 
1779 	guard(thermal_zone)(tz);
1780 
1781 	tz->state &= ~(TZ_STATE_FLAG_SUSPENDED | TZ_STATE_FLAG_RESUMING);
1782 
1783 	thermal_debug_tz_resume(tz);
1784 	thermal_zone_device_init(tz);
1785 	thermal_governor_update_tz(tz, THERMAL_TZ_RESUME);
1786 	__thermal_zone_device_update(tz, THERMAL_TZ_RESUME);
1787 
1788 	complete(&tz->resume);
1789 }
1790 
1791 static void thermal_zone_pm_prepare(struct thermal_zone_device *tz)
1792 {
1793 	guard(thermal_zone)(tz);
1794 
1795 	if (tz->state & TZ_STATE_FLAG_RESUMING) {
1796 		/*
1797 		 * thermal_zone_device_resume() queued up for this zone has not
1798 		 * acquired the lock yet, so release it to let the function run
1799 		 * and wait util it has done the work.
1800 		 */
1801 		scoped_guard(thermal_zone_reverse, tz) {
1802 			wait_for_completion(&tz->resume);
1803 		}
1804 	}
1805 
1806 	tz->state |= TZ_STATE_FLAG_SUSPENDED;
1807 }
1808 
1809 static void thermal_pm_notify_prepare(void)
1810 {
1811 	struct thermal_zone_device *tz;
1812 
1813 	guard(mutex)(&thermal_list_lock);
1814 
1815 	thermal_pm_suspended = true;
1816 
1817 	list_for_each_entry(tz, &thermal_tz_list, node)
1818 		thermal_zone_pm_prepare(tz);
1819 }
1820 
1821 static void thermal_zone_pm_complete(struct thermal_zone_device *tz)
1822 {
1823 	guard(thermal_zone)(tz);
1824 
1825 	cancel_delayed_work(&tz->poll_queue);
1826 
1827 	reinit_completion(&tz->resume);
1828 	tz->state |= TZ_STATE_FLAG_RESUMING;
1829 
1830 	/*
1831 	 * Replace the work function with the resume one, which will restore the
1832 	 * original work function and schedule the polling work if needed.
1833 	 */
1834 	INIT_DELAYED_WORK(&tz->poll_queue, thermal_zone_device_resume);
1835 	/* Queue up the work without a delay. */
1836 	mod_delayed_work(system_freezable_power_efficient_wq, &tz->poll_queue, 0);
1837 }
1838 
1839 static void thermal_pm_notify_complete(void)
1840 {
1841 	struct thermal_zone_device *tz;
1842 
1843 	guard(mutex)(&thermal_list_lock);
1844 
1845 	thermal_pm_suspended = false;
1846 
1847 	list_for_each_entry(tz, &thermal_tz_list, node)
1848 		thermal_zone_pm_complete(tz);
1849 }
1850 
1851 static int thermal_pm_notify(struct notifier_block *nb,
1852 			     unsigned long mode, void *_unused)
1853 {
1854 	switch (mode) {
1855 	case PM_HIBERNATION_PREPARE:
1856 	case PM_RESTORE_PREPARE:
1857 	case PM_SUSPEND_PREPARE:
1858 		thermal_pm_notify_prepare();
1859 		break;
1860 	case PM_POST_HIBERNATION:
1861 	case PM_POST_RESTORE:
1862 	case PM_POST_SUSPEND:
1863 		thermal_pm_notify_complete();
1864 		break;
1865 	default:
1866 		break;
1867 	}
1868 	return 0;
1869 }
1870 
1871 static struct notifier_block thermal_pm_nb = {
1872 	.notifier_call = thermal_pm_notify,
1873 	/*
1874 	 * Run at the lowest priority to avoid interference between the thermal
1875 	 * zone resume work items spawned by thermal_pm_notify() and the other
1876 	 * PM notifiers.
1877 	 */
1878 	.priority = INT_MIN,
1879 };
1880 
1881 static int __init thermal_init(void)
1882 {
1883 	int result;
1884 
1885 	thermal_debug_init();
1886 
1887 	result = thermal_netlink_init();
1888 	if (result)
1889 		goto error;
1890 
1891 	result = thermal_register_governors();
1892 	if (result)
1893 		goto unregister_netlink;
1894 
1895 	thermal_class = kzalloc(sizeof(*thermal_class), GFP_KERNEL);
1896 	if (!thermal_class) {
1897 		result = -ENOMEM;
1898 		goto unregister_governors;
1899 	}
1900 
1901 	thermal_class->name = "thermal";
1902 	thermal_class->dev_release = thermal_release;
1903 
1904 	result = class_register(thermal_class);
1905 	if (result) {
1906 		kfree(thermal_class);
1907 		thermal_class = NULL;
1908 		goto unregister_governors;
1909 	}
1910 
1911 	result = register_pm_notifier(&thermal_pm_nb);
1912 	if (result)
1913 		pr_warn("Thermal: Can not register suspend notifier, return %d\n",
1914 			result);
1915 
1916 	return 0;
1917 
1918 unregister_governors:
1919 	thermal_unregister_governors();
1920 unregister_netlink:
1921 	thermal_netlink_exit();
1922 error:
1923 	mutex_destroy(&thermal_list_lock);
1924 	mutex_destroy(&thermal_governor_lock);
1925 	return result;
1926 }
1927 postcore_initcall(thermal_init);
1928