xref: /linux/kernel/time/tick-broadcast.c (revision e8cdfb0509f48d44d95d68d4f42d8d71a9ba4acd)
1 /*
2  * linux/kernel/time/tick-broadcast.c
3  *
4  * This file contains functions which emulate a local clock-event
5  * device via a broadcast event source.
6  *
7  * Copyright(C) 2005-2006, Thomas Gleixner <tglx@linutronix.de>
8  * Copyright(C) 2005-2007, Red Hat, Inc., Ingo Molnar
9  * Copyright(C) 2006-2007, Timesys Corp., Thomas Gleixner
10  *
11  * This code is licenced under the GPL version 2. For details see
12  * kernel-base/COPYING.
13  */
14 #include <linux/cpu.h>
15 #include <linux/err.h>
16 #include <linux/hrtimer.h>
17 #include <linux/interrupt.h>
18 #include <linux/percpu.h>
19 #include <linux/profile.h>
20 #include <linux/sched.h>
21 #include <linux/tick.h>
22 
23 #include "tick-internal.h"
24 
25 /*
26  * Broadcast support for broken x86 hardware, where the local apic
27  * timer stops in C3 state.
28  */
29 
30 static struct tick_device tick_broadcast_device;
31 /* FIXME: Use cpumask_var_t. */
32 static DECLARE_BITMAP(tick_broadcast_mask, NR_CPUS);
33 static DECLARE_BITMAP(tmpmask, NR_CPUS);
34 static DEFINE_RAW_SPINLOCK(tick_broadcast_lock);
35 static int tick_broadcast_force;
36 
37 #ifdef CONFIG_TICK_ONESHOT
38 static void tick_broadcast_clear_oneshot(int cpu);
39 #else
40 static inline void tick_broadcast_clear_oneshot(int cpu) { }
41 #endif
42 
43 /*
44  * Debugging: see timer_list.c
45  */
46 struct tick_device *tick_get_broadcast_device(void)
47 {
48 	return &tick_broadcast_device;
49 }
50 
51 struct cpumask *tick_get_broadcast_mask(void)
52 {
53 	return to_cpumask(tick_broadcast_mask);
54 }
55 
56 /*
57  * Start the device in periodic mode
58  */
59 static void tick_broadcast_start_periodic(struct clock_event_device *bc)
60 {
61 	if (bc)
62 		tick_setup_periodic(bc, 1);
63 }
64 
65 /*
66  * Check, if the device can be utilized as broadcast device:
67  */
68 int tick_check_broadcast_device(struct clock_event_device *dev)
69 {
70 	if ((tick_broadcast_device.evtdev &&
71 	     tick_broadcast_device.evtdev->rating >= dev->rating) ||
72 	     (dev->features & CLOCK_EVT_FEAT_C3STOP))
73 		return 0;
74 
75 	clockevents_exchange_device(NULL, dev);
76 	tick_broadcast_device.evtdev = dev;
77 	if (!cpumask_empty(tick_get_broadcast_mask()))
78 		tick_broadcast_start_periodic(dev);
79 	return 1;
80 }
81 
82 /*
83  * Check, if the device is the broadcast device
84  */
85 int tick_is_broadcast_device(struct clock_event_device *dev)
86 {
87 	return (dev && tick_broadcast_device.evtdev == dev);
88 }
89 
90 /*
91  * Check, if the device is disfunctional and a place holder, which
92  * needs to be handled by the broadcast device.
93  */
94 int tick_device_uses_broadcast(struct clock_event_device *dev, int cpu)
95 {
96 	unsigned long flags;
97 	int ret = 0;
98 
99 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
100 
101 	/*
102 	 * Devices might be registered with both periodic and oneshot
103 	 * mode disabled. This signals, that the device needs to be
104 	 * operated from the broadcast device and is a placeholder for
105 	 * the cpu local device.
106 	 */
107 	if (!tick_device_is_functional(dev)) {
108 		dev->event_handler = tick_handle_periodic;
109 		cpumask_set_cpu(cpu, tick_get_broadcast_mask());
110 		tick_broadcast_start_periodic(tick_broadcast_device.evtdev);
111 		ret = 1;
112 	} else {
113 		/*
114 		 * When the new device is not affected by the stop
115 		 * feature and the cpu is marked in the broadcast mask
116 		 * then clear the broadcast bit.
117 		 */
118 		if (!(dev->features & CLOCK_EVT_FEAT_C3STOP)) {
119 			int cpu = smp_processor_id();
120 
121 			cpumask_clear_cpu(cpu, tick_get_broadcast_mask());
122 			tick_broadcast_clear_oneshot(cpu);
123 		}
124 	}
125 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
126 	return ret;
127 }
128 
129 /*
130  * Broadcast the event to the cpus, which are set in the mask (mangled).
131  */
132 static void tick_do_broadcast(struct cpumask *mask)
133 {
134 	int cpu = smp_processor_id();
135 	struct tick_device *td;
136 
137 	/*
138 	 * Check, if the current cpu is in the mask
139 	 */
140 	if (cpumask_test_cpu(cpu, mask)) {
141 		cpumask_clear_cpu(cpu, mask);
142 		td = &per_cpu(tick_cpu_device, cpu);
143 		td->evtdev->event_handler(td->evtdev);
144 	}
145 
146 	if (!cpumask_empty(mask)) {
147 		/*
148 		 * It might be necessary to actually check whether the devices
149 		 * have different broadcast functions. For now, just use the
150 		 * one of the first device. This works as long as we have this
151 		 * misfeature only on x86 (lapic)
152 		 */
153 		td = &per_cpu(tick_cpu_device, cpumask_first(mask));
154 		td->evtdev->broadcast(mask);
155 	}
156 }
157 
158 /*
159  * Periodic broadcast:
160  * - invoke the broadcast handlers
161  */
162 static void tick_do_periodic_broadcast(void)
163 {
164 	raw_spin_lock(&tick_broadcast_lock);
165 
166 	cpumask_and(to_cpumask(tmpmask),
167 		    cpu_online_mask, tick_get_broadcast_mask());
168 	tick_do_broadcast(to_cpumask(tmpmask));
169 
170 	raw_spin_unlock(&tick_broadcast_lock);
171 }
172 
173 /*
174  * Event handler for periodic broadcast ticks
175  */
176 static void tick_handle_periodic_broadcast(struct clock_event_device *dev)
177 {
178 	ktime_t next;
179 
180 	tick_do_periodic_broadcast();
181 
182 	/*
183 	 * The device is in periodic mode. No reprogramming necessary:
184 	 */
185 	if (dev->mode == CLOCK_EVT_MODE_PERIODIC)
186 		return;
187 
188 	/*
189 	 * Setup the next period for devices, which do not have
190 	 * periodic mode. We read dev->next_event first and add to it
191 	 * when the event already expired. clockevents_program_event()
192 	 * sets dev->next_event only when the event is really
193 	 * programmed to the device.
194 	 */
195 	for (next = dev->next_event; ;) {
196 		next = ktime_add(next, tick_period);
197 
198 		if (!clockevents_program_event(dev, next, ktime_get()))
199 			return;
200 		tick_do_periodic_broadcast();
201 	}
202 }
203 
204 /*
205  * Powerstate information: The system enters/leaves a state, where
206  * affected devices might stop
207  */
208 static void tick_do_broadcast_on_off(unsigned long *reason)
209 {
210 	struct clock_event_device *bc, *dev;
211 	struct tick_device *td;
212 	unsigned long flags;
213 	int cpu, bc_stopped;
214 
215 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
216 
217 	cpu = smp_processor_id();
218 	td = &per_cpu(tick_cpu_device, cpu);
219 	dev = td->evtdev;
220 	bc = tick_broadcast_device.evtdev;
221 
222 	/*
223 	 * Is the device not affected by the powerstate ?
224 	 */
225 	if (!dev || !(dev->features & CLOCK_EVT_FEAT_C3STOP))
226 		goto out;
227 
228 	if (!tick_device_is_functional(dev))
229 		goto out;
230 
231 	bc_stopped = cpumask_empty(tick_get_broadcast_mask());
232 
233 	switch (*reason) {
234 	case CLOCK_EVT_NOTIFY_BROADCAST_ON:
235 	case CLOCK_EVT_NOTIFY_BROADCAST_FORCE:
236 		if (!cpumask_test_cpu(cpu, tick_get_broadcast_mask())) {
237 			cpumask_set_cpu(cpu, tick_get_broadcast_mask());
238 			if (tick_broadcast_device.mode ==
239 			    TICKDEV_MODE_PERIODIC)
240 				clockevents_shutdown(dev);
241 		}
242 		if (*reason == CLOCK_EVT_NOTIFY_BROADCAST_FORCE)
243 			tick_broadcast_force = 1;
244 		break;
245 	case CLOCK_EVT_NOTIFY_BROADCAST_OFF:
246 		if (!tick_broadcast_force &&
247 		    cpumask_test_cpu(cpu, tick_get_broadcast_mask())) {
248 			cpumask_clear_cpu(cpu, tick_get_broadcast_mask());
249 			if (tick_broadcast_device.mode ==
250 			    TICKDEV_MODE_PERIODIC)
251 				tick_setup_periodic(dev, 0);
252 		}
253 		break;
254 	}
255 
256 	if (cpumask_empty(tick_get_broadcast_mask())) {
257 		if (!bc_stopped)
258 			clockevents_shutdown(bc);
259 	} else if (bc_stopped) {
260 		if (tick_broadcast_device.mode == TICKDEV_MODE_PERIODIC)
261 			tick_broadcast_start_periodic(bc);
262 		else
263 			tick_broadcast_setup_oneshot(bc);
264 	}
265 out:
266 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
267 }
268 
269 /*
270  * Powerstate information: The system enters/leaves a state, where
271  * affected devices might stop.
272  */
273 void tick_broadcast_on_off(unsigned long reason, int *oncpu)
274 {
275 	if (!cpumask_test_cpu(*oncpu, cpu_online_mask))
276 		printk(KERN_ERR "tick-broadcast: ignoring broadcast for "
277 		       "offline CPU #%d\n", *oncpu);
278 	else
279 		tick_do_broadcast_on_off(&reason);
280 }
281 
282 /*
283  * Set the periodic handler depending on broadcast on/off
284  */
285 void tick_set_periodic_handler(struct clock_event_device *dev, int broadcast)
286 {
287 	if (!broadcast)
288 		dev->event_handler = tick_handle_periodic;
289 	else
290 		dev->event_handler = tick_handle_periodic_broadcast;
291 }
292 
293 /*
294  * Remove a CPU from broadcasting
295  */
296 void tick_shutdown_broadcast(unsigned int *cpup)
297 {
298 	struct clock_event_device *bc;
299 	unsigned long flags;
300 	unsigned int cpu = *cpup;
301 
302 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
303 
304 	bc = tick_broadcast_device.evtdev;
305 	cpumask_clear_cpu(cpu, tick_get_broadcast_mask());
306 
307 	if (tick_broadcast_device.mode == TICKDEV_MODE_PERIODIC) {
308 		if (bc && cpumask_empty(tick_get_broadcast_mask()))
309 			clockevents_shutdown(bc);
310 	}
311 
312 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
313 }
314 
315 void tick_suspend_broadcast(void)
316 {
317 	struct clock_event_device *bc;
318 	unsigned long flags;
319 
320 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
321 
322 	bc = tick_broadcast_device.evtdev;
323 	if (bc)
324 		clockevents_shutdown(bc);
325 
326 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
327 }
328 
329 int tick_resume_broadcast(void)
330 {
331 	struct clock_event_device *bc;
332 	unsigned long flags;
333 	int broadcast = 0;
334 
335 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
336 
337 	bc = tick_broadcast_device.evtdev;
338 
339 	if (bc) {
340 		clockevents_set_mode(bc, CLOCK_EVT_MODE_RESUME);
341 
342 		switch (tick_broadcast_device.mode) {
343 		case TICKDEV_MODE_PERIODIC:
344 			if (!cpumask_empty(tick_get_broadcast_mask()))
345 				tick_broadcast_start_periodic(bc);
346 			broadcast = cpumask_test_cpu(smp_processor_id(),
347 						     tick_get_broadcast_mask());
348 			break;
349 		case TICKDEV_MODE_ONESHOT:
350 			broadcast = tick_resume_broadcast_oneshot(bc);
351 			break;
352 		}
353 	}
354 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
355 
356 	return broadcast;
357 }
358 
359 
360 #ifdef CONFIG_TICK_ONESHOT
361 
362 /* FIXME: use cpumask_var_t. */
363 static DECLARE_BITMAP(tick_broadcast_oneshot_mask, NR_CPUS);
364 
365 /*
366  * Exposed for debugging: see timer_list.c
367  */
368 struct cpumask *tick_get_broadcast_oneshot_mask(void)
369 {
370 	return to_cpumask(tick_broadcast_oneshot_mask);
371 }
372 
373 static int tick_broadcast_set_event(ktime_t expires, int force)
374 {
375 	struct clock_event_device *bc = tick_broadcast_device.evtdev;
376 
377 	return tick_dev_program_event(bc, expires, force);
378 }
379 
380 int tick_resume_broadcast_oneshot(struct clock_event_device *bc)
381 {
382 	clockevents_set_mode(bc, CLOCK_EVT_MODE_ONESHOT);
383 	return 0;
384 }
385 
386 /*
387  * Called from irq_enter() when idle was interrupted to reenable the
388  * per cpu device.
389  */
390 void tick_check_oneshot_broadcast(int cpu)
391 {
392 	if (cpumask_test_cpu(cpu, to_cpumask(tick_broadcast_oneshot_mask))) {
393 		struct tick_device *td = &per_cpu(tick_cpu_device, cpu);
394 
395 		clockevents_set_mode(td->evtdev, CLOCK_EVT_MODE_ONESHOT);
396 	}
397 }
398 
399 /*
400  * Handle oneshot mode broadcasting
401  */
402 static void tick_handle_oneshot_broadcast(struct clock_event_device *dev)
403 {
404 	struct tick_device *td;
405 	ktime_t now, next_event;
406 	int cpu;
407 
408 	raw_spin_lock(&tick_broadcast_lock);
409 again:
410 	dev->next_event.tv64 = KTIME_MAX;
411 	next_event.tv64 = KTIME_MAX;
412 	cpumask_clear(to_cpumask(tmpmask));
413 	now = ktime_get();
414 	/* Find all expired events */
415 	for_each_cpu(cpu, tick_get_broadcast_oneshot_mask()) {
416 		td = &per_cpu(tick_cpu_device, cpu);
417 		if (td->evtdev->next_event.tv64 <= now.tv64)
418 			cpumask_set_cpu(cpu, to_cpumask(tmpmask));
419 		else if (td->evtdev->next_event.tv64 < next_event.tv64)
420 			next_event.tv64 = td->evtdev->next_event.tv64;
421 	}
422 
423 	/*
424 	 * Wakeup the cpus which have an expired event.
425 	 */
426 	tick_do_broadcast(to_cpumask(tmpmask));
427 
428 	/*
429 	 * Two reasons for reprogram:
430 	 *
431 	 * - The global event did not expire any CPU local
432 	 * events. This happens in dyntick mode, as the maximum PIT
433 	 * delta is quite small.
434 	 *
435 	 * - There are pending events on sleeping CPUs which were not
436 	 * in the event mask
437 	 */
438 	if (next_event.tv64 != KTIME_MAX) {
439 		/*
440 		 * Rearm the broadcast device. If event expired,
441 		 * repeat the above
442 		 */
443 		if (tick_broadcast_set_event(next_event, 0))
444 			goto again;
445 	}
446 	raw_spin_unlock(&tick_broadcast_lock);
447 }
448 
449 /*
450  * Powerstate information: The system enters/leaves a state, where
451  * affected devices might stop
452  */
453 void tick_broadcast_oneshot_control(unsigned long reason)
454 {
455 	struct clock_event_device *bc, *dev;
456 	struct tick_device *td;
457 	unsigned long flags;
458 	int cpu;
459 
460 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
461 
462 	/*
463 	 * Periodic mode does not care about the enter/exit of power
464 	 * states
465 	 */
466 	if (tick_broadcast_device.mode == TICKDEV_MODE_PERIODIC)
467 		goto out;
468 
469 	bc = tick_broadcast_device.evtdev;
470 	cpu = smp_processor_id();
471 	td = &per_cpu(tick_cpu_device, cpu);
472 	dev = td->evtdev;
473 
474 	if (!(dev->features & CLOCK_EVT_FEAT_C3STOP))
475 		goto out;
476 
477 	if (reason == CLOCK_EVT_NOTIFY_BROADCAST_ENTER) {
478 		if (!cpumask_test_cpu(cpu, tick_get_broadcast_oneshot_mask())) {
479 			cpumask_set_cpu(cpu, tick_get_broadcast_oneshot_mask());
480 			clockevents_set_mode(dev, CLOCK_EVT_MODE_SHUTDOWN);
481 			if (dev->next_event.tv64 < bc->next_event.tv64)
482 				tick_broadcast_set_event(dev->next_event, 1);
483 		}
484 	} else {
485 		if (cpumask_test_cpu(cpu, tick_get_broadcast_oneshot_mask())) {
486 			cpumask_clear_cpu(cpu,
487 					  tick_get_broadcast_oneshot_mask());
488 			clockevents_set_mode(dev, CLOCK_EVT_MODE_ONESHOT);
489 			if (dev->next_event.tv64 != KTIME_MAX)
490 				tick_program_event(dev->next_event, 1);
491 		}
492 	}
493 
494 out:
495 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
496 }
497 
498 /*
499  * Reset the one shot broadcast for a cpu
500  *
501  * Called with tick_broadcast_lock held
502  */
503 static void tick_broadcast_clear_oneshot(int cpu)
504 {
505 	cpumask_clear_cpu(cpu, tick_get_broadcast_oneshot_mask());
506 }
507 
508 static void tick_broadcast_init_next_event(struct cpumask *mask,
509 					   ktime_t expires)
510 {
511 	struct tick_device *td;
512 	int cpu;
513 
514 	for_each_cpu(cpu, mask) {
515 		td = &per_cpu(tick_cpu_device, cpu);
516 		if (td->evtdev)
517 			td->evtdev->next_event = expires;
518 	}
519 }
520 
521 /**
522  * tick_broadcast_setup_oneshot - setup the broadcast device
523  */
524 void tick_broadcast_setup_oneshot(struct clock_event_device *bc)
525 {
526 	/* Set it up only once ! */
527 	if (bc->event_handler != tick_handle_oneshot_broadcast) {
528 		int was_periodic = bc->mode == CLOCK_EVT_MODE_PERIODIC;
529 		int cpu = smp_processor_id();
530 
531 		bc->event_handler = tick_handle_oneshot_broadcast;
532 		clockevents_set_mode(bc, CLOCK_EVT_MODE_ONESHOT);
533 
534 		/* Take the do_timer update */
535 		tick_do_timer_cpu = cpu;
536 
537 		/*
538 		 * We must be careful here. There might be other CPUs
539 		 * waiting for periodic broadcast. We need to set the
540 		 * oneshot_mask bits for those and program the
541 		 * broadcast device to fire.
542 		 */
543 		cpumask_copy(to_cpumask(tmpmask), tick_get_broadcast_mask());
544 		cpumask_clear_cpu(cpu, to_cpumask(tmpmask));
545 		cpumask_or(tick_get_broadcast_oneshot_mask(),
546 			   tick_get_broadcast_oneshot_mask(),
547 			   to_cpumask(tmpmask));
548 
549 		if (was_periodic && !cpumask_empty(to_cpumask(tmpmask))) {
550 			tick_broadcast_init_next_event(to_cpumask(tmpmask),
551 						       tick_next_period);
552 			tick_broadcast_set_event(tick_next_period, 1);
553 		} else
554 			bc->next_event.tv64 = KTIME_MAX;
555 	}
556 }
557 
558 /*
559  * Select oneshot operating mode for the broadcast device
560  */
561 void tick_broadcast_switch_to_oneshot(void)
562 {
563 	struct clock_event_device *bc;
564 	unsigned long flags;
565 
566 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
567 
568 	tick_broadcast_device.mode = TICKDEV_MODE_ONESHOT;
569 	bc = tick_broadcast_device.evtdev;
570 	if (bc)
571 		tick_broadcast_setup_oneshot(bc);
572 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
573 }
574 
575 
576 /*
577  * Remove a dead CPU from broadcasting
578  */
579 void tick_shutdown_broadcast_oneshot(unsigned int *cpup)
580 {
581 	unsigned long flags;
582 	unsigned int cpu = *cpup;
583 
584 	raw_spin_lock_irqsave(&tick_broadcast_lock, flags);
585 
586 	/*
587 	 * Clear the broadcast mask flag for the dead cpu, but do not
588 	 * stop the broadcast device!
589 	 */
590 	cpumask_clear_cpu(cpu, tick_get_broadcast_oneshot_mask());
591 
592 	raw_spin_unlock_irqrestore(&tick_broadcast_lock, flags);
593 }
594 
595 /*
596  * Check, whether the broadcast device is in one shot mode
597  */
598 int tick_broadcast_oneshot_active(void)
599 {
600 	return tick_broadcast_device.mode == TICKDEV_MODE_ONESHOT;
601 }
602 
603 #endif
604