xref: /linux/drivers/xen/xenbus/xenbus_probe.c (revision a174910917a8e93cb5334e9dce8bac32bff22c47)
1 /******************************************************************************
2  * Talks to Xen Store to figure out what devices we have.
3  *
4  * Copyright (C) 2005 Rusty Russell, IBM Corporation
5  * Copyright (C) 2005 Mike Wray, Hewlett-Packard
6  * Copyright (C) 2005, 2006 XenSource Ltd
7  *
8  * This program is free software; you can redistribute it and/or
9  * modify it under the terms of the GNU General Public License version 2
10  * as published by the Free Software Foundation; or, when distributed
11  * separately from the Linux kernel or incorporated into other
12  * software packages, subject to the following license:
13  *
14  * Permission is hereby granted, free of charge, to any person obtaining a copy
15  * of this source file (the "Software"), to deal in the Software without
16  * restriction, including without limitation the rights to use, copy, modify,
17  * merge, publish, distribute, sublicense, and/or sell copies of the Software,
18  * and to permit persons to whom the Software is furnished to do so, subject to
19  * the following conditions:
20  *
21  * The above copyright notice and this permission notice shall be included in
22  * all copies or substantial portions of the Software.
23  *
24  * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
25  * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
26  * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
27  * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
28  * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
29  * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
30  * IN THE SOFTWARE.
31  */
32 
33 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
34 #define dev_fmt pr_fmt
35 
36 #define DPRINTK(fmt, args...)				\
37 	pr_debug("xenbus_probe (%s:%d) " fmt ".\n",	\
38 		 __func__, __LINE__, ##args)
39 
40 #include <linux/kernel.h>
41 #include <linux/err.h>
42 #include <linux/string.h>
43 #include <linux/ctype.h>
44 #include <linux/fcntl.h>
45 #include <linux/mm.h>
46 #include <linux/proc_fs.h>
47 #include <linux/notifier.h>
48 #include <linux/kthread.h>
49 #include <linux/mutex.h>
50 #include <linux/io.h>
51 #include <linux/slab.h>
52 #include <linux/module.h>
53 
54 #include <asm/page.h>
55 #include <asm/xen/hypervisor.h>
56 
57 #include <xen/xen.h>
58 #include <xen/xenbus.h>
59 #include <xen/events.h>
60 #include <xen/xen-ops.h>
61 #include <xen/page.h>
62 
63 #include <xen/hvm.h>
64 
65 #include "xenbus.h"
66 
67 
68 static int xs_init_irq = -1;
69 int xen_store_evtchn;
70 EXPORT_SYMBOL_GPL(xen_store_evtchn);
71 
72 struct xenstore_domain_interface *xen_store_interface;
73 EXPORT_SYMBOL_GPL(xen_store_interface);
74 
75 #define XS_INTERFACE_READY \
76 	((xen_store_interface != NULL) && \
77 	 (xen_store_interface->connection == XENSTORE_CONNECTED))
78 
79 enum xenstore_init xen_store_domain_type;
80 EXPORT_SYMBOL_GPL(xen_store_domain_type);
81 
82 static unsigned long xen_store_gfn;
83 
84 static BLOCKING_NOTIFIER_HEAD(xenstore_chain);
85 
86 /* If something in array of ids matches this device, return it. */
87 static const struct xenbus_device_id *
88 match_device(const struct xenbus_device_id *arr, struct xenbus_device *dev)
89 {
90 	for (; *arr->devicetype != '\0'; arr++) {
91 		if (!strcmp(arr->devicetype, dev->devicetype))
92 			return arr;
93 	}
94 	return NULL;
95 }
96 
97 int xenbus_match(struct device *_dev, const struct device_driver *_drv)
98 {
99 	const struct xenbus_driver *drv = to_xenbus_driver(_drv);
100 
101 	if (!drv->ids)
102 		return 0;
103 
104 	return match_device(drv->ids, to_xenbus_device(_dev)) != NULL;
105 }
106 EXPORT_SYMBOL_GPL(xenbus_match);
107 
108 
109 static void free_otherend_details(struct xenbus_device *dev)
110 {
111 	kfree(dev->otherend);
112 	dev->otherend = NULL;
113 }
114 
115 
116 static void free_otherend_watch(struct xenbus_device *dev)
117 {
118 	if (dev->otherend_watch.node) {
119 		unregister_xenbus_watch(&dev->otherend_watch);
120 		kfree(dev->otherend_watch.node);
121 		dev->otherend_watch.node = NULL;
122 	}
123 }
124 
125 
126 static int talk_to_otherend(struct xenbus_device *dev)
127 {
128 	struct xenbus_driver *drv = to_xenbus_driver(dev->dev.driver);
129 
130 	free_otherend_watch(dev);
131 	free_otherend_details(dev);
132 
133 	return drv->read_otherend_details(dev);
134 }
135 
136 
137 
138 static int watch_otherend(struct xenbus_device *dev)
139 {
140 	struct xen_bus_type *bus =
141 		container_of(dev->dev.bus, struct xen_bus_type, bus);
142 
143 	return xenbus_watch_pathfmt(dev, &dev->otherend_watch,
144 				    bus->otherend_will_handle,
145 				    bus->otherend_changed,
146 				    "%s/%s", dev->otherend, "state");
147 }
148 
149 
150 int xenbus_read_otherend_details(struct xenbus_device *xendev,
151 				 char *id_node, char *path_node)
152 {
153 	int err = xenbus_gather(XBT_NIL, xendev->nodename,
154 				id_node, "%i", &xendev->otherend_id,
155 				path_node, NULL, &xendev->otherend,
156 				NULL);
157 	if (err) {
158 		xenbus_dev_fatal(xendev, err,
159 				 "reading other end details from %s",
160 				 xendev->nodename);
161 		return err;
162 	}
163 	if (strlen(xendev->otherend) == 0 ||
164 	    !xenbus_exists(XBT_NIL, xendev->otherend, "")) {
165 		xenbus_dev_fatal(xendev, -ENOENT,
166 				 "unable to read other end from %s.  "
167 				 "missing or inaccessible.",
168 				 xendev->nodename);
169 		free_otherend_details(xendev);
170 		return -ENOENT;
171 	}
172 
173 	return 0;
174 }
175 EXPORT_SYMBOL_GPL(xenbus_read_otherend_details);
176 
177 void xenbus_otherend_changed(struct xenbus_watch *watch,
178 			     const char *path, const char *token,
179 			     int ignore_on_shutdown)
180 {
181 	struct xenbus_device *dev =
182 		container_of(watch, struct xenbus_device, otherend_watch);
183 	struct xenbus_driver *drv = to_xenbus_driver(dev->dev.driver);
184 	enum xenbus_state state;
185 
186 	/* Protect us against watches firing on old details when the otherend
187 	   details change, say immediately after a resume. */
188 	if (!dev->otherend ||
189 	    strncmp(dev->otherend, path, strlen(dev->otherend))) {
190 		dev_dbg(&dev->dev, "Ignoring watch at %s\n", path);
191 		return;
192 	}
193 
194 	state = xenbus_read_driver_state(dev, dev->otherend);
195 
196 	dev_dbg(&dev->dev, "state is %d, (%s), %s, %s\n",
197 		state, xenbus_strstate(state), dev->otherend_watch.node, path);
198 
199 	/*
200 	 * Ignore xenbus transitions during shutdown. This prevents us doing
201 	 * work that can fail e.g., when the rootfs is gone.
202 	 */
203 	if (system_state > SYSTEM_RUNNING) {
204 		if (ignore_on_shutdown && (state == XenbusStateClosing))
205 			xenbus_frontend_closed(dev);
206 		return;
207 	}
208 
209 	if (drv->otherend_changed)
210 		drv->otherend_changed(dev, state);
211 }
212 EXPORT_SYMBOL_GPL(xenbus_otherend_changed);
213 
214 #define XENBUS_SHOW_STAT(name)						\
215 static ssize_t name##_show(struct device *_dev,				\
216 			   struct device_attribute *attr,		\
217 			   char *buf)					\
218 {									\
219 	struct xenbus_device *dev = to_xenbus_device(_dev);		\
220 									\
221 	return sprintf(buf, "%d\n", atomic_read(&dev->name));		\
222 }									\
223 static DEVICE_ATTR_RO(name)
224 
225 XENBUS_SHOW_STAT(event_channels);
226 XENBUS_SHOW_STAT(events);
227 XENBUS_SHOW_STAT(spurious_events);
228 XENBUS_SHOW_STAT(jiffies_eoi_delayed);
229 
230 static ssize_t spurious_threshold_show(struct device *_dev,
231 				       struct device_attribute *attr,
232 				       char *buf)
233 {
234 	struct xenbus_device *dev = to_xenbus_device(_dev);
235 
236 	return sprintf(buf, "%d\n", dev->spurious_threshold);
237 }
238 
239 static ssize_t spurious_threshold_store(struct device *_dev,
240 					struct device_attribute *attr,
241 					const char *buf, size_t count)
242 {
243 	struct xenbus_device *dev = to_xenbus_device(_dev);
244 	unsigned int val;
245 	ssize_t ret;
246 
247 	ret = kstrtouint(buf, 0, &val);
248 	if (ret)
249 		return ret;
250 
251 	dev->spurious_threshold = val;
252 
253 	return count;
254 }
255 
256 static DEVICE_ATTR_RW(spurious_threshold);
257 
258 static struct attribute *xenbus_attrs[] = {
259 	&dev_attr_event_channels.attr,
260 	&dev_attr_events.attr,
261 	&dev_attr_spurious_events.attr,
262 	&dev_attr_jiffies_eoi_delayed.attr,
263 	&dev_attr_spurious_threshold.attr,
264 	NULL
265 };
266 
267 static const struct attribute_group xenbus_group = {
268 	.name = "xenbus",
269 	.attrs = xenbus_attrs,
270 };
271 
272 int xenbus_dev_probe(struct device *_dev)
273 {
274 	struct xenbus_device *dev = to_xenbus_device(_dev);
275 	struct xenbus_driver *drv = to_xenbus_driver(_dev->driver);
276 	const struct xenbus_device_id *id;
277 	int err;
278 
279 	DPRINTK("%s", dev->nodename);
280 
281 	if (!drv->probe) {
282 		err = -ENODEV;
283 		goto fail;
284 	}
285 
286 	id = match_device(drv->ids, dev);
287 	if (!id) {
288 		err = -ENODEV;
289 		goto fail;
290 	}
291 
292 	err = talk_to_otherend(dev);
293 	if (err) {
294 		dev_warn(&dev->dev, "talk_to_otherend on %s failed.\n",
295 			 dev->nodename);
296 		return err;
297 	}
298 
299 	if (!try_module_get(drv->driver.owner)) {
300 		dev_warn(&dev->dev, "failed to acquire module reference on '%s'\n",
301 			 drv->driver.name);
302 		err = -ESRCH;
303 		goto fail;
304 	}
305 
306 	down(&dev->reclaim_sem);
307 	err = drv->probe(dev, id);
308 	up(&dev->reclaim_sem);
309 	if (err)
310 		goto fail_put;
311 
312 	err = watch_otherend(dev);
313 	if (err) {
314 		dev_warn(&dev->dev, "watch_otherend on %s failed.\n",
315 		       dev->nodename);
316 		goto fail_remove;
317 	}
318 
319 	dev->spurious_threshold = 1;
320 	if (sysfs_create_group(&dev->dev.kobj, &xenbus_group))
321 		dev_warn(&dev->dev, "sysfs_create_group on %s failed.\n",
322 			 dev->nodename);
323 
324 	return 0;
325 fail_remove:
326 	if (drv->remove) {
327 		down(&dev->reclaim_sem);
328 		drv->remove(dev);
329 		up(&dev->reclaim_sem);
330 	}
331 fail_put:
332 	module_put(drv->driver.owner);
333 fail:
334 	xenbus_dev_error(dev, err, "xenbus_dev_probe on %s", dev->nodename);
335 	return err;
336 }
337 EXPORT_SYMBOL_GPL(xenbus_dev_probe);
338 
339 void xenbus_dev_remove(struct device *_dev)
340 {
341 	struct xenbus_device *dev = to_xenbus_device(_dev);
342 	struct xenbus_driver *drv = to_xenbus_driver(_dev->driver);
343 
344 	DPRINTK("%s", dev->nodename);
345 
346 	sysfs_remove_group(&dev->dev.kobj, &xenbus_group);
347 
348 	free_otherend_watch(dev);
349 
350 	if (drv->remove) {
351 		down(&dev->reclaim_sem);
352 		drv->remove(dev);
353 		up(&dev->reclaim_sem);
354 	}
355 
356 	module_put(drv->driver.owner);
357 
358 	free_otherend_details(dev);
359 
360 	/*
361 	 * If the toolstack has forced the device state to closing then set
362 	 * the state to closed now to allow it to be cleaned up.
363 	 * Similarly, if the driver does not support re-bind, set the
364 	 * closed.
365 	 */
366 	if (!drv->allow_rebind ||
367 	    xenbus_read_driver_state(dev, dev->nodename) == XenbusStateClosing)
368 		xenbus_switch_state(dev, XenbusStateClosed);
369 }
370 EXPORT_SYMBOL_GPL(xenbus_dev_remove);
371 
372 int xenbus_register_driver_common(struct xenbus_driver *drv,
373 				  struct xen_bus_type *bus,
374 				  struct module *owner, const char *mod_name)
375 {
376 	drv->driver.name = drv->name ? drv->name : drv->ids[0].devicetype;
377 	drv->driver.bus = &bus->bus;
378 	drv->driver.owner = owner;
379 	drv->driver.mod_name = mod_name;
380 
381 	return driver_register(&drv->driver);
382 }
383 EXPORT_SYMBOL_GPL(xenbus_register_driver_common);
384 
385 void xenbus_unregister_driver(struct xenbus_driver *drv)
386 {
387 	driver_unregister(&drv->driver);
388 }
389 EXPORT_SYMBOL_GPL(xenbus_unregister_driver);
390 
391 struct xb_find_info {
392 	struct xenbus_device *dev;
393 	const char *nodename;
394 };
395 
396 static int cmp_dev(struct device *dev, void *data)
397 {
398 	struct xenbus_device *xendev = to_xenbus_device(dev);
399 	struct xb_find_info *info = data;
400 
401 	if (!strcmp(xendev->nodename, info->nodename)) {
402 		info->dev = xendev;
403 		get_device(dev);
404 		return 1;
405 	}
406 	return 0;
407 }
408 
409 static struct xenbus_device *xenbus_device_find(const char *nodename,
410 						struct bus_type *bus)
411 {
412 	struct xb_find_info info = { .dev = NULL, .nodename = nodename };
413 
414 	bus_for_each_dev(bus, NULL, &info, cmp_dev);
415 	return info.dev;
416 }
417 
418 static int cleanup_dev(struct device *dev, void *data)
419 {
420 	struct xenbus_device *xendev = to_xenbus_device(dev);
421 	struct xb_find_info *info = data;
422 	int len = strlen(info->nodename);
423 
424 	DPRINTK("%s", info->nodename);
425 
426 	/* Match the info->nodename path, or any subdirectory of that path. */
427 	if (strncmp(xendev->nodename, info->nodename, len))
428 		return 0;
429 
430 	/* If the node name is longer, ensure it really is a subdirectory. */
431 	if ((strlen(xendev->nodename) > len) && (xendev->nodename[len] != '/'))
432 		return 0;
433 
434 	info->dev = xendev;
435 	get_device(dev);
436 	return 1;
437 }
438 
439 static void xenbus_cleanup_devices(const char *path, struct bus_type *bus)
440 {
441 	struct xb_find_info info = { .nodename = path };
442 
443 	do {
444 		info.dev = NULL;
445 		bus_for_each_dev(bus, NULL, &info, cleanup_dev);
446 		if (info.dev) {
447 			dev_warn(&info.dev->dev,
448 				 "device forcefully removed from xenstore\n");
449 			info.dev->vanished = true;
450 			device_unregister(&info.dev->dev);
451 			put_device(&info.dev->dev);
452 		}
453 	} while (info.dev);
454 }
455 
456 static void xenbus_dev_release(struct device *dev)
457 {
458 	if (dev)
459 		kfree(to_xenbus_device(dev));
460 }
461 
462 static ssize_t nodename_show(struct device *dev,
463 			     struct device_attribute *attr, char *buf)
464 {
465 	return sprintf(buf, "%s\n", to_xenbus_device(dev)->nodename);
466 }
467 static DEVICE_ATTR_RO(nodename);
468 
469 static ssize_t devtype_show(struct device *dev,
470 			    struct device_attribute *attr, char *buf)
471 {
472 	return sprintf(buf, "%s\n", to_xenbus_device(dev)->devicetype);
473 }
474 static DEVICE_ATTR_RO(devtype);
475 
476 static ssize_t modalias_show(struct device *dev,
477 			     struct device_attribute *attr, char *buf)
478 {
479 	return sprintf(buf, "%s:%s\n", dev->bus->name,
480 		       to_xenbus_device(dev)->devicetype);
481 }
482 static DEVICE_ATTR_RO(modalias);
483 
484 static ssize_t state_show(struct device *dev,
485 			    struct device_attribute *attr, char *buf)
486 {
487 	return sprintf(buf, "%s\n",
488 			xenbus_strstate(to_xenbus_device(dev)->state));
489 }
490 static DEVICE_ATTR_RO(state);
491 
492 static struct attribute *xenbus_dev_attrs[] = {
493 	&dev_attr_nodename.attr,
494 	&dev_attr_devtype.attr,
495 	&dev_attr_modalias.attr,
496 	&dev_attr_state.attr,
497 	NULL,
498 };
499 
500 static const struct attribute_group xenbus_dev_group = {
501 	.attrs = xenbus_dev_attrs,
502 };
503 
504 const struct attribute_group *xenbus_dev_groups[] = {
505 	&xenbus_dev_group,
506 	NULL,
507 };
508 EXPORT_SYMBOL_GPL(xenbus_dev_groups);
509 
510 int xenbus_probe_node(struct xen_bus_type *bus,
511 		      const char *type,
512 		      const char *nodename)
513 {
514 	char devname[XEN_BUS_ID_SIZE];
515 	int err;
516 	struct xenbus_device *xendev;
517 	size_t name_len, type_len;
518 	char *tmpstring;
519 
520 	enum xenbus_state state = xenbus_read_driver_state(NULL, nodename);
521 
522 	if (state != XenbusStateInitialising) {
523 		/* Device is not new, so ignore it.  This can happen if a
524 		   device is going away after switching to Closed.  */
525 		return 0;
526 	}
527 
528 	name_len = strlen(nodename);
529 	type_len = strlen(type);
530 	xendev = kzalloc(sizeof(*xendev) + name_len + 1 + type_len + 1, GFP_KERNEL);
531 	if (!xendev)
532 		return -ENOMEM;
533 
534 	xendev->state = XenbusStateInitialising;
535 
536 	/* Copy the strings into the extra space. */
537 
538 	tmpstring = (char *)(xendev + 1);
539 	memcpy(tmpstring, nodename, name_len);
540 	xendev->nodename = tmpstring;
541 
542 	tmpstring += name_len + 1;
543 	memcpy(tmpstring, type, type_len);
544 	xendev->devicetype = tmpstring;
545 	init_completion(&xendev->down);
546 
547 	xendev->dev.bus = &bus->bus;
548 	xendev->dev.release = xenbus_dev_release;
549 
550 	err = bus->get_bus_id(devname, xendev->nodename);
551 	if (err)
552 		goto fail;
553 
554 	dev_set_name(&xendev->dev, "%s", devname);
555 	sema_init(&xendev->reclaim_sem, 1);
556 
557 	/* Register with generic device framework. */
558 	err = device_register(&xendev->dev);
559 	if (err) {
560 		put_device(&xendev->dev);
561 		xendev = NULL;
562 		goto fail;
563 	}
564 
565 	return 0;
566 fail:
567 	kfree(xendev);
568 	return err;
569 }
570 EXPORT_SYMBOL_GPL(xenbus_probe_node);
571 
572 static int xenbus_probe_device_type(struct xen_bus_type *bus, const char *type)
573 {
574 	int err = 0;
575 	char **dir;
576 	unsigned int dir_n = 0;
577 	int i;
578 
579 	dir = xenbus_directory(XBT_NIL, bus->root, type, &dir_n);
580 	if (IS_ERR(dir))
581 		return PTR_ERR(dir);
582 
583 	for (i = 0; i < dir_n; i++) {
584 		err = bus->probe(bus, type, dir[i]);
585 		if (err)
586 			break;
587 	}
588 
589 	kfree(dir);
590 	return err;
591 }
592 
593 int xenbus_probe_devices(struct xen_bus_type *bus)
594 {
595 	int err = 0;
596 	char **dir;
597 	unsigned int i, dir_n;
598 
599 	dir = xenbus_directory(XBT_NIL, bus->root, "", &dir_n);
600 	if (IS_ERR(dir))
601 		return PTR_ERR(dir);
602 
603 	for (i = 0; i < dir_n; i++) {
604 		err = xenbus_probe_device_type(bus, dir[i]);
605 		if (err)
606 			break;
607 	}
608 
609 	kfree(dir);
610 	return err;
611 }
612 EXPORT_SYMBOL_GPL(xenbus_probe_devices);
613 
614 static unsigned int char_count(const char *str, char c)
615 {
616 	unsigned int i, ret = 0;
617 
618 	for (i = 0; str[i]; i++)
619 		if (str[i] == c)
620 			ret++;
621 	return ret;
622 }
623 
624 static int strsep_len(const char *str, char c, unsigned int len)
625 {
626 	unsigned int i;
627 
628 	for (i = 0; str[i]; i++)
629 		if (str[i] == c) {
630 			if (len == 0)
631 				return i;
632 			len--;
633 		}
634 	return (len == 0) ? i : -ERANGE;
635 }
636 
637 void xenbus_dev_changed(const char *node, struct xen_bus_type *bus)
638 {
639 	int exists, rootlen;
640 	struct xenbus_device *dev;
641 	char type[XEN_BUS_ID_SIZE];
642 	const char *p, *root;
643 
644 	if (char_count(node, '/') < 2)
645 		return;
646 
647 	exists = xenbus_exists(XBT_NIL, node, "");
648 	if (!exists) {
649 		xenbus_cleanup_devices(node, &bus->bus);
650 		return;
651 	}
652 
653 	/* backend/<type>/... or device/<type>/... */
654 	p = strchr(node, '/') + 1;
655 	snprintf(type, XEN_BUS_ID_SIZE, "%.*s", (int)strcspn(p, "/"), p);
656 	type[XEN_BUS_ID_SIZE-1] = '\0';
657 
658 	rootlen = strsep_len(node, '/', bus->levels);
659 	if (rootlen < 0)
660 		return;
661 	root = kasprintf(GFP_KERNEL, "%.*s", rootlen, node);
662 	if (!root)
663 		return;
664 
665 	dev = xenbus_device_find(root, &bus->bus);
666 	/*
667 	 * Backend domain crash results in not coordinated frontend removal,
668 	 * without going through XenbusStateClosing. If this is a new instance
669 	 * of the same device Xen tools will have reset the state to
670 	 * XenbusStateInitializing.
671 	 * It might be that the backend crashed early during the init phase of
672 	 * device setup, in which case the known state would have been
673 	 * XenbusStateInitializing. So test the backend domid to match the
674 	 * saved one. In case the new backend happens to have the same domid as
675 	 * the old one, we can just carry on, as there is no inconsistency
676 	 * resulting in this case.
677 	 */
678 	if (dev && !strcmp(bus->root, "device")) {
679 		enum xenbus_state state = xenbus_read_driver_state(dev, dev->nodename);
680 		unsigned int backend = xenbus_read_unsigned(root, "backend-id",
681 							    dev->otherend_id);
682 
683 		if (state == XenbusStateInitialising &&
684 		    (state != dev->state || backend != dev->otherend_id)) {
685 			/*
686 			 * State has been reset, assume the old one vanished
687 			 * and new one needs to be probed.
688 			 */
689 			dev_warn(&dev->dev,
690 				 "state reset occurred, reconnecting\n");
691 			dev->vanished = true;
692 		}
693 		if (dev->vanished) {
694 			device_unregister(&dev->dev);
695 			put_device(&dev->dev);
696 			dev = NULL;
697 		}
698 	}
699 	if (!dev)
700 		xenbus_probe_node(bus, type, root);
701 	else
702 		put_device(&dev->dev);
703 
704 	kfree(root);
705 }
706 EXPORT_SYMBOL_GPL(xenbus_dev_changed);
707 
708 int xenbus_dev_freeze(struct device *dev)
709 {
710 	int err = 0;
711 	struct xenbus_driver *drv;
712 	struct xenbus_device *xdev
713 		= container_of(dev, struct xenbus_device, dev);
714 
715 	DPRINTK("%s", xdev->nodename);
716 
717 	if (dev->driver == NULL)
718 		return 0;
719 	drv = to_xenbus_driver(dev->driver);
720 	if (drv->suspend)
721 		err = drv->suspend(xdev);
722 	if (err)
723 		dev_warn(dev, "freeze failed: %i\n", err);
724 	return 0;
725 }
726 EXPORT_SYMBOL_GPL(xenbus_dev_freeze);
727 
728 int xenbus_dev_restore(struct device *dev)
729 {
730 	int err;
731 	struct xenbus_driver *drv;
732 	struct xenbus_device *xdev
733 		= container_of(dev, struct xenbus_device, dev);
734 
735 	DPRINTK("%s", xdev->nodename);
736 
737 	if (dev->driver == NULL)
738 		return 0;
739 	drv = to_xenbus_driver(dev->driver);
740 	err = talk_to_otherend(xdev);
741 	if (err) {
742 		dev_warn(dev, "restore (talk_to_otherend) failed: %i\n", err);
743 		return err;
744 	}
745 
746 	xdev->state = XenbusStateInitialising;
747 
748 	if (drv->resume) {
749 		err = drv->resume(xdev);
750 		if (err) {
751 			dev_warn(dev, "restore failed: %i\n", err);
752 			return err;
753 		}
754 	}
755 
756 	err = watch_otherend(xdev);
757 	if (err) {
758 		dev_warn(dev, "restore (watch_otherend) failed: %d\n", err);
759 		return err;
760 	}
761 
762 	return 0;
763 }
764 EXPORT_SYMBOL_GPL(xenbus_dev_restore);
765 
766 int xenbus_dev_thaw(struct device *dev)
767 {
768 	/* Do nothing */
769 	DPRINTK("thaw");
770 	return 0;
771 }
772 EXPORT_SYMBOL_GPL(xenbus_dev_thaw);
773 
774 /* A flag to determine if xenstored is 'ready' (i.e. has started) */
775 int xenstored_ready;
776 
777 
778 int register_xenstore_notifier(struct notifier_block *nb)
779 {
780 	int ret = 0;
781 
782 	if (xenstored_ready > 0)
783 		ret = nb->notifier_call(nb, 0, NULL);
784 	else
785 		blocking_notifier_chain_register(&xenstore_chain, nb);
786 
787 	return ret;
788 }
789 EXPORT_SYMBOL_GPL(register_xenstore_notifier);
790 
791 void unregister_xenstore_notifier(struct notifier_block *nb)
792 {
793 	blocking_notifier_chain_unregister(&xenstore_chain, nb);
794 }
795 EXPORT_SYMBOL_GPL(unregister_xenstore_notifier);
796 
797 static void xenbus_probe(void)
798 {
799 	xenstored_ready = 1;
800 
801 	if (!xen_store_interface)
802 		xen_store_interface = memremap(xen_store_gfn << XEN_PAGE_SHIFT,
803 					       XEN_PAGE_SIZE, MEMREMAP_WB);
804 	/*
805 	 * Now it is safe to free the IRQ used for xenstore late
806 	 * initialization. No need to unbind: it is about to be
807 	 * bound again from xb_init_comms. Note that calling
808 	 * unbind_from_irqhandler now would result in xen_evtchn_close()
809 	 * being called and the event channel not being enabled again
810 	 * afterwards, resulting in missed event notifications.
811 	 */
812 	if (xs_init_irq >= 0)
813 		free_irq(xs_init_irq, &xb_waitq);
814 
815 	/*
816 	 * In the HVM case, xenbus_init() deferred its call to
817 	 * xs_init() in case callbacks were not operational yet.
818 	 * So do it now.
819 	 */
820 	if (xen_store_domain_type == XS_HVM)
821 		xs_init();
822 
823 	/* Notify others that xenstore is up */
824 	blocking_notifier_call_chain(&xenstore_chain, 0, NULL);
825 }
826 
827 /*
828  * Returns true when XenStore init must be deferred in order to
829  * allow the PCI platform device to be initialised, before we
830  * can actually have event channel interrupts working.
831  */
832 static bool xs_hvm_defer_init_for_callback(void)
833 {
834 #ifdef CONFIG_XEN_PVHVM
835 	return xen_store_domain_type == XS_HVM &&
836 		!xen_have_vector_callback;
837 #else
838 	return false;
839 #endif
840 }
841 
842 static int xenbus_probe_thread(void *unused)
843 {
844 	DEFINE_WAIT(w);
845 
846 	/*
847 	 * We actually just want to wait for *any* trigger of xb_waitq,
848 	 * and run xenbus_probe() the moment it occurs.
849 	 */
850 	prepare_to_wait(&xb_waitq, &w, TASK_INTERRUPTIBLE);
851 	schedule();
852 	finish_wait(&xb_waitq, &w);
853 
854 	DPRINTK("probing");
855 	xenbus_probe();
856 	return 0;
857 }
858 
859 static int __init xenbus_probe_initcall(void)
860 {
861 	if (!xen_domain())
862 		return -ENODEV;
863 
864 	/*
865 	 * Probe XenBus here in the XS_PV case, and also XS_HVM unless we
866 	 * need to wait for the platform PCI device to come up or
867 	 * xen_store_interface is not ready.
868 	 */
869 	if (xen_store_domain_type == XS_PV ||
870 	    (xen_store_domain_type == XS_HVM &&
871 	     !xs_hvm_defer_init_for_callback() &&
872 	     XS_INTERFACE_READY))
873 		xenbus_probe();
874 
875 	/*
876 	 * For XS_LOCAL or when xen_store_interface is not ready, spawn a
877 	 * thread which will wait for xenstored or a xenstore-stubdom to be
878 	 * started, then probe.  It will be triggered when communication
879 	 * starts happening, by waiting on xb_waitq.
880 	 */
881 	if (xen_store_domain_type == XS_LOCAL || !XS_INTERFACE_READY) {
882 		struct task_struct *probe_task;
883 
884 		probe_task = kthread_run(xenbus_probe_thread, NULL,
885 					 "xenbus_probe");
886 		if (IS_ERR(probe_task))
887 			return PTR_ERR(probe_task);
888 	}
889 	return 0;
890 }
891 device_initcall(xenbus_probe_initcall);
892 
893 int xen_set_callback_via(uint64_t via)
894 {
895 	struct xen_hvm_param a;
896 	int ret;
897 
898 	a.domid = DOMID_SELF;
899 	a.index = HVM_PARAM_CALLBACK_IRQ;
900 	a.value = via;
901 
902 	ret = HYPERVISOR_hvm_op(HVMOP_set_param, &a);
903 	if (ret)
904 		return ret;
905 
906 	/*
907 	 * If xenbus_probe_initcall() deferred the xenbus_probe()
908 	 * due to the callback not functioning yet, we can do it now.
909 	 */
910 	if (!xenstored_ready && xs_hvm_defer_init_for_callback())
911 		xenbus_probe();
912 
913 	return ret;
914 }
915 EXPORT_SYMBOL_GPL(xen_set_callback_via);
916 
917 /* Set up event channel for xenstored which is run as a local process
918  * (this is normally used only in dom0)
919  */
920 static int __init xenstored_local_init(void)
921 {
922 	int err = -ENOMEM;
923 	unsigned long page = 0;
924 	struct evtchn_alloc_unbound alloc_unbound;
925 
926 	/* Allocate Xenstore page */
927 	page = get_zeroed_page(GFP_KERNEL);
928 	if (!page)
929 		goto out_err;
930 
931 	xen_store_gfn = virt_to_gfn((void *)page);
932 
933 	/* Next allocate a local port which xenstored can bind to */
934 	alloc_unbound.dom        = DOMID_SELF;
935 	alloc_unbound.remote_dom = DOMID_SELF;
936 
937 	err = HYPERVISOR_event_channel_op(EVTCHNOP_alloc_unbound,
938 					  &alloc_unbound);
939 	if (err == -ENOSYS)
940 		goto out_err;
941 
942 	BUG_ON(err);
943 	xen_store_evtchn = alloc_unbound.port;
944 
945 	return 0;
946 
947  out_err:
948 	if (page != 0)
949 		free_page(page);
950 	return err;
951 }
952 
953 static int xenbus_resume_cb(struct notifier_block *nb,
954 			    unsigned long action, void *data)
955 {
956 	int err = 0;
957 
958 	if (xen_hvm_domain()) {
959 		uint64_t v = 0;
960 
961 		err = hvm_get_parameter(HVM_PARAM_STORE_EVTCHN, &v);
962 		if (!err && v)
963 			xen_store_evtchn = v;
964 		else
965 			pr_warn("Cannot update xenstore event channel: %d\n",
966 				err);
967 	} else
968 		xen_store_evtchn = xen_start_info->store_evtchn;
969 
970 	return err;
971 }
972 
973 static struct notifier_block xenbus_resume_nb = {
974 	.notifier_call = xenbus_resume_cb,
975 };
976 
977 static irqreturn_t xenbus_late_init(int irq, void *unused)
978 {
979 	int err;
980 	uint64_t v = 0;
981 
982 	err = hvm_get_parameter(HVM_PARAM_STORE_PFN, &v);
983 	if (err || !v || !~v)
984 		return IRQ_HANDLED;
985 	xen_store_gfn = (unsigned long)v;
986 
987 	wake_up(&xb_waitq);
988 	return IRQ_HANDLED;
989 }
990 
991 static int __init xenbus_init(void)
992 {
993 	int err;
994 	uint64_t v = 0;
995 	bool wait = false;
996 	xen_store_domain_type = XS_UNKNOWN;
997 
998 	if (!xen_domain())
999 		return -ENODEV;
1000 
1001 	xenbus_ring_ops_init();
1002 
1003 	if (xen_pv_domain())
1004 		xen_store_domain_type = XS_PV;
1005 	if (xen_hvm_domain())
1006 	{
1007 		xen_store_domain_type = XS_HVM;
1008 		err = hvm_get_parameter(HVM_PARAM_STORE_EVTCHN, &v);
1009 		if (err)
1010 			goto out_error;
1011 		xen_store_evtchn = (int)v;
1012 		if (!v && xen_initial_domain())
1013 			xen_store_domain_type = XS_LOCAL;
1014 	}
1015 	if (xen_pv_domain() && !xen_start_info->store_evtchn)
1016 		xen_store_domain_type = XS_LOCAL;
1017 	if (xen_pv_domain() && xen_start_info->store_evtchn)
1018 		xenstored_ready = 1;
1019 
1020 	switch (xen_store_domain_type) {
1021 	case XS_LOCAL:
1022 		err = xenstored_local_init();
1023 		if (err)
1024 			goto out_error;
1025 		xen_store_interface = gfn_to_virt(xen_store_gfn);
1026 		break;
1027 	case XS_PV:
1028 		xen_store_evtchn = xen_start_info->store_evtchn;
1029 		xen_store_gfn = xen_start_info->store_mfn;
1030 		xen_store_interface = gfn_to_virt(xen_store_gfn);
1031 		break;
1032 	case XS_HVM:
1033 		err = hvm_get_parameter(HVM_PARAM_STORE_PFN, &v);
1034 		if (err)
1035 			goto out_error;
1036 		/*
1037 		 * Uninitialized hvm_params are zero and return no error.
1038 		 * Although it is theoretically possible to have
1039 		 * HVM_PARAM_STORE_PFN set to zero on purpose, in reality it is
1040 		 * not zero when valid. If zero, it means that Xenstore hasn't
1041 		 * been properly initialized. Instead of attempting to map a
1042 		 * wrong guest physical address return error.
1043 		 *
1044 		 * Also recognize all bits set as an invalid/uninitialized value.
1045 		 */
1046 		if (!v) {
1047 			err = -ENOENT;
1048 			goto out_error;
1049 		}
1050 		if (v == ~0ULL) {
1051 			wait = true;
1052 		} else {
1053 			/* Avoid truncation on 32-bit. */
1054 #if BITS_PER_LONG == 32
1055 			if (v > ULONG_MAX) {
1056 				pr_err("%s: cannot handle HVM_PARAM_STORE_PFN=%llx > ULONG_MAX\n",
1057 				       __func__, v);
1058 				err = -EINVAL;
1059 				goto out_error;
1060 			}
1061 #endif
1062 			xen_store_gfn = (unsigned long)v;
1063 			xen_store_interface =
1064 				memremap(xen_store_gfn << XEN_PAGE_SHIFT,
1065 					 XEN_PAGE_SIZE, MEMREMAP_WB);
1066 			if (!xen_store_interface) {
1067 				pr_err("%s: cannot map HVM_PARAM_STORE_PFN=%llx\n",
1068 				       __func__, v);
1069 				err = -EINVAL;
1070 				goto out_error;
1071 			}
1072 			if (xen_store_interface->connection != XENSTORE_CONNECTED)
1073 				wait = true;
1074 		}
1075 		if (wait) {
1076 			err = bind_evtchn_to_irqhandler(xen_store_evtchn,
1077 							xenbus_late_init,
1078 							0, "xenstore_late_init",
1079 							&xb_waitq);
1080 			if (err < 0) {
1081 				pr_err("xenstore_late_init couldn't bind irq err=%d\n",
1082 				       err);
1083 				goto out_error;
1084 			}
1085 
1086 			xs_init_irq = err;
1087 		}
1088 		break;
1089 	default:
1090 		pr_warn("Xenstore state unknown\n");
1091 		break;
1092 	}
1093 
1094 	/*
1095 	 * HVM domains may not have a functional callback yet. In that
1096 	 * case let xs_init() be called from xenbus_probe(), which will
1097 	 * get invoked at an appropriate time.
1098 	 */
1099 	if (xen_store_domain_type != XS_HVM) {
1100 		err = xs_init();
1101 		if (err) {
1102 			pr_warn("Error initializing xenstore comms: %i\n", err);
1103 			goto out_error;
1104 		}
1105 	}
1106 
1107 	if ((xen_store_domain_type != XS_LOCAL) &&
1108 	    (xen_store_domain_type != XS_UNKNOWN))
1109 		xen_resume_notifier_register(&xenbus_resume_nb);
1110 
1111 #ifdef CONFIG_XEN_COMPAT_XENFS
1112 	/*
1113 	 * Create xenfs mountpoint in /proc for compatibility with
1114 	 * utilities that expect to find "xenbus" under "/proc/xen".
1115 	 */
1116 	proc_create_mount_point("xen");
1117 #endif
1118 	return 0;
1119 
1120 out_error:
1121 	xen_store_domain_type = XS_UNKNOWN;
1122 	return err;
1123 }
1124 
1125 postcore_initcall(xenbus_init);
1126 
1127 MODULE_LICENSE("GPL");
1128