xref: /linux/net/9p/trans_virtio.c (revision bba2c3615bd6cfee7456d1130f2e6b01b3f4e9ba)
1 // SPDX-License-Identifier: GPL-2.0-only
2 /*
3  * The Virtio 9p transport driver
4  *
5  * This is a block based transport driver based on the lguest block driver
6  * code.
7  *
8  *  Copyright (C) 2007, 2008 Eric Van Hensbergen, IBM Corporation
9  *
10  *  Based on virtio console driver
11  *  Copyright (C) 2006, 2007 Rusty Russell, IBM Corporation
12  */
13 
14 #define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
15 
16 #include <linux/in.h>
17 #include <linux/module.h>
18 #include <linux/net.h>
19 #include <linux/ipv6.h>
20 #include <linux/errno.h>
21 #include <linux/kernel.h>
22 #include <linux/un.h>
23 #include <linux/uaccess.h>
24 #include <linux/inet.h>
25 #include <linux/file.h>
26 #include <linux/highmem.h>
27 #include <linux/slab.h>
28 #include <net/9p/9p.h>
29 #include <linux/fs_context.h>
30 #include <net/9p/client.h>
31 #include <net/9p/transport.h>
32 #include <linux/scatterlist.h>
33 #include <linux/swap.h>
34 #include <linux/virtio.h>
35 #include <linux/virtio_9p.h>
36 #include "trans_common.h"
37 
38 #define VIRTQUEUE_NUM	128
39 
40 /* a single mutex to manage channel initialization and attachment */
41 static DEFINE_MUTEX(virtio_9p_lock);
42 static DECLARE_WAIT_QUEUE_HEAD(vp_wq);
43 static atomic_t vp_pinned = ATOMIC_INIT(0);
44 
45 /**
46  * struct virtio_chan - per-instance transport information
47  * @inuse: whether the channel is in use
48  * @lock: protects multiple elements within this structure
49  * @client: client instance
50  * @vdev: virtio dev associated with this channel
51  * @vq: virtio queue associated with this channel
52  * @ring_bufs_avail: flag to indicate there is some available in the ring buf
53  * @vc_wq: wait queue for waiting for thing to be added to ring buf
54  * @p9_max_pages: maximum number of pinned pages
55  * @sg: scatter gather list which is used to pack a request (protected?)
56  * @chan_list: linked list of channels
57  *
58  * We keep all per-channel information in a structure.
59  * This structure is allocated within the devices dev->mem space.
60  * A pointer to the structure will get put in the transport private.
61  *
62  */
63 
64 struct virtio_chan {
65 	bool inuse;
66 
67 	spinlock_t lock;
68 
69 	struct p9_client *client;
70 	struct virtio_device *vdev;
71 	struct virtqueue *vq;
72 	int ring_bufs_avail;
73 	wait_queue_head_t *vc_wq;
74 	/* This is global limit. Since we don't have a global structure,
75 	 * will be placing it in each channel.
76 	 */
77 	unsigned long p9_max_pages;
78 	/* Scatterlist: can be too big for stack. */
79 	struct scatterlist sg[VIRTQUEUE_NUM];
80 	/**
81 	 * @tag: name to identify a mount null terminated
82 	 */
83 	char *tag;
84 
85 	struct list_head chan_list;
86 };
87 
88 static struct list_head virtio_chan_list;
89 
90 /* How many bytes left in this page. */
91 static unsigned int rest_of_page(void *data)
92 {
93 	return PAGE_SIZE - offset_in_page(data);
94 }
95 
96 /**
97  * p9_virtio_close - reclaim resources of a channel
98  * @client: client instance
99  *
100  * This reclaims a channel by freeing its resources and
101  * resetting its inuse flag.
102  *
103  */
104 
105 static void p9_virtio_close(struct p9_client *client)
106 {
107 	struct virtio_chan *chan = client->trans;
108 
109 	mutex_lock(&virtio_9p_lock);
110 	if (chan)
111 		chan->inuse = false;
112 	mutex_unlock(&virtio_9p_lock);
113 }
114 
115 /**
116  * req_done - callback which signals activity from the server
117  * @vq: virtio queue activity was received on
118  *
119  * This notifies us that the server has triggered some activity
120  * on the virtio channel - most likely a response to request we
121  * sent.  Figure out which requests now have responses and wake up
122  * those threads.
123  *
124  * Bugs: could do with some additional sanity checking, but appears to work.
125  *
126  */
127 
128 static void req_done(struct virtqueue *vq)
129 {
130 	struct virtio_chan *chan = vq->vdev->priv;
131 	unsigned int len;
132 	struct p9_req_t *req;
133 	bool need_wakeup = false;
134 	unsigned long flags;
135 
136 	p9_debug(P9_DEBUG_TRANS, ": request done\n");
137 
138 	spin_lock_irqsave(&chan->lock, flags);
139 	while ((req = virtqueue_get_buf(chan->vq, &len)) != NULL) {
140 		if (!chan->ring_bufs_avail) {
141 			chan->ring_bufs_avail = 1;
142 			need_wakeup = true;
143 		}
144 
145 		if (len) {
146 			req->rc.size = len;
147 			p9_client_cb(chan->client, req, REQ_STATUS_RCVD);
148 		}
149 	}
150 	spin_unlock_irqrestore(&chan->lock, flags);
151 	/* Wakeup if anyone waiting for VirtIO ring space. */
152 	if (need_wakeup)
153 		wake_up(chan->vc_wq);
154 }
155 
156 /**
157  * pack_sg_list - pack a scatter gather list from a linear buffer
158  * @sg: scatter/gather list to pack into
159  * @start: which segment of the sg_list to start at
160  * @limit: maximum segment to pack data to
161  * @data: data to pack into scatter/gather list
162  * @count: amount of data to pack into the scatter/gather list
163  *
164  * sg_lists have multiple segments of various sizes.  This will pack
165  * arbitrary data into an existing scatter gather list, segmenting the
166  * data as necessary within constraints.
167  *
168  */
169 
170 static int pack_sg_list(struct scatterlist *sg, int start,
171 			int limit, char *data, int count)
172 {
173 	int s;
174 	int index = start;
175 
176 	while (count) {
177 		s = rest_of_page(data);
178 		if (s > count)
179 			s = count;
180 		BUG_ON(index >= limit);
181 		/* Make sure we don't terminate early. */
182 		sg_unmark_end(&sg[index]);
183 		sg_set_buf(&sg[index++], data, s);
184 		count -= s;
185 		data += s;
186 	}
187 	if (index-start)
188 		sg_mark_end(&sg[index - 1]);
189 	return index-start;
190 }
191 
/*
 * Cancelling a virtio request is currently not allowed, so this
 * unconditionally returns 1.
 */
static int p9_virtio_cancel(struct p9_client *client, struct p9_req_t *req)
{
	return 1;
}
197 
/* No reply will arrive for @req any more, so give up its reference. */
static int p9_virtio_cancelled(struct p9_client *client, struct p9_req_t *req)
{
	p9_req_put(client, req);

	return 0;
}
204 
205 /**
206  * pack_sg_list_p - Just like pack_sg_list. Instead of taking a buffer,
207  * this takes a list of pages.
208  * @sg: scatter/gather list to pack into
209  * @start: which segment of the sg_list to start at
210  * @limit: maximum number of pages in sg list.
211  * @pdata: a list of pages to add into sg.
212  * @nr_pages: number of pages to pack into the scatter/gather list
213  * @offs: amount of data in the beginning of first page _not_ to pack
214  * @count: amount of data to pack into the scatter/gather list
215  */
216 static int
217 pack_sg_list_p(struct scatterlist *sg, int start, int limit,
218 	       struct page **pdata, int nr_pages, size_t offs, int count)
219 {
220 	int i = 0, s;
221 	int data_off = offs;
222 	int index = start;
223 
224 	BUG_ON(nr_pages > (limit - start));
225 	/*
226 	 * if the first page doesn't start at
227 	 * page boundary find the offset
228 	 */
229 	while (nr_pages) {
230 		s = PAGE_SIZE - data_off;
231 		if (s > count)
232 			s = count;
233 		BUG_ON(index >= limit);
234 		/* Make sure we don't terminate early. */
235 		sg_unmark_end(&sg[index]);
236 		sg_set_page(&sg[index++], pdata[i++], s, data_off);
237 		data_off = 0;
238 		count -= s;
239 		nr_pages--;
240 	}
241 
242 	if (index-start)
243 		sg_mark_end(&sg[index - 1]);
244 	return index - start;
245 }
246 
247 /**
248  * p9_virtio_request - issue a request
249  * @client: client instance issuing the request
250  * @req: request to be issued
251  *
252  */
253 
254 static int
255 p9_virtio_request(struct p9_client *client, struct p9_req_t *req)
256 {
257 	int err;
258 	int in, out, out_sgs, in_sgs;
259 	unsigned long flags;
260 	struct virtio_chan *chan = client->trans;
261 	struct scatterlist *sgs[2];
262 
263 	p9_debug(P9_DEBUG_TRANS, "9p debug: virtio request\n");
264 
265 	WRITE_ONCE(req->status, REQ_STATUS_SENT);
266 req_retry:
267 	spin_lock_irqsave(&chan->lock, flags);
268 
269 	out_sgs = in_sgs = 0;
270 	/* Handle out VirtIO ring buffers */
271 	out = pack_sg_list(chan->sg, 0,
272 			   VIRTQUEUE_NUM, req->tc.sdata, req->tc.size);
273 	if (out)
274 		sgs[out_sgs++] = chan->sg;
275 
276 	in = pack_sg_list(chan->sg, out,
277 			  VIRTQUEUE_NUM, req->rc.sdata, req->rc.capacity);
278 	if (in)
279 		sgs[out_sgs + in_sgs++] = chan->sg + out;
280 
281 	err = virtqueue_add_sgs(chan->vq, sgs, out_sgs, in_sgs, req,
282 				GFP_ATOMIC);
283 	if (err < 0) {
284 		if (err == -ENOSPC) {
285 			chan->ring_bufs_avail = 0;
286 			spin_unlock_irqrestore(&chan->lock, flags);
287 			err = io_wait_event_killable(*chan->vc_wq,
288 						     chan->ring_bufs_avail);
289 			if (err  == -ERESTARTSYS)
290 				return err;
291 
292 			p9_debug(P9_DEBUG_TRANS, "Retry virtio request\n");
293 			goto req_retry;
294 		} else {
295 			spin_unlock_irqrestore(&chan->lock, flags);
296 			p9_debug(P9_DEBUG_TRANS,
297 				 "virtio rpc add_sgs returned failure\n");
298 			return -EIO;
299 		}
300 	}
301 	virtqueue_kick(chan->vq);
302 	spin_unlock_irqrestore(&chan->lock, flags);
303 
304 	p9_debug(P9_DEBUG_TRANS, "virtio request kicked\n");
305 	return 0;
306 }
307 
308 static int p9_get_mapped_pages(struct virtio_chan *chan,
309 			       struct page ***pages,
310 			       struct iov_iter *data,
311 			       int count,
312 			       size_t *offs,
313 			       int *need_drop)
314 {
315 	int nr_pages;
316 	int err;
317 
318 	if (!iov_iter_count(data))
319 		return 0;
320 
321 	if (!iov_iter_is_kvec(data)) {
322 		int n;
323 		/*
324 		 * We allow only p9_max_pages pinned. We wait for the
325 		 * Other zc request to finish here
326 		 */
327 		if (atomic_read(&vp_pinned) >= chan->p9_max_pages) {
328 			err = io_wait_event_killable(vp_wq,
329 			      (atomic_read(&vp_pinned) < chan->p9_max_pages));
330 			if (err == -ERESTARTSYS)
331 				return err;
332 		}
333 		n = iov_iter_get_pages_alloc2(data, pages, count, offs);
334 		if (n < 0)
335 			return n;
336 		*need_drop = 1;
337 		nr_pages = DIV_ROUND_UP(n + *offs, PAGE_SIZE);
338 		atomic_add(nr_pages, &vp_pinned);
339 		return n;
340 	} else {
341 		/* kernel buffer, no need to pin pages */
342 		int index;
343 		size_t len;
344 		void *p;
345 
346 		/* we'd already checked that it's non-empty */
347 		while (1) {
348 			len = iov_iter_single_seg_count(data);
349 			if (likely(len)) {
350 				p = data->kvec->iov_base + data->iov_offset;
351 				break;
352 			}
353 			iov_iter_advance(data, 0);
354 		}
355 		if (len > count)
356 			len = count;
357 
358 		nr_pages = DIV_ROUND_UP((unsigned long)p + len, PAGE_SIZE) -
359 			   (unsigned long)p / PAGE_SIZE;
360 
361 		*pages = kmalloc_objs(struct page *, nr_pages, GFP_NOFS);
362 		if (!*pages)
363 			return -ENOMEM;
364 
365 		*need_drop = 0;
366 		p -= (*offs = offset_in_page(p));
367 		for (index = 0; index < nr_pages; index++) {
368 			if (is_vmalloc_addr(p))
369 				(*pages)[index] = vmalloc_to_page(p);
370 			else
371 				(*pages)[index] = kmap_to_page(p);
372 			p += PAGE_SIZE;
373 		}
374 		iov_iter_advance(data, len);
375 		return len;
376 	}
377 }
378 
379 static void handle_rerror(struct p9_req_t *req, int in_hdr_len,
380 			  size_t offs, struct page **pages)
381 {
382 	unsigned size, n;
383 	void *to = req->rc.sdata + in_hdr_len;
384 
385 	// Fits entirely into the static data?  Nothing to do.
386 	if (req->rc.size < in_hdr_len || !pages)
387 		return;
388 
389 	// Really long error message?  Tough, truncate the reply.  Might get
390 	// rejected (we can't be arsed to adjust the size encoded in header,
391 	// or string size for that matter), but it wouldn't be anything valid
392 	// anyway.
393 	if (unlikely(req->rc.size > P9_ZC_HDR_SZ))
394 		req->rc.size = P9_ZC_HDR_SZ;
395 
396 	// data won't span more than two pages
397 	size = req->rc.size - in_hdr_len;
398 	n = PAGE_SIZE - offs;
399 	if (size > n) {
400 		memcpy_from_page(to, *pages++, offs, n);
401 		offs = 0;
402 		to += n;
403 		size -= n;
404 	}
405 	memcpy_from_page(to, *pages, offs, size);
406 }
407 
408 /**
409  * p9_virtio_zc_request - issue a zero copy request
410  * @client: client instance issuing the request
411  * @req: request to be issued
412  * @uidata: user buffer that should be used for zero copy read
413  * @uodata: user buffer that should be used for zero copy write
414  * @inlen: read buffer size
415  * @outlen: write buffer size
416  * @in_hdr_len: reader header size, This is the size of response protocol data
417  *
418  */
419 static int
420 p9_virtio_zc_request(struct p9_client *client, struct p9_req_t *req,
421 		     struct iov_iter *uidata, struct iov_iter *uodata,
422 		     int inlen, int outlen, int in_hdr_len)
423 {
424 	int in, out, err, out_sgs, in_sgs;
425 	unsigned long flags;
426 	int in_nr_pages = 0, out_nr_pages = 0;
427 	struct page **in_pages = NULL, **out_pages = NULL;
428 	struct virtio_chan *chan = client->trans;
429 	struct scatterlist *sgs[4];
430 	size_t offs = 0;
431 	int need_drop = 0;
432 	int kicked = 0;
433 
434 	p9_debug(P9_DEBUG_TRANS, "virtio request\n");
435 
436 	if (uodata) {
437 		__le32 sz;
438 		int n = p9_get_mapped_pages(chan, &out_pages, uodata,
439 					    outlen, &offs, &need_drop);
440 		if (n < 0) {
441 			err = n;
442 			goto err_out;
443 		}
444 		out_nr_pages = DIV_ROUND_UP(n + offs, PAGE_SIZE);
445 		if (n != outlen) {
446 			__le32 v = cpu_to_le32(n);
447 			memcpy(&req->tc.sdata[req->tc.size - 4], &v, 4);
448 			outlen = n;
449 		}
450 		/* The size field of the message must include the length of the
451 		 * header and the length of the data.  We didn't actually know
452 		 * the length of the data until this point so add it in now.
453 		 */
454 		sz = cpu_to_le32(req->tc.size + outlen);
455 		memcpy(&req->tc.sdata[0], &sz, sizeof(sz));
456 	} else if (uidata) {
457 		int n = p9_get_mapped_pages(chan, &in_pages, uidata,
458 					    inlen, &offs, &need_drop);
459 		if (n < 0) {
460 			err = n;
461 			goto err_out;
462 		}
463 		in_nr_pages = DIV_ROUND_UP(n + offs, PAGE_SIZE);
464 		if (n != inlen) {
465 			__le32 v = cpu_to_le32(n);
466 			memcpy(&req->tc.sdata[req->tc.size - 4], &v, 4);
467 			inlen = n;
468 		}
469 	}
470 	WRITE_ONCE(req->status, REQ_STATUS_SENT);
471 req_retry_pinned:
472 	spin_lock_irqsave(&chan->lock, flags);
473 
474 	out_sgs = in_sgs = 0;
475 
476 	/* out data */
477 	out = pack_sg_list(chan->sg, 0,
478 			   VIRTQUEUE_NUM, req->tc.sdata, req->tc.size);
479 
480 	if (out)
481 		sgs[out_sgs++] = chan->sg;
482 
483 	if (out_pages) {
484 		sgs[out_sgs++] = chan->sg + out;
485 		out += pack_sg_list_p(chan->sg, out, VIRTQUEUE_NUM,
486 				      out_pages, out_nr_pages, offs, outlen);
487 	}
488 
489 	/*
490 	 * Take care of in data
491 	 * For example TREAD have 11.
492 	 * 11 is the read/write header = PDU Header(7) + IO Size (4).
493 	 * Arrange in such a way that server places header in the
494 	 * allocated memory and payload onto the user buffer.
495 	 */
496 	in = pack_sg_list(chan->sg, out,
497 			  VIRTQUEUE_NUM, req->rc.sdata, in_hdr_len);
498 	if (in)
499 		sgs[out_sgs + in_sgs++] = chan->sg + out;
500 
501 	if (in_pages) {
502 		sgs[out_sgs + in_sgs++] = chan->sg + out + in;
503 		pack_sg_list_p(chan->sg, out + in, VIRTQUEUE_NUM,
504 			       in_pages, in_nr_pages, offs, inlen);
505 	}
506 
507 	BUG_ON(out_sgs + in_sgs > ARRAY_SIZE(sgs));
508 	err = virtqueue_add_sgs(chan->vq, sgs, out_sgs, in_sgs, req,
509 				GFP_ATOMIC);
510 	if (err < 0) {
511 		if (err == -ENOSPC) {
512 			chan->ring_bufs_avail = 0;
513 			spin_unlock_irqrestore(&chan->lock, flags);
514 			err = io_wait_event_killable(*chan->vc_wq,
515 						     chan->ring_bufs_avail);
516 			if (err  == -ERESTARTSYS)
517 				goto err_out;
518 
519 			p9_debug(P9_DEBUG_TRANS, "Retry virtio request\n");
520 			goto req_retry_pinned;
521 		} else {
522 			spin_unlock_irqrestore(&chan->lock, flags);
523 			p9_debug(P9_DEBUG_TRANS,
524 				 "virtio rpc add_sgs returned failure\n");
525 			err = -EIO;
526 			goto err_out;
527 		}
528 	}
529 	virtqueue_kick(chan->vq);
530 	spin_unlock_irqrestore(&chan->lock, flags);
531 	kicked = 1;
532 	p9_debug(P9_DEBUG_TRANS, "virtio request kicked\n");
533 	err = io_wait_event_killable(req->wq,
534 				     READ_ONCE(req->status) >= REQ_STATUS_RCVD);
535 	/*
536 	 * Make sure our req is coherent with regard to updates in other
537 	 * threads - echoes to wmb() in the callback
538 	 */
539 	smp_rmb();
540 	// RERROR needs reply (== error string) in static data
541 	if (READ_ONCE(req->status) == REQ_STATUS_RCVD &&
542 	    unlikely(req->rc.sdata[4] == P9_RERROR))
543 		handle_rerror(req, in_hdr_len, offs, in_pages);
544 
545 	/*
546 	 * Non kernel buffers are pinned, unpin them
547 	 */
548 err_out:
549 	if (need_drop) {
550 		if (in_pages) {
551 			p9_release_pages(in_pages, in_nr_pages);
552 			atomic_sub(in_nr_pages, &vp_pinned);
553 		}
554 		if (out_pages) {
555 			p9_release_pages(out_pages, out_nr_pages);
556 			atomic_sub(out_nr_pages, &vp_pinned);
557 		}
558 		/* wakeup anybody waiting for slots to pin pages */
559 		wake_up(&vp_wq);
560 	}
561 	kvfree(in_pages);
562 	kvfree(out_pages);
563 	if (!kicked) {
564 		/* reply won't come */
565 		p9_req_put(client, req);
566 	}
567 	return err;
568 }
569 
570 static ssize_t p9_mount_tag_show(struct device *dev,
571 				struct device_attribute *attr, char *buf)
572 {
573 	struct virtio_chan *chan;
574 	struct virtio_device *vdev;
575 	int tag_len;
576 
577 	vdev = dev_to_virtio(dev);
578 	chan = vdev->priv;
579 	tag_len = strlen(chan->tag);
580 
581 	memcpy(buf, chan->tag, tag_len + 1);
582 
583 	return tag_len + 1;
584 }
585 
586 static DEVICE_ATTR(mount_tag, 0444, p9_mount_tag_show, NULL);
587 
588 /**
589  * p9_virtio_probe - probe for existence of 9P virtio channels
590  * @vdev: virtio device to probe
591  *
592  * This probes for existing virtio channels.
593  *
594  */
595 
596 static int p9_virtio_probe(struct virtio_device *vdev)
597 {
598 	__u16 tag_len;
599 	char *tag;
600 	int err;
601 	struct virtio_chan *chan;
602 
603 	if (!vdev->config->get) {
604 		dev_err(&vdev->dev, "%s failure: config access disabled\n",
605 			__func__);
606 		return -EINVAL;
607 	}
608 
609 	chan = kmalloc_obj(struct virtio_chan);
610 	if (!chan) {
611 		pr_err("Failed to allocate virtio 9P channel\n");
612 		err = -ENOMEM;
613 		goto fail;
614 	}
615 
616 	chan->vdev = vdev;
617 
618 	/* We expect one virtqueue, for requests. */
619 	chan->vq = virtio_find_single_vq(vdev, req_done, "requests");
620 	if (IS_ERR(chan->vq)) {
621 		err = PTR_ERR(chan->vq);
622 		goto out_free_chan;
623 	}
624 	chan->vq->vdev->priv = chan;
625 	spin_lock_init(&chan->lock);
626 
627 	sg_init_table(chan->sg, VIRTQUEUE_NUM);
628 
629 	chan->inuse = false;
630 	if (virtio_has_feature(vdev, VIRTIO_9P_MOUNT_TAG)) {
631 		virtio_cread(vdev, struct virtio_9p_config, tag_len, &tag_len);
632 	} else {
633 		err = -EINVAL;
634 		goto out_free_vq;
635 	}
636 	tag = kzalloc(tag_len + 1, GFP_KERNEL);
637 	if (!tag) {
638 		err = -ENOMEM;
639 		goto out_free_vq;
640 	}
641 
642 	virtio_cread_bytes(vdev, offsetof(struct virtio_9p_config, tag),
643 			   tag, tag_len);
644 	chan->tag = tag;
645 	err = sysfs_create_file(&(vdev->dev.kobj), &dev_attr_mount_tag.attr);
646 	if (err) {
647 		goto out_free_tag;
648 	}
649 	chan->vc_wq = kmalloc_obj(wait_queue_head_t);
650 	if (!chan->vc_wq) {
651 		err = -ENOMEM;
652 		goto out_remove_file;
653 	}
654 	init_waitqueue_head(chan->vc_wq);
655 	chan->ring_bufs_avail = 1;
656 	/* Ceiling limit to avoid denial of service attacks */
657 	chan->p9_max_pages = nr_free_buffer_pages()/4;
658 
659 	virtio_device_ready(vdev);
660 
661 	mutex_lock(&virtio_9p_lock);
662 	list_add_tail(&chan->chan_list, &virtio_chan_list);
663 	mutex_unlock(&virtio_9p_lock);
664 
665 	/* Let udev rules use the new mount_tag attribute. */
666 	kobject_uevent(&(vdev->dev.kobj), KOBJ_CHANGE);
667 
668 	return 0;
669 
670 out_remove_file:
671 	sysfs_remove_file(&vdev->dev.kobj, &dev_attr_mount_tag.attr);
672 out_free_tag:
673 	kfree(tag);
674 out_free_vq:
675 	vdev->config->del_vqs(vdev);
676 out_free_chan:
677 	kfree(chan);
678 fail:
679 	return err;
680 }
681 
682 
683 /**
684  * p9_virtio_create - allocate a new virtio channel
685  * @client: client instance invoking this transport
686  * @fc: the filesystem context
687  *
688  * This sets up a transport channel for 9p communication.  Right now
689  * we only match the first available channel, but eventually we could look up
690  * alternate channels by matching devname versus a virtio_config entry.
691  * We use a simple reference count mechanism to ensure that only a single
692  * mount has a channel open at a time.
693  *
694  */
695 
696 static int
697 p9_virtio_create(struct p9_client *client, struct fs_context *fc)
698 {
699 	const char *devname = fc->source;
700 	struct virtio_chan *chan;
701 	int ret = -ENOENT;
702 	int found = 0;
703 
704 	if (devname == NULL)
705 		return -EINVAL;
706 
707 	mutex_lock(&virtio_9p_lock);
708 	list_for_each_entry(chan, &virtio_chan_list, chan_list) {
709 		if (!strcmp(devname, chan->tag)) {
710 			if (!chan->inuse) {
711 				chan->inuse = true;
712 				found = 1;
713 				break;
714 			}
715 			ret = -EBUSY;
716 		}
717 	}
718 	mutex_unlock(&virtio_9p_lock);
719 
720 	if (!found) {
721 		pr_err("no channels available for device %s\n", devname);
722 		return ret;
723 	}
724 
725 	client->trans = (void *)chan;
726 	client->status = Connected;
727 	chan->client = client;
728 
729 	return 0;
730 }
731 
732 /**
733  * p9_virtio_remove - clean up resources associated with a virtio device
734  * @vdev: virtio device to remove
735  *
736  */
737 
738 static void p9_virtio_remove(struct virtio_device *vdev)
739 {
740 	struct virtio_chan *chan = vdev->priv;
741 	unsigned long warning_time;
742 
743 	mutex_lock(&virtio_9p_lock);
744 
745 	/* Remove self from list so we don't get new users. */
746 	list_del(&chan->chan_list);
747 	warning_time = jiffies;
748 
749 	/* Wait for existing users to close. */
750 	while (chan->inuse) {
751 		mutex_unlock(&virtio_9p_lock);
752 		msleep(250);
753 		if (time_after(jiffies, warning_time + 10 * HZ)) {
754 			dev_emerg(&vdev->dev,
755 				  "p9_virtio_remove: waiting for device in use.\n");
756 			warning_time = jiffies;
757 		}
758 		mutex_lock(&virtio_9p_lock);
759 	}
760 
761 	mutex_unlock(&virtio_9p_lock);
762 
763 	virtio_reset_device(vdev);
764 	vdev->config->del_vqs(vdev);
765 
766 	sysfs_remove_file(&(vdev->dev.kobj), &dev_attr_mount_tag.attr);
767 	kobject_uevent(&(vdev->dev.kobj), KOBJ_CHANGE);
768 	kfree(chan->tag);
769 	kfree(chan->vc_wq);
770 	kfree(chan);
771 
772 }
773 
774 static struct virtio_device_id id_table[] = {
775 	{ VIRTIO_ID_9P, VIRTIO_DEV_ANY_ID },
776 	{ 0 },
777 };
778 
779 static unsigned int features[] = {
780 	VIRTIO_9P_MOUNT_TAG,
781 };
782 
783 /* The standard "struct lguest_driver": */
784 static struct virtio_driver p9_virtio_drv = {
785 	.feature_table  = features,
786 	.feature_table_size = ARRAY_SIZE(features),
787 	.driver.name    = KBUILD_MODNAME,
788 	.id_table	= id_table,
789 	.probe		= p9_virtio_probe,
790 	.remove		= p9_virtio_remove,
791 };
792 
793 static struct p9_trans_module p9_virtio_trans = {
794 	.name = "virtio",
795 	.create = p9_virtio_create,
796 	.close = p9_virtio_close,
797 	.request = p9_virtio_request,
798 	.zc_request = p9_virtio_zc_request,
799 	.cancel = p9_virtio_cancel,
800 	.cancelled = p9_virtio_cancelled,
801 	/*
802 	 * We leave one entry for input and one entry for response
803 	 * headers. We also skip one more entry to accommodate, address
804 	 * that are not at page boundary, that can result in an extra
805 	 * page in zero copy.
806 	 */
807 	.maxsize = PAGE_SIZE * (VIRTQUEUE_NUM - 3),
808 	.pooled_rbuffers = false,
809 	.def = true,
810 	.supports_vmalloc = false,
811 	.owner = THIS_MODULE,
812 };
813 
814 /* The standard init function */
815 static int __init p9_virtio_init(void)
816 {
817 	int rc;
818 
819 	INIT_LIST_HEAD(&virtio_chan_list);
820 
821 	v9fs_register_trans(&p9_virtio_trans);
822 	rc = register_virtio_driver(&p9_virtio_drv);
823 	if (rc)
824 		v9fs_unregister_trans(&p9_virtio_trans);
825 
826 	return rc;
827 }
828 
829 static void __exit p9_virtio_cleanup(void)
830 {
831 	unregister_virtio_driver(&p9_virtio_drv);
832 	v9fs_unregister_trans(&p9_virtio_trans);
833 }
834 
835 module_init(p9_virtio_init);
836 module_exit(p9_virtio_cleanup);
837 MODULE_ALIAS_9P("virtio");
838 
839 MODULE_DEVICE_TABLE(virtio, id_table);
840 MODULE_AUTHOR("Eric Van Hensbergen <ericvh@gmail.com>");
841 MODULE_DESCRIPTION("Virtio 9p Transport");
842 MODULE_LICENSE("GPL");
843