xref: /freebsd/sys/dev/nvd/nvd.c (revision ee7f4d8187356cd961ca8a7a5349f3e28e9225ea)
1bb0ec6b3SJim Harris /*-
2aeae6079SJim Harris  * Copyright (C) 2012-2016 Intel Corporation
3bb0ec6b3SJim Harris  * All rights reserved.
4bb0ec6b3SJim Harris  *
5bb0ec6b3SJim Harris  * Redistribution and use in source and binary forms, with or without
6bb0ec6b3SJim Harris  * modification, are permitted provided that the following conditions
7bb0ec6b3SJim Harris  * are met:
8bb0ec6b3SJim Harris  * 1. Redistributions of source code must retain the above copyright
9bb0ec6b3SJim Harris  *    notice, this list of conditions and the following disclaimer.
10bb0ec6b3SJim Harris  * 2. Redistributions in binary form must reproduce the above copyright
11bb0ec6b3SJim Harris  *    notice, this list of conditions and the following disclaimer in the
12bb0ec6b3SJim Harris  *    documentation and/or other materials provided with the distribution.
13bb0ec6b3SJim Harris  *
14bb0ec6b3SJim Harris  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15bb0ec6b3SJim Harris  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16bb0ec6b3SJim Harris  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17bb0ec6b3SJim Harris  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18bb0ec6b3SJim Harris  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19bb0ec6b3SJim Harris  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20bb0ec6b3SJim Harris  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21bb0ec6b3SJim Harris  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22bb0ec6b3SJim Harris  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23bb0ec6b3SJim Harris  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24bb0ec6b3SJim Harris  * SUCH DAMAGE.
25bb0ec6b3SJim Harris  */
26bb0ec6b3SJim Harris 
27bb0ec6b3SJim Harris #include <sys/cdefs.h>
28bb0ec6b3SJim Harris __FBSDID("$FreeBSD$");
29bb0ec6b3SJim Harris 
30bb0ec6b3SJim Harris #include <sys/param.h>
31bb0ec6b3SJim Harris #include <sys/bio.h>
32bb0ec6b3SJim Harris #include <sys/kernel.h>
33bb0ec6b3SJim Harris #include <sys/malloc.h>
34bb0ec6b3SJim Harris #include <sys/module.h>
35aeae6079SJim Harris #include <sys/sysctl.h>
36bb0ec6b3SJim Harris #include <sys/systm.h>
37bb0ec6b3SJim Harris #include <sys/taskqueue.h>
38bb0ec6b3SJim Harris 
39bb0ec6b3SJim Harris #include <geom/geom.h>
40bb0ec6b3SJim Harris #include <geom/geom_disk.h>
41bb0ec6b3SJim Harris 
42bb0ec6b3SJim Harris #include <dev/nvme/nvme.h>
43bb0ec6b3SJim Harris 
4438441bd9SJim Harris #define NVD_STR		"nvd"
4538441bd9SJim Harris 
46bb0ec6b3SJim Harris struct nvd_disk;
47bb0ec6b3SJim Harris 
48bb0ec6b3SJim Harris static disk_ioctl_t nvd_ioctl;
49bb0ec6b3SJim Harris static disk_strategy_t nvd_strategy;
50bb0ec6b3SJim Harris 
5147ef4244SJim Harris static void nvd_done(void *arg, const struct nvme_completion *cpl);
5247ef4244SJim Harris 
53ec84ecbbSJim Harris static void *nvd_new_disk(struct nvme_namespace *ns, void *ctrlr);
54bb0ec6b3SJim Harris static void destroy_geom_disk(struct nvd_disk *ndisk);
55bb0ec6b3SJim Harris 
56ec84ecbbSJim Harris static void *nvd_new_controller(struct nvme_controller *ctrlr);
57232e2edbSJim Harris static void nvd_controller_fail(void *ctrlr);
58ec84ecbbSJim Harris 
59bb0ec6b3SJim Harris static int nvd_load(void);
60bb0ec6b3SJim Harris static void nvd_unload(void);
61bb0ec6b3SJim Harris 
62bb0ec6b3SJim Harris MALLOC_DEFINE(M_NVD, "nvd", "nvd(4) allocations");
63bb0ec6b3SJim Harris 
64bb0ec6b3SJim Harris struct nvme_consumer *consumer_handle;
65bb0ec6b3SJim Harris 
66bb0ec6b3SJim Harris struct nvd_disk {
67bb0ec6b3SJim Harris 
68bb0ec6b3SJim Harris 	struct bio_queue_head	bioq;
69bb0ec6b3SJim Harris 	struct task		bioqtask;
70bb0ec6b3SJim Harris 	struct mtx		bioqlock;
71bb0ec6b3SJim Harris 
72bb0ec6b3SJim Harris 	struct disk		*disk;
73bb0ec6b3SJim Harris 	struct taskqueue	*tq;
74bb0ec6b3SJim Harris 	struct nvme_namespace	*ns;
75bb0ec6b3SJim Harris 
76bb0ec6b3SJim Harris 	uint32_t		cur_depth;
7758d0b8f3SJim Harris 	uint32_t		ordered_in_flight;
78bb0ec6b3SJim Harris 
79ec84ecbbSJim Harris 	TAILQ_ENTRY(nvd_disk)	global_tailq;
80ec84ecbbSJim Harris 	TAILQ_ENTRY(nvd_disk)	ctrlr_tailq;
81bb0ec6b3SJim Harris };
82bb0ec6b3SJim Harris 
83ec84ecbbSJim Harris struct nvd_controller {
84ec84ecbbSJim Harris 
85ec84ecbbSJim Harris 	TAILQ_ENTRY(nvd_controller)	tailq;
86ec84ecbbSJim Harris 	TAILQ_HEAD(, nvd_disk)		disk_head;
87ec84ecbbSJim Harris };
88ec84ecbbSJim Harris 
89ec84ecbbSJim Harris static TAILQ_HEAD(, nvd_controller)	ctrlr_head;
90ec84ecbbSJim Harris static TAILQ_HEAD(disk_list, nvd_disk)	disk_head;
91bb0ec6b3SJim Harris 
92aeae6079SJim Harris static SYSCTL_NODE(_hw, OID_AUTO, nvd, CTLFLAG_RD, 0, "nvd driver parameters");
93aeae6079SJim Harris /*
94aeae6079SJim Harris  * The NVMe specification does not define a maximum or optimal delete size, so
95aeae6079SJim Harris  *  technically max delete size is min(full size of the namespace, 2^32 - 1
96aeae6079SJim Harris  *  LBAs).  A single delete for a multi-TB NVMe namespace though may take much
97aeae6079SJim Harris  *  longer to complete than the nvme(4) I/O timeout period.  So choose a sensible
98aeae6079SJim Harris  *  default here that is still suitably large to minimize the number of overall
99aeae6079SJim Harris  *  delete operations.
100aeae6079SJim Harris  */
101aeae6079SJim Harris static uint64_t nvd_delete_max = (1024 * 1024 * 1024);  /* 1GB */
102aeae6079SJim Harris SYSCTL_UQUAD(_hw_nvd, OID_AUTO, delete_max, CTLFLAG_RDTUN, &nvd_delete_max, 0,
103aeae6079SJim Harris 	     "nvd maximum BIO_DELETE size in bytes");
104aeae6079SJim Harris 
105bb0ec6b3SJim Harris static int nvd_modevent(module_t mod, int type, void *arg)
106bb0ec6b3SJim Harris {
107bb0ec6b3SJim Harris 	int error = 0;
108bb0ec6b3SJim Harris 
109bb0ec6b3SJim Harris 	switch (type) {
110bb0ec6b3SJim Harris 	case MOD_LOAD:
111bb0ec6b3SJim Harris 		error = nvd_load();
112bb0ec6b3SJim Harris 		break;
113bb0ec6b3SJim Harris 	case MOD_UNLOAD:
114bb0ec6b3SJim Harris 		nvd_unload();
115bb0ec6b3SJim Harris 		break;
116bb0ec6b3SJim Harris 	default:
117bb0ec6b3SJim Harris 		break;
118bb0ec6b3SJim Harris 	}
119bb0ec6b3SJim Harris 
120bb0ec6b3SJim Harris 	return (error);
121bb0ec6b3SJim Harris }
122bb0ec6b3SJim Harris 
123bb0ec6b3SJim Harris moduledata_t nvd_mod = {
12438441bd9SJim Harris 	NVD_STR,
125bb0ec6b3SJim Harris 	(modeventhand_t)nvd_modevent,
1269823d527SKevin Lo 	0
127bb0ec6b3SJim Harris };
128bb0ec6b3SJim Harris 
129bb0ec6b3SJim Harris DECLARE_MODULE(nvd, nvd_mod, SI_SUB_DRIVERS, SI_ORDER_ANY);
130bb0ec6b3SJim Harris MODULE_VERSION(nvd, 1);
131bb0ec6b3SJim Harris MODULE_DEPEND(nvd, nvme, 1, 1, 1);
132bb0ec6b3SJim Harris 
133bb0ec6b3SJim Harris static int
134bb0ec6b3SJim Harris nvd_load()
135bb0ec6b3SJim Harris {
136bb0ec6b3SJim Harris 
137ec84ecbbSJim Harris 	TAILQ_INIT(&ctrlr_head);
138ec84ecbbSJim Harris 	TAILQ_INIT(&disk_head);
139ec84ecbbSJim Harris 
140ec84ecbbSJim Harris 	consumer_handle = nvme_register_consumer(nvd_new_disk,
141232e2edbSJim Harris 	    nvd_new_controller, NULL, nvd_controller_fail);
142bb0ec6b3SJim Harris 
143bb0ec6b3SJim Harris 	return (consumer_handle != NULL ? 0 : -1);
144bb0ec6b3SJim Harris }
145bb0ec6b3SJim Harris 
146bb0ec6b3SJim Harris static void
147bb0ec6b3SJim Harris nvd_unload()
148bb0ec6b3SJim Harris {
149ec84ecbbSJim Harris 	struct nvd_controller	*ctrlr;
150ec84ecbbSJim Harris 	struct nvd_disk		*disk;
151bb0ec6b3SJim Harris 
152ec84ecbbSJim Harris 	while (!TAILQ_EMPTY(&ctrlr_head)) {
153ec84ecbbSJim Harris 		ctrlr = TAILQ_FIRST(&ctrlr_head);
154ec84ecbbSJim Harris 		TAILQ_REMOVE(&ctrlr_head, ctrlr, tailq);
155ec84ecbbSJim Harris 		free(ctrlr, M_NVD);
156ec84ecbbSJim Harris 	}
157ec84ecbbSJim Harris 
158ec84ecbbSJim Harris 	while (!TAILQ_EMPTY(&disk_head)) {
159ec84ecbbSJim Harris 		disk = TAILQ_FIRST(&disk_head);
160ec84ecbbSJim Harris 		TAILQ_REMOVE(&disk_head, disk, global_tailq);
161ec84ecbbSJim Harris 		destroy_geom_disk(disk);
162ec84ecbbSJim Harris 		free(disk, M_NVD);
163bb0ec6b3SJim Harris 	}
164bb0ec6b3SJim Harris 
165bb0ec6b3SJim Harris 	nvme_unregister_consumer(consumer_handle);
166bb0ec6b3SJim Harris }
167bb0ec6b3SJim Harris 
16847ef4244SJim Harris static int
16947ef4244SJim Harris nvd_bio_submit(struct nvd_disk *ndisk, struct bio *bp)
17047ef4244SJim Harris {
17147ef4244SJim Harris 	int err;
17247ef4244SJim Harris 
17347ef4244SJim Harris 	bp->bio_driver1 = NULL;
17447ef4244SJim Harris 	atomic_add_int(&ndisk->cur_depth, 1);
17547ef4244SJim Harris 	err = nvme_ns_bio_process(ndisk->ns, bp, nvd_done);
17647ef4244SJim Harris 	if (err) {
17747ef4244SJim Harris 		atomic_add_int(&ndisk->cur_depth, -1);
17858d0b8f3SJim Harris 		if (__predict_false(bp->bio_flags & BIO_ORDERED))
17958d0b8f3SJim Harris 			atomic_add_int(&ndisk->ordered_in_flight, -1);
18047ef4244SJim Harris 		bp->bio_error = err;
18147ef4244SJim Harris 		bp->bio_flags |= BIO_ERROR;
18247ef4244SJim Harris 		bp->bio_resid = bp->bio_bcount;
18347ef4244SJim Harris 		biodone(bp);
18447ef4244SJim Harris 		return (-1);
18547ef4244SJim Harris 	}
18647ef4244SJim Harris 
18747ef4244SJim Harris 	return (0);
18847ef4244SJim Harris }
18947ef4244SJim Harris 
190bb0ec6b3SJim Harris static void
191bb0ec6b3SJim Harris nvd_strategy(struct bio *bp)
192bb0ec6b3SJim Harris {
193bb0ec6b3SJim Harris 	struct nvd_disk *ndisk;
194bb0ec6b3SJim Harris 
195bb0ec6b3SJim Harris 	ndisk = (struct nvd_disk *)bp->bio_disk->d_drv1;
196bb0ec6b3SJim Harris 
19758d0b8f3SJim Harris 	if (__predict_false(bp->bio_flags & BIO_ORDERED))
19858d0b8f3SJim Harris 		atomic_add_int(&ndisk->ordered_in_flight, 1);
19958d0b8f3SJim Harris 
20058d0b8f3SJim Harris 	if (__predict_true(ndisk->ordered_in_flight == 0)) {
20158d0b8f3SJim Harris 		nvd_bio_submit(ndisk, bp);
20258d0b8f3SJim Harris 		return;
20358d0b8f3SJim Harris 	}
20458d0b8f3SJim Harris 
20558d0b8f3SJim Harris 	/*
20658d0b8f3SJim Harris 	 * There are ordered bios in flight, so we need to submit
20758d0b8f3SJim Harris 	 *  bios through the task queue to enforce ordering.
20858d0b8f3SJim Harris 	 */
209bb0ec6b3SJim Harris 	mtx_lock(&ndisk->bioqlock);
210bb0ec6b3SJim Harris 	bioq_insert_tail(&ndisk->bioq, bp);
211bb0ec6b3SJim Harris 	mtx_unlock(&ndisk->bioqlock);
212bb0ec6b3SJim Harris 	taskqueue_enqueue(ndisk->tq, &ndisk->bioqtask);
213bb0ec6b3SJim Harris }
214bb0ec6b3SJim Harris 
215bb0ec6b3SJim Harris static int
216bb0ec6b3SJim Harris nvd_ioctl(struct disk *ndisk, u_long cmd, void *data, int fflag,
217bb0ec6b3SJim Harris     struct thread *td)
218bb0ec6b3SJim Harris {
219bb0ec6b3SJim Harris 	int ret = 0;
220bb0ec6b3SJim Harris 
221bb0ec6b3SJim Harris 	switch (cmd) {
222bb0ec6b3SJim Harris 	default:
223bb0ec6b3SJim Harris 		ret = EIO;
224bb0ec6b3SJim Harris 	}
225bb0ec6b3SJim Harris 
226bb0ec6b3SJim Harris 	return (ret);
227bb0ec6b3SJim Harris }
228bb0ec6b3SJim Harris 
229bb0ec6b3SJim Harris static void
230cf81529cSJim Harris nvd_done(void *arg, const struct nvme_completion *cpl)
231bb0ec6b3SJim Harris {
232bb0ec6b3SJim Harris 	struct bio *bp;
233bb0ec6b3SJim Harris 	struct nvd_disk *ndisk;
234bb0ec6b3SJim Harris 
235bb0ec6b3SJim Harris 	bp = (struct bio *)arg;
236bb0ec6b3SJim Harris 
237bb0ec6b3SJim Harris 	ndisk = bp->bio_disk->d_drv1;
238bb0ec6b3SJim Harris 
2390f71ecf7SJim Harris 	atomic_add_int(&ndisk->cur_depth, -1);
24058d0b8f3SJim Harris 	if (__predict_false(bp->bio_flags & BIO_ORDERED))
24158d0b8f3SJim Harris 		atomic_add_int(&ndisk->ordered_in_flight, -1);
242bb0ec6b3SJim Harris 
243bb0ec6b3SJim Harris 	biodone(bp);
244bb0ec6b3SJim Harris }
245bb0ec6b3SJim Harris 
246bb0ec6b3SJim Harris static void
247bb0ec6b3SJim Harris nvd_bioq_process(void *arg, int pending)
248bb0ec6b3SJim Harris {
249bb0ec6b3SJim Harris 	struct nvd_disk *ndisk = arg;
250bb0ec6b3SJim Harris 	struct bio *bp;
251bb0ec6b3SJim Harris 
252bb0ec6b3SJim Harris 	for (;;) {
253bb0ec6b3SJim Harris 		mtx_lock(&ndisk->bioqlock);
254bb0ec6b3SJim Harris 		bp = bioq_takefirst(&ndisk->bioq);
255bb0ec6b3SJim Harris 		mtx_unlock(&ndisk->bioqlock);
256bb0ec6b3SJim Harris 		if (bp == NULL)
257bb0ec6b3SJim Harris 			break;
258bb0ec6b3SJim Harris 
25947ef4244SJim Harris 		if (nvd_bio_submit(ndisk, bp) != 0) {
26026ca317aSJim Harris 			continue;
261bb0ec6b3SJim Harris 		}
262bb0ec6b3SJim Harris 
263bb0ec6b3SJim Harris #ifdef BIO_ORDERED
264bb0ec6b3SJim Harris 		/*
265bb0ec6b3SJim Harris 		 * BIO_ORDERED flag dictates that the bio with BIO_ORDERED
266bb0ec6b3SJim Harris 		 *  flag set must be completed before proceeding with
267bb0ec6b3SJim Harris 		 *  additional bios.
268bb0ec6b3SJim Harris 		 */
269bb0ec6b3SJim Harris 		if (bp->bio_flags & BIO_ORDERED) {
270bb0ec6b3SJim Harris 			while (ndisk->cur_depth > 0) {
271bb0ec6b3SJim Harris 				pause("nvd flush", 1);
272bb0ec6b3SJim Harris 			}
273bb0ec6b3SJim Harris 		}
274bb0ec6b3SJim Harris #endif
275bb0ec6b3SJim Harris 	}
276bb0ec6b3SJim Harris }
277bb0ec6b3SJim Harris 
278038a5ee4SJim Harris static void *
279ec84ecbbSJim Harris nvd_new_controller(struct nvme_controller *ctrlr)
280ec84ecbbSJim Harris {
281ec84ecbbSJim Harris 	struct nvd_controller	*nvd_ctrlr;
282ec84ecbbSJim Harris 
283ec84ecbbSJim Harris 	nvd_ctrlr = malloc(sizeof(struct nvd_controller), M_NVD,
284237d2019SJim Harris 	    M_ZERO | M_WAITOK);
285ec84ecbbSJim Harris 
286ec84ecbbSJim Harris 	TAILQ_INIT(&nvd_ctrlr->disk_head);
287ec84ecbbSJim Harris 	TAILQ_INSERT_TAIL(&ctrlr_head, nvd_ctrlr, tailq);
288ec84ecbbSJim Harris 
289ec84ecbbSJim Harris 	return (nvd_ctrlr);
290ec84ecbbSJim Harris }
291ec84ecbbSJim Harris 
292ec84ecbbSJim Harris static void *
293ec84ecbbSJim Harris nvd_new_disk(struct nvme_namespace *ns, void *ctrlr_arg)
294bb0ec6b3SJim Harris {
29538441bd9SJim Harris 	uint8_t			descr[NVME_MODEL_NUMBER_LENGTH+1];
296bb0ec6b3SJim Harris 	struct nvd_disk		*ndisk;
297bb0ec6b3SJim Harris 	struct disk		*disk;
298ec84ecbbSJim Harris 	struct nvd_controller	*ctrlr = ctrlr_arg;
299bb0ec6b3SJim Harris 
300237d2019SJim Harris 	ndisk = malloc(sizeof(struct nvd_disk), M_NVD, M_ZERO | M_WAITOK);
301bb0ec6b3SJim Harris 
302bb0ec6b3SJim Harris 	disk = disk_alloc();
303bb0ec6b3SJim Harris 	disk->d_strategy = nvd_strategy;
304bb0ec6b3SJim Harris 	disk->d_ioctl = nvd_ioctl;
30538441bd9SJim Harris 	disk->d_name = NVD_STR;
306bb0ec6b3SJim Harris 	disk->d_drv1 = ndisk;
307bb0ec6b3SJim Harris 
308bb0ec6b3SJim Harris 	disk->d_maxsize = nvme_ns_get_max_io_xfer_size(ns);
309bb0ec6b3SJim Harris 	disk->d_sectorsize = nvme_ns_get_sector_size(ns);
310bb0ec6b3SJim Harris 	disk->d_mediasize = (off_t)nvme_ns_get_size(ns);
31170fb74bdSJim Harris 	disk->d_delmaxsize = (off_t)nvme_ns_get_size(ns);
312aeae6079SJim Harris 	if (disk->d_delmaxsize > nvd_delete_max)
313aeae6079SJim Harris 		disk->d_delmaxsize = nvd_delete_max;
314*ee7f4d81SAlexander Motin 	disk->d_stripesize = nvme_ns_get_stripesize(ns);
315bb0ec6b3SJim Harris 
316ec84ecbbSJim Harris 	if (TAILQ_EMPTY(&disk_head))
317bb0ec6b3SJim Harris 		disk->d_unit = 0;
318bb0ec6b3SJim Harris 	else
319ec84ecbbSJim Harris 		disk->d_unit =
320ec84ecbbSJim Harris 		    TAILQ_LAST(&disk_head, disk_list)->disk->d_unit + 1;
321bb0ec6b3SJim Harris 
322454f163bSJim Harris 	disk->d_flags = DISKFLAG_DIRECT_COMPLETION;
323bb0ec6b3SJim Harris 
324bb0ec6b3SJim Harris 	if (nvme_ns_get_flags(ns) & NVME_NS_DEALLOCATE_SUPPORTED)
325bb0ec6b3SJim Harris 		disk->d_flags |= DISKFLAG_CANDELETE;
326bb0ec6b3SJim Harris 
327bb0ec6b3SJim Harris 	if (nvme_ns_get_flags(ns) & NVME_NS_FLUSH_SUPPORTED)
328bb0ec6b3SJim Harris 		disk->d_flags |= DISKFLAG_CANFLUSHCACHE;
329bb0ec6b3SJim Harris 
3305fdf9c3cSJim Harris /* ifdef used here to ease porting to stable branches at a later point. */
3315fdf9c3cSJim Harris #ifdef DISKFLAG_UNMAPPED_BIO
3325fdf9c3cSJim Harris 	disk->d_flags |= DISKFLAG_UNMAPPED_BIO;
3335fdf9c3cSJim Harris #endif
3345fdf9c3cSJim Harris 
335e8f25c62SJim Harris 	/*
336e8f25c62SJim Harris 	 * d_ident and d_descr are both far bigger than the length of either
337e8f25c62SJim Harris 	 *  the serial or model number strings.
338e8f25c62SJim Harris 	 */
33938441bd9SJim Harris 	nvme_strvis(disk->d_ident, nvme_ns_get_serial_number(ns),
34038441bd9SJim Harris 	    sizeof(disk->d_ident), NVME_SERIAL_NUMBER_LENGTH);
34138441bd9SJim Harris 
34238441bd9SJim Harris 	nvme_strvis(descr, nvme_ns_get_model_number(ns), sizeof(descr),
34338441bd9SJim Harris 	    NVME_MODEL_NUMBER_LENGTH);
344bb0ec6b3SJim Harris 
345bb0ec6b3SJim Harris #if __FreeBSD_version >= 900034
34638441bd9SJim Harris 	strlcpy(disk->d_descr, descr, sizeof(descr));
347bb0ec6b3SJim Harris #endif
348bb0ec6b3SJim Harris 
349bb0ec6b3SJim Harris 	ndisk->ns = ns;
350bb0ec6b3SJim Harris 	ndisk->disk = disk;
351bb0ec6b3SJim Harris 	ndisk->cur_depth = 0;
35258d0b8f3SJim Harris 	ndisk->ordered_in_flight = 0;
353bb0ec6b3SJim Harris 
354bb0ec6b3SJim Harris 	mtx_init(&ndisk->bioqlock, "NVD bioq lock", NULL, MTX_DEF);
355bb0ec6b3SJim Harris 	bioq_init(&ndisk->bioq);
356bb0ec6b3SJim Harris 
357bb0ec6b3SJim Harris 	TASK_INIT(&ndisk->bioqtask, 0, nvd_bioq_process, ndisk);
358bb0ec6b3SJim Harris 	ndisk->tq = taskqueue_create("nvd_taskq", M_WAITOK,
359bb0ec6b3SJim Harris 	    taskqueue_thread_enqueue, &ndisk->tq);
360bb0ec6b3SJim Harris 	taskqueue_start_threads(&ndisk->tq, 1, PI_DISK, "nvd taskq");
361bb0ec6b3SJim Harris 
362ec84ecbbSJim Harris 	TAILQ_INSERT_TAIL(&disk_head, ndisk, global_tailq);
363ec84ecbbSJim Harris 	TAILQ_INSERT_TAIL(&ctrlr->disk_head, ndisk, ctrlr_tailq);
364038a5ee4SJim Harris 
365c3e9dd89SJim Harris 	disk_create(disk, DISK_VERSION);
366c3e9dd89SJim Harris 
36738441bd9SJim Harris 	printf(NVD_STR"%u: <%s> NVMe namespace\n", disk->d_unit, descr);
36838441bd9SJim Harris 	printf(NVD_STR"%u: %juMB (%ju %u byte sectors)\n", disk->d_unit,
36938441bd9SJim Harris 		(uintmax_t)disk->d_mediasize / (1024*1024),
37038441bd9SJim Harris 		(uintmax_t)disk->d_mediasize / disk->d_sectorsize,
37138441bd9SJim Harris 		disk->d_sectorsize);
37238441bd9SJim Harris 
373038a5ee4SJim Harris 	return (NULL);
374bb0ec6b3SJim Harris }
375bb0ec6b3SJim Harris 
376bb0ec6b3SJim Harris static void
377bb0ec6b3SJim Harris destroy_geom_disk(struct nvd_disk *ndisk)
378bb0ec6b3SJim Harris {
379bb0ec6b3SJim Harris 	struct bio	*bp;
38038441bd9SJim Harris 	struct disk	*disk;
38138441bd9SJim Harris 	uint32_t	unit;
38238441bd9SJim Harris 	int		cnt = 0;
383bb0ec6b3SJim Harris 
38438441bd9SJim Harris 	disk = ndisk->disk;
38538441bd9SJim Harris 	unit = disk->d_unit;
386bb0ec6b3SJim Harris 	taskqueue_free(ndisk->tq);
38738441bd9SJim Harris 
388bb0ec6b3SJim Harris 	disk_destroy(ndisk->disk);
389bb0ec6b3SJim Harris 
390bb0ec6b3SJim Harris 	mtx_lock(&ndisk->bioqlock);
391bb0ec6b3SJim Harris 	for (;;) {
392bb0ec6b3SJim Harris 		bp = bioq_takefirst(&ndisk->bioq);
393bb0ec6b3SJim Harris 		if (bp == NULL)
394bb0ec6b3SJim Harris 			break;
395bb0ec6b3SJim Harris 		bp->bio_error = EIO;
396bb0ec6b3SJim Harris 		bp->bio_flags |= BIO_ERROR;
397bb0ec6b3SJim Harris 		bp->bio_resid = bp->bio_bcount;
39838441bd9SJim Harris 		cnt++;
399bb0ec6b3SJim Harris 		biodone(bp);
400bb0ec6b3SJim Harris 	}
40138441bd9SJim Harris 
40238441bd9SJim Harris 	printf(NVD_STR"%u: lost device - %d outstanding\n", unit, cnt);
40338441bd9SJim Harris 	printf(NVD_STR"%u: removing device entry\n", unit);
40438441bd9SJim Harris 
405bb0ec6b3SJim Harris 	mtx_unlock(&ndisk->bioqlock);
406bb0ec6b3SJim Harris 
407bb0ec6b3SJim Harris 	mtx_destroy(&ndisk->bioqlock);
408bb0ec6b3SJim Harris }
409232e2edbSJim Harris 
410232e2edbSJim Harris static void
411232e2edbSJim Harris nvd_controller_fail(void *ctrlr_arg)
412232e2edbSJim Harris {
413232e2edbSJim Harris 	struct nvd_controller	*ctrlr = ctrlr_arg;
414232e2edbSJim Harris 	struct nvd_disk		*disk;
415232e2edbSJim Harris 
416232e2edbSJim Harris 	while (!TAILQ_EMPTY(&ctrlr->disk_head)) {
417232e2edbSJim Harris 		disk = TAILQ_FIRST(&ctrlr->disk_head);
418232e2edbSJim Harris 		TAILQ_REMOVE(&disk_head, disk, global_tailq);
419232e2edbSJim Harris 		TAILQ_REMOVE(&ctrlr->disk_head, disk, ctrlr_tailq);
420232e2edbSJim Harris 		destroy_geom_disk(disk);
421232e2edbSJim Harris 		free(disk, M_NVD);
422232e2edbSJim Harris 	}
423232e2edbSJim Harris 
424232e2edbSJim Harris 	TAILQ_REMOVE(&ctrlr_head, ctrlr, tailq);
425232e2edbSJim Harris 	free(ctrlr, M_NVD);
426232e2edbSJim Harris }
427232e2edbSJim Harris 
428