xref: /freebsd/sys/dev/nvd/nvd.c (revision a498975ef70e00fa25af3cc0a6ad5560f9bcff85)
/*-
 * Copyright (C) 2012-2016 Intel Corporation
 * All rights reserved.
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions
 * are met:
 * 1. Redistributions of source code must retain the above copyright
 *    notice, this list of conditions and the following disclaimer.
 * 2. Redistributions in binary form must reproduce the above copyright
 *    notice, this list of conditions and the following disclaimer in the
 *    documentation and/or other materials provided with the distribution.
 *
 * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
 * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
 * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
 * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
 * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
 * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
 * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
 * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
 * SUCH DAMAGE.
 */

#include <sys/cdefs.h>
__FBSDID("$FreeBSD$");

#include <sys/param.h>
#include <sys/bio.h>
#include <sys/kernel.h>
#include <sys/malloc.h>
#include <sys/module.h>
#include <sys/sysctl.h>
#include <sys/systm.h>
#include <sys/taskqueue.h>

#include <geom/geom.h>
#include <geom/geom_disk.h>

#include <dev/nvme/nvme.h>

4438441bd9SJim Harris #define NVD_STR		"nvd"
4538441bd9SJim Harris 
46bb0ec6b3SJim Harris struct nvd_disk;
47bb0ec6b3SJim Harris 
48bb0ec6b3SJim Harris static disk_ioctl_t nvd_ioctl;
49bb0ec6b3SJim Harris static disk_strategy_t nvd_strategy;
50*a498975eSScott Long static dumper_t nvd_dump;
51bb0ec6b3SJim Harris 
5247ef4244SJim Harris static void nvd_done(void *arg, const struct nvme_completion *cpl);
5347ef4244SJim Harris 
54ec84ecbbSJim Harris static void *nvd_new_disk(struct nvme_namespace *ns, void *ctrlr);
55bb0ec6b3SJim Harris static void destroy_geom_disk(struct nvd_disk *ndisk);
56bb0ec6b3SJim Harris 
57ec84ecbbSJim Harris static void *nvd_new_controller(struct nvme_controller *ctrlr);
58232e2edbSJim Harris static void nvd_controller_fail(void *ctrlr);
59ec84ecbbSJim Harris 
60bb0ec6b3SJim Harris static int nvd_load(void);
61bb0ec6b3SJim Harris static void nvd_unload(void);
62bb0ec6b3SJim Harris 
63bb0ec6b3SJim Harris MALLOC_DEFINE(M_NVD, "nvd", "nvd(4) allocations");
64bb0ec6b3SJim Harris 
65bb0ec6b3SJim Harris struct nvme_consumer *consumer_handle;
66bb0ec6b3SJim Harris 
67bb0ec6b3SJim Harris struct nvd_disk {
68bb0ec6b3SJim Harris 
69bb0ec6b3SJim Harris 	struct bio_queue_head	bioq;
70bb0ec6b3SJim Harris 	struct task		bioqtask;
71bb0ec6b3SJim Harris 	struct mtx		bioqlock;
72bb0ec6b3SJim Harris 
73bb0ec6b3SJim Harris 	struct disk		*disk;
74bb0ec6b3SJim Harris 	struct taskqueue	*tq;
75bb0ec6b3SJim Harris 	struct nvme_namespace	*ns;
76bb0ec6b3SJim Harris 
77bb0ec6b3SJim Harris 	uint32_t		cur_depth;
7858d0b8f3SJim Harris 	uint32_t		ordered_in_flight;
79bb0ec6b3SJim Harris 
80ec84ecbbSJim Harris 	TAILQ_ENTRY(nvd_disk)	global_tailq;
81ec84ecbbSJim Harris 	TAILQ_ENTRY(nvd_disk)	ctrlr_tailq;
82bb0ec6b3SJim Harris };
83bb0ec6b3SJim Harris 
84ec84ecbbSJim Harris struct nvd_controller {
85ec84ecbbSJim Harris 
86ec84ecbbSJim Harris 	TAILQ_ENTRY(nvd_controller)	tailq;
87ec84ecbbSJim Harris 	TAILQ_HEAD(, nvd_disk)		disk_head;
88ec84ecbbSJim Harris };
89ec84ecbbSJim Harris 
90ec84ecbbSJim Harris static TAILQ_HEAD(, nvd_controller)	ctrlr_head;
91ec84ecbbSJim Harris static TAILQ_HEAD(disk_list, nvd_disk)	disk_head;
92bb0ec6b3SJim Harris 
93aeae6079SJim Harris static SYSCTL_NODE(_hw, OID_AUTO, nvd, CTLFLAG_RD, 0, "nvd driver parameters");
94aeae6079SJim Harris /*
95aeae6079SJim Harris  * The NVMe specification does not define a maximum or optimal delete size, so
96aeae6079SJim Harris  *  technically max delete size is min(full size of the namespace, 2^32 - 1
97aeae6079SJim Harris  *  LBAs).  A single delete for a multi-TB NVMe namespace though may take much
98aeae6079SJim Harris  *  longer to complete than the nvme(4) I/O timeout period.  So choose a sensible
99aeae6079SJim Harris  *  default here that is still suitably large to minimize the number of overall
100aeae6079SJim Harris  *  delete operations.
101aeae6079SJim Harris  */
102aeae6079SJim Harris static uint64_t nvd_delete_max = (1024 * 1024 * 1024);  /* 1GB */
103aeae6079SJim Harris SYSCTL_UQUAD(_hw_nvd, OID_AUTO, delete_max, CTLFLAG_RDTUN, &nvd_delete_max, 0,
104aeae6079SJim Harris 	     "nvd maximum BIO_DELETE size in bytes");
105aeae6079SJim Harris 
106bb0ec6b3SJim Harris static int nvd_modevent(module_t mod, int type, void *arg)
107bb0ec6b3SJim Harris {
108bb0ec6b3SJim Harris 	int error = 0;
109bb0ec6b3SJim Harris 
110bb0ec6b3SJim Harris 	switch (type) {
111bb0ec6b3SJim Harris 	case MOD_LOAD:
112bb0ec6b3SJim Harris 		error = nvd_load();
113bb0ec6b3SJim Harris 		break;
114bb0ec6b3SJim Harris 	case MOD_UNLOAD:
115bb0ec6b3SJim Harris 		nvd_unload();
116bb0ec6b3SJim Harris 		break;
117bb0ec6b3SJim Harris 	default:
118bb0ec6b3SJim Harris 		break;
119bb0ec6b3SJim Harris 	}
120bb0ec6b3SJim Harris 
121bb0ec6b3SJim Harris 	return (error);
122bb0ec6b3SJim Harris }
123bb0ec6b3SJim Harris 
124bb0ec6b3SJim Harris moduledata_t nvd_mod = {
12538441bd9SJim Harris 	NVD_STR,
126bb0ec6b3SJim Harris 	(modeventhand_t)nvd_modevent,
1279823d527SKevin Lo 	0
128bb0ec6b3SJim Harris };
129bb0ec6b3SJim Harris 
130bb0ec6b3SJim Harris DECLARE_MODULE(nvd, nvd_mod, SI_SUB_DRIVERS, SI_ORDER_ANY);
131bb0ec6b3SJim Harris MODULE_VERSION(nvd, 1);
132bb0ec6b3SJim Harris MODULE_DEPEND(nvd, nvme, 1, 1, 1);
133bb0ec6b3SJim Harris 
134bb0ec6b3SJim Harris static int
135bb0ec6b3SJim Harris nvd_load()
136bb0ec6b3SJim Harris {
137bb0ec6b3SJim Harris 
138ec84ecbbSJim Harris 	TAILQ_INIT(&ctrlr_head);
139ec84ecbbSJim Harris 	TAILQ_INIT(&disk_head);
140ec84ecbbSJim Harris 
141ec84ecbbSJim Harris 	consumer_handle = nvme_register_consumer(nvd_new_disk,
142232e2edbSJim Harris 	    nvd_new_controller, NULL, nvd_controller_fail);
143bb0ec6b3SJim Harris 
144bb0ec6b3SJim Harris 	return (consumer_handle != NULL ? 0 : -1);
145bb0ec6b3SJim Harris }
146bb0ec6b3SJim Harris 
147bb0ec6b3SJim Harris static void
148bb0ec6b3SJim Harris nvd_unload()
149bb0ec6b3SJim Harris {
150ec84ecbbSJim Harris 	struct nvd_controller	*ctrlr;
151ec84ecbbSJim Harris 	struct nvd_disk		*disk;
152bb0ec6b3SJim Harris 
153ec84ecbbSJim Harris 	while (!TAILQ_EMPTY(&ctrlr_head)) {
154ec84ecbbSJim Harris 		ctrlr = TAILQ_FIRST(&ctrlr_head);
155ec84ecbbSJim Harris 		TAILQ_REMOVE(&ctrlr_head, ctrlr, tailq);
156ec84ecbbSJim Harris 		free(ctrlr, M_NVD);
157ec84ecbbSJim Harris 	}
158ec84ecbbSJim Harris 
159ec84ecbbSJim Harris 	while (!TAILQ_EMPTY(&disk_head)) {
160ec84ecbbSJim Harris 		disk = TAILQ_FIRST(&disk_head);
161ec84ecbbSJim Harris 		TAILQ_REMOVE(&disk_head, disk, global_tailq);
162ec84ecbbSJim Harris 		destroy_geom_disk(disk);
163ec84ecbbSJim Harris 		free(disk, M_NVD);
164bb0ec6b3SJim Harris 	}
165bb0ec6b3SJim Harris 
166bb0ec6b3SJim Harris 	nvme_unregister_consumer(consumer_handle);
167bb0ec6b3SJim Harris }
168bb0ec6b3SJim Harris 
16947ef4244SJim Harris static int
17047ef4244SJim Harris nvd_bio_submit(struct nvd_disk *ndisk, struct bio *bp)
17147ef4244SJim Harris {
17247ef4244SJim Harris 	int err;
17347ef4244SJim Harris 
17447ef4244SJim Harris 	bp->bio_driver1 = NULL;
17547ef4244SJim Harris 	atomic_add_int(&ndisk->cur_depth, 1);
17647ef4244SJim Harris 	err = nvme_ns_bio_process(ndisk->ns, bp, nvd_done);
17747ef4244SJim Harris 	if (err) {
17847ef4244SJim Harris 		atomic_add_int(&ndisk->cur_depth, -1);
17958d0b8f3SJim Harris 		if (__predict_false(bp->bio_flags & BIO_ORDERED))
18058d0b8f3SJim Harris 			atomic_add_int(&ndisk->ordered_in_flight, -1);
18147ef4244SJim Harris 		bp->bio_error = err;
18247ef4244SJim Harris 		bp->bio_flags |= BIO_ERROR;
18347ef4244SJim Harris 		bp->bio_resid = bp->bio_bcount;
18447ef4244SJim Harris 		biodone(bp);
18547ef4244SJim Harris 		return (-1);
18647ef4244SJim Harris 	}
18747ef4244SJim Harris 
18847ef4244SJim Harris 	return (0);
18947ef4244SJim Harris }
19047ef4244SJim Harris 
191bb0ec6b3SJim Harris static void
192bb0ec6b3SJim Harris nvd_strategy(struct bio *bp)
193bb0ec6b3SJim Harris {
194bb0ec6b3SJim Harris 	struct nvd_disk *ndisk;
195bb0ec6b3SJim Harris 
196bb0ec6b3SJim Harris 	ndisk = (struct nvd_disk *)bp->bio_disk->d_drv1;
197bb0ec6b3SJim Harris 
19858d0b8f3SJim Harris 	if (__predict_false(bp->bio_flags & BIO_ORDERED))
19958d0b8f3SJim Harris 		atomic_add_int(&ndisk->ordered_in_flight, 1);
20058d0b8f3SJim Harris 
20158d0b8f3SJim Harris 	if (__predict_true(ndisk->ordered_in_flight == 0)) {
20258d0b8f3SJim Harris 		nvd_bio_submit(ndisk, bp);
20358d0b8f3SJim Harris 		return;
20458d0b8f3SJim Harris 	}
20558d0b8f3SJim Harris 
20658d0b8f3SJim Harris 	/*
20758d0b8f3SJim Harris 	 * There are ordered bios in flight, so we need to submit
20858d0b8f3SJim Harris 	 *  bios through the task queue to enforce ordering.
20958d0b8f3SJim Harris 	 */
210bb0ec6b3SJim Harris 	mtx_lock(&ndisk->bioqlock);
211bb0ec6b3SJim Harris 	bioq_insert_tail(&ndisk->bioq, bp);
212bb0ec6b3SJim Harris 	mtx_unlock(&ndisk->bioqlock);
213bb0ec6b3SJim Harris 	taskqueue_enqueue(ndisk->tq, &ndisk->bioqtask);
214bb0ec6b3SJim Harris }
215bb0ec6b3SJim Harris 
216bb0ec6b3SJim Harris static int
217bb0ec6b3SJim Harris nvd_ioctl(struct disk *ndisk, u_long cmd, void *data, int fflag,
218bb0ec6b3SJim Harris     struct thread *td)
219bb0ec6b3SJim Harris {
220bb0ec6b3SJim Harris 	int ret = 0;
221bb0ec6b3SJim Harris 
222bb0ec6b3SJim Harris 	switch (cmd) {
223bb0ec6b3SJim Harris 	default:
224bb0ec6b3SJim Harris 		ret = EIO;
225bb0ec6b3SJim Harris 	}
226bb0ec6b3SJim Harris 
227bb0ec6b3SJim Harris 	return (ret);
228bb0ec6b3SJim Harris }
229bb0ec6b3SJim Harris 
230*a498975eSScott Long static int
231*a498975eSScott Long nvd_dump(void *arg, void *virt, vm_offset_t phys, off_t offset, size_t len)
232*a498975eSScott Long {
233*a498975eSScott Long 	struct nvd_disk *ndisk;
234*a498975eSScott Long 	struct disk *dp;
235*a498975eSScott Long 	int error;
236*a498975eSScott Long 
237*a498975eSScott Long 	dp = arg;
238*a498975eSScott Long 	ndisk = dp->d_drv1;
239*a498975eSScott Long 
240*a498975eSScott Long 	if (len > 0) {
241*a498975eSScott Long 		if ((error = nvme_ns_dump(ndisk->ns, virt, offset, len)) != 0)
242*a498975eSScott Long 			return (error);
243*a498975eSScott Long 	} else {
244*a498975eSScott Long 		/* XXX sync to stable storage */
245*a498975eSScott Long 	}
246*a498975eSScott Long 
247*a498975eSScott Long 	return (0);
248*a498975eSScott Long }
249*a498975eSScott Long 
250bb0ec6b3SJim Harris static void
251cf81529cSJim Harris nvd_done(void *arg, const struct nvme_completion *cpl)
252bb0ec6b3SJim Harris {
253bb0ec6b3SJim Harris 	struct bio *bp;
254bb0ec6b3SJim Harris 	struct nvd_disk *ndisk;
255bb0ec6b3SJim Harris 
256bb0ec6b3SJim Harris 	bp = (struct bio *)arg;
257bb0ec6b3SJim Harris 
258bb0ec6b3SJim Harris 	ndisk = bp->bio_disk->d_drv1;
259bb0ec6b3SJim Harris 
2600f71ecf7SJim Harris 	atomic_add_int(&ndisk->cur_depth, -1);
26158d0b8f3SJim Harris 	if (__predict_false(bp->bio_flags & BIO_ORDERED))
26258d0b8f3SJim Harris 		atomic_add_int(&ndisk->ordered_in_flight, -1);
263bb0ec6b3SJim Harris 
264bb0ec6b3SJim Harris 	biodone(bp);
265bb0ec6b3SJim Harris }
266bb0ec6b3SJim Harris 
267bb0ec6b3SJim Harris static void
268bb0ec6b3SJim Harris nvd_bioq_process(void *arg, int pending)
269bb0ec6b3SJim Harris {
270bb0ec6b3SJim Harris 	struct nvd_disk *ndisk = arg;
271bb0ec6b3SJim Harris 	struct bio *bp;
272bb0ec6b3SJim Harris 
273bb0ec6b3SJim Harris 	for (;;) {
274bb0ec6b3SJim Harris 		mtx_lock(&ndisk->bioqlock);
275bb0ec6b3SJim Harris 		bp = bioq_takefirst(&ndisk->bioq);
276bb0ec6b3SJim Harris 		mtx_unlock(&ndisk->bioqlock);
277bb0ec6b3SJim Harris 		if (bp == NULL)
278bb0ec6b3SJim Harris 			break;
279bb0ec6b3SJim Harris 
28047ef4244SJim Harris 		if (nvd_bio_submit(ndisk, bp) != 0) {
28126ca317aSJim Harris 			continue;
282bb0ec6b3SJim Harris 		}
283bb0ec6b3SJim Harris 
284bb0ec6b3SJim Harris #ifdef BIO_ORDERED
285bb0ec6b3SJim Harris 		/*
286bb0ec6b3SJim Harris 		 * BIO_ORDERED flag dictates that the bio with BIO_ORDERED
287bb0ec6b3SJim Harris 		 *  flag set must be completed before proceeding with
288bb0ec6b3SJim Harris 		 *  additional bios.
289bb0ec6b3SJim Harris 		 */
290bb0ec6b3SJim Harris 		if (bp->bio_flags & BIO_ORDERED) {
291bb0ec6b3SJim Harris 			while (ndisk->cur_depth > 0) {
292bb0ec6b3SJim Harris 				pause("nvd flush", 1);
293bb0ec6b3SJim Harris 			}
294bb0ec6b3SJim Harris 		}
295bb0ec6b3SJim Harris #endif
296bb0ec6b3SJim Harris 	}
297bb0ec6b3SJim Harris }
298bb0ec6b3SJim Harris 
299038a5ee4SJim Harris static void *
300ec84ecbbSJim Harris nvd_new_controller(struct nvme_controller *ctrlr)
301ec84ecbbSJim Harris {
302ec84ecbbSJim Harris 	struct nvd_controller	*nvd_ctrlr;
303ec84ecbbSJim Harris 
304ec84ecbbSJim Harris 	nvd_ctrlr = malloc(sizeof(struct nvd_controller), M_NVD,
305237d2019SJim Harris 	    M_ZERO | M_WAITOK);
306ec84ecbbSJim Harris 
307ec84ecbbSJim Harris 	TAILQ_INIT(&nvd_ctrlr->disk_head);
308ec84ecbbSJim Harris 	TAILQ_INSERT_TAIL(&ctrlr_head, nvd_ctrlr, tailq);
309ec84ecbbSJim Harris 
310ec84ecbbSJim Harris 	return (nvd_ctrlr);
311ec84ecbbSJim Harris }
312ec84ecbbSJim Harris 
313ec84ecbbSJim Harris static void *
314ec84ecbbSJim Harris nvd_new_disk(struct nvme_namespace *ns, void *ctrlr_arg)
315bb0ec6b3SJim Harris {
31638441bd9SJim Harris 	uint8_t			descr[NVME_MODEL_NUMBER_LENGTH+1];
317bb0ec6b3SJim Harris 	struct nvd_disk		*ndisk;
318bb0ec6b3SJim Harris 	struct disk		*disk;
319ec84ecbbSJim Harris 	struct nvd_controller	*ctrlr = ctrlr_arg;
320bb0ec6b3SJim Harris 
321237d2019SJim Harris 	ndisk = malloc(sizeof(struct nvd_disk), M_NVD, M_ZERO | M_WAITOK);
322bb0ec6b3SJim Harris 
323bb0ec6b3SJim Harris 	disk = disk_alloc();
324bb0ec6b3SJim Harris 	disk->d_strategy = nvd_strategy;
325bb0ec6b3SJim Harris 	disk->d_ioctl = nvd_ioctl;
326*a498975eSScott Long 	disk->d_dump = nvd_dump;
32738441bd9SJim Harris 	disk->d_name = NVD_STR;
328bb0ec6b3SJim Harris 	disk->d_drv1 = ndisk;
329bb0ec6b3SJim Harris 
330bb0ec6b3SJim Harris 	disk->d_maxsize = nvme_ns_get_max_io_xfer_size(ns);
331bb0ec6b3SJim Harris 	disk->d_sectorsize = nvme_ns_get_sector_size(ns);
332bb0ec6b3SJim Harris 	disk->d_mediasize = (off_t)nvme_ns_get_size(ns);
33370fb74bdSJim Harris 	disk->d_delmaxsize = (off_t)nvme_ns_get_size(ns);
334aeae6079SJim Harris 	if (disk->d_delmaxsize > nvd_delete_max)
335aeae6079SJim Harris 		disk->d_delmaxsize = nvd_delete_max;
336ee7f4d81SAlexander Motin 	disk->d_stripesize = nvme_ns_get_stripesize(ns);
337bb0ec6b3SJim Harris 
338ec84ecbbSJim Harris 	if (TAILQ_EMPTY(&disk_head))
339bb0ec6b3SJim Harris 		disk->d_unit = 0;
340bb0ec6b3SJim Harris 	else
341ec84ecbbSJim Harris 		disk->d_unit =
342ec84ecbbSJim Harris 		    TAILQ_LAST(&disk_head, disk_list)->disk->d_unit + 1;
343bb0ec6b3SJim Harris 
344454f163bSJim Harris 	disk->d_flags = DISKFLAG_DIRECT_COMPLETION;
345bb0ec6b3SJim Harris 
346bb0ec6b3SJim Harris 	if (nvme_ns_get_flags(ns) & NVME_NS_DEALLOCATE_SUPPORTED)
347bb0ec6b3SJim Harris 		disk->d_flags |= DISKFLAG_CANDELETE;
348bb0ec6b3SJim Harris 
349bb0ec6b3SJim Harris 	if (nvme_ns_get_flags(ns) & NVME_NS_FLUSH_SUPPORTED)
350bb0ec6b3SJim Harris 		disk->d_flags |= DISKFLAG_CANFLUSHCACHE;
351bb0ec6b3SJim Harris 
3525fdf9c3cSJim Harris /* ifdef used here to ease porting to stable branches at a later point. */
3535fdf9c3cSJim Harris #ifdef DISKFLAG_UNMAPPED_BIO
3545fdf9c3cSJim Harris 	disk->d_flags |= DISKFLAG_UNMAPPED_BIO;
3555fdf9c3cSJim Harris #endif
3565fdf9c3cSJim Harris 
357e8f25c62SJim Harris 	/*
358e8f25c62SJim Harris 	 * d_ident and d_descr are both far bigger than the length of either
359e8f25c62SJim Harris 	 *  the serial or model number strings.
360e8f25c62SJim Harris 	 */
36138441bd9SJim Harris 	nvme_strvis(disk->d_ident, nvme_ns_get_serial_number(ns),
36238441bd9SJim Harris 	    sizeof(disk->d_ident), NVME_SERIAL_NUMBER_LENGTH);
36338441bd9SJim Harris 
36438441bd9SJim Harris 	nvme_strvis(descr, nvme_ns_get_model_number(ns), sizeof(descr),
36538441bd9SJim Harris 	    NVME_MODEL_NUMBER_LENGTH);
366bb0ec6b3SJim Harris 
367bb0ec6b3SJim Harris #if __FreeBSD_version >= 900034
36838441bd9SJim Harris 	strlcpy(disk->d_descr, descr, sizeof(descr));
369bb0ec6b3SJim Harris #endif
370bb0ec6b3SJim Harris 
371bb0ec6b3SJim Harris 	ndisk->ns = ns;
372bb0ec6b3SJim Harris 	ndisk->disk = disk;
373bb0ec6b3SJim Harris 	ndisk->cur_depth = 0;
37458d0b8f3SJim Harris 	ndisk->ordered_in_flight = 0;
375bb0ec6b3SJim Harris 
376bb0ec6b3SJim Harris 	mtx_init(&ndisk->bioqlock, "NVD bioq lock", NULL, MTX_DEF);
377bb0ec6b3SJim Harris 	bioq_init(&ndisk->bioq);
378bb0ec6b3SJim Harris 
379bb0ec6b3SJim Harris 	TASK_INIT(&ndisk->bioqtask, 0, nvd_bioq_process, ndisk);
380bb0ec6b3SJim Harris 	ndisk->tq = taskqueue_create("nvd_taskq", M_WAITOK,
381bb0ec6b3SJim Harris 	    taskqueue_thread_enqueue, &ndisk->tq);
382bb0ec6b3SJim Harris 	taskqueue_start_threads(&ndisk->tq, 1, PI_DISK, "nvd taskq");
383bb0ec6b3SJim Harris 
384ec84ecbbSJim Harris 	TAILQ_INSERT_TAIL(&disk_head, ndisk, global_tailq);
385ec84ecbbSJim Harris 	TAILQ_INSERT_TAIL(&ctrlr->disk_head, ndisk, ctrlr_tailq);
386038a5ee4SJim Harris 
387c3e9dd89SJim Harris 	disk_create(disk, DISK_VERSION);
388c3e9dd89SJim Harris 
38938441bd9SJim Harris 	printf(NVD_STR"%u: <%s> NVMe namespace\n", disk->d_unit, descr);
39038441bd9SJim Harris 	printf(NVD_STR"%u: %juMB (%ju %u byte sectors)\n", disk->d_unit,
39138441bd9SJim Harris 		(uintmax_t)disk->d_mediasize / (1024*1024),
39238441bd9SJim Harris 		(uintmax_t)disk->d_mediasize / disk->d_sectorsize,
39338441bd9SJim Harris 		disk->d_sectorsize);
39438441bd9SJim Harris 
395038a5ee4SJim Harris 	return (NULL);
396bb0ec6b3SJim Harris }
397bb0ec6b3SJim Harris 
398bb0ec6b3SJim Harris static void
399bb0ec6b3SJim Harris destroy_geom_disk(struct nvd_disk *ndisk)
400bb0ec6b3SJim Harris {
401bb0ec6b3SJim Harris 	struct bio	*bp;
40238441bd9SJim Harris 	struct disk	*disk;
40338441bd9SJim Harris 	uint32_t	unit;
40438441bd9SJim Harris 	int		cnt = 0;
405bb0ec6b3SJim Harris 
40638441bd9SJim Harris 	disk = ndisk->disk;
40738441bd9SJim Harris 	unit = disk->d_unit;
408bb0ec6b3SJim Harris 	taskqueue_free(ndisk->tq);
40938441bd9SJim Harris 
410bb0ec6b3SJim Harris 	disk_destroy(ndisk->disk);
411bb0ec6b3SJim Harris 
412bb0ec6b3SJim Harris 	mtx_lock(&ndisk->bioqlock);
413bb0ec6b3SJim Harris 	for (;;) {
414bb0ec6b3SJim Harris 		bp = bioq_takefirst(&ndisk->bioq);
415bb0ec6b3SJim Harris 		if (bp == NULL)
416bb0ec6b3SJim Harris 			break;
417bb0ec6b3SJim Harris 		bp->bio_error = EIO;
418bb0ec6b3SJim Harris 		bp->bio_flags |= BIO_ERROR;
419bb0ec6b3SJim Harris 		bp->bio_resid = bp->bio_bcount;
42038441bd9SJim Harris 		cnt++;
421bb0ec6b3SJim Harris 		biodone(bp);
422bb0ec6b3SJim Harris 	}
42338441bd9SJim Harris 
42438441bd9SJim Harris 	printf(NVD_STR"%u: lost device - %d outstanding\n", unit, cnt);
42538441bd9SJim Harris 	printf(NVD_STR"%u: removing device entry\n", unit);
42638441bd9SJim Harris 
427bb0ec6b3SJim Harris 	mtx_unlock(&ndisk->bioqlock);
428bb0ec6b3SJim Harris 
429bb0ec6b3SJim Harris 	mtx_destroy(&ndisk->bioqlock);
430bb0ec6b3SJim Harris }
431232e2edbSJim Harris 
432232e2edbSJim Harris static void
433232e2edbSJim Harris nvd_controller_fail(void *ctrlr_arg)
434232e2edbSJim Harris {
435232e2edbSJim Harris 	struct nvd_controller	*ctrlr = ctrlr_arg;
436232e2edbSJim Harris 	struct nvd_disk		*disk;
437232e2edbSJim Harris 
438232e2edbSJim Harris 	while (!TAILQ_EMPTY(&ctrlr->disk_head)) {
439232e2edbSJim Harris 		disk = TAILQ_FIRST(&ctrlr->disk_head);
440232e2edbSJim Harris 		TAILQ_REMOVE(&disk_head, disk, global_tailq);
441232e2edbSJim Harris 		TAILQ_REMOVE(&ctrlr->disk_head, disk, ctrlr_tailq);
442232e2edbSJim Harris 		destroy_geom_disk(disk);
443232e2edbSJim Harris 		free(disk, M_NVD);
444232e2edbSJim Harris 	}
445232e2edbSJim Harris 
446232e2edbSJim Harris 	TAILQ_REMOVE(&ctrlr_head, ctrlr, tailq);
447232e2edbSJim Harris 	free(ctrlr, M_NVD);
448232e2edbSJim Harris }
449232e2edbSJim Harris 
450