xref: /freebsd/sys/dev/nvdimm/nvdimm.c (revision 86dc8398c9ca2283c5d6984992b7a585257b5adb)
1 /*-
2  * Copyright (c) 2017 The FreeBSD Foundation
3  * All rights reserved.
4  * Copyright (c) 2018, 2019 Intel Corporation
5  *
6  * This software was developed by Konstantin Belousov <kib@FreeBSD.org>
7  * under sponsorship from the FreeBSD Foundation.
8  *
9  * Redistribution and use in source and binary forms, with or without
10  * modification, are permitted provided that the following conditions
11  * are met:
12  * 1. Redistributions of source code must retain the above copyright
13  *    notice, this list of conditions and the following disclaimer.
14  * 2. Redistributions in binary form must reproduce the above copyright
15  *    notice, this list of conditions and the following disclaimer in the
16  *    documentation and/or other materials provided with the distribution.
17  *
18  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
19  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
20  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
21  * ARE DISCLAIMED. IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
22  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
23  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
24  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
25  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
26  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
27  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
28  * SUCH DAMAGE.
29  */
30 
31 #include <sys/cdefs.h>
32 __FBSDID("$FreeBSD$");
33 
34 #include "opt_acpi.h"
35 #include "opt_ddb.h"
36 
37 #include <sys/param.h>
38 #include <sys/systm.h>
39 #include <sys/bio.h>
40 #include <sys/bitstring.h>
41 #include <sys/bus.h>
42 #include <sys/kernel.h>
43 #include <sys/lock.h>
44 #include <sys/malloc.h>
45 #include <sys/module.h>
46 #include <sys/sbuf.h>
47 #include <sys/sysctl.h>
48 #include <sys/uuid.h>
49 
50 #include <contrib/dev/acpica/include/acpi.h>
51 #include <contrib/dev/acpica/include/accommon.h>
52 #include <contrib/dev/acpica/include/acuuid.h>
53 #include <dev/acpica/acpivar.h>
54 
55 #include <dev/nvdimm/nvdimm_var.h>
56 
/* ACPICA component and module name used for this file. */
#define _COMPONENT	ACPI_OEM
ACPI_MODULE_NAME("NVDIMM")

/*
 * UUID passed to acpi_EvaluateDSM() for the label-area queries in this file.
 */
static struct uuid intel_nvdimm_dsm_uuid =
    {0x4309AC30,0x0D11,0x11E4,0x91,0x91,{0x08,0x00,0x20,0x0C,0x9A,0x66}};
/* _DSM revision passed with every call. */
#define INTEL_NVDIMM_DSM_REV 1
/* _DSM function index used by read_label_area_size(). */
#define INTEL_NVDIMM_DSM_GET_LABEL_SIZE 4
/* _DSM function index used by read_label_area(). */
#define INTEL_NVDIMM_DSM_GET_LABEL_DATA 5

/* Device class handed to DRIVER_MODULE() at the bottom of this file. */
static devclass_t nvdimm_devclass;
/* malloc(9) type used for the allocations made by this driver. */
MALLOC_DEFINE(M_NVDIMM, "nvdimm", "NVDIMM driver memory");
68 
69 static int
70 read_label_area_size(struct nvdimm_dev *nv)
71 {
72 	ACPI_OBJECT *result_buffer;
73 	ACPI_HANDLE handle;
74 	ACPI_STATUS status;
75 	ACPI_BUFFER result;
76 	uint32_t *out;
77 	int error;
78 
79 	handle = nvdimm_root_get_acpi_handle(nv->nv_dev);
80 	if (handle == NULL)
81 		return (ENODEV);
82 	result.Length = ACPI_ALLOCATE_BUFFER;
83 	result.Pointer = NULL;
84 	status = acpi_EvaluateDSM(handle, (uint8_t *)&intel_nvdimm_dsm_uuid,
85 	    INTEL_NVDIMM_DSM_REV, INTEL_NVDIMM_DSM_GET_LABEL_SIZE, NULL,
86 	    &result);
87 	error = ENXIO;
88 	if (ACPI_SUCCESS(status) && result.Pointer != NULL &&
89 	    result.Length >= sizeof(ACPI_OBJECT)) {
90 		result_buffer = result.Pointer;
91 		if (result_buffer->Type == ACPI_TYPE_BUFFER &&
92 		    result_buffer->Buffer.Length >= 12) {
93 			out = (uint32_t *)result_buffer->Buffer.Pointer;
94 			nv->label_area_size = out[1];
95 			nv->max_label_xfer = out[2];
96 			error = 0;
97 		}
98 	}
99 	if (result.Pointer != NULL)
100 		AcpiOsFree(result.Pointer);
101 	return (error);
102 }
103 
104 static int
105 read_label_area(struct nvdimm_dev *nv, uint8_t *dest, off_t offset,
106     off_t length)
107 {
108 	ACPI_BUFFER result;
109 	ACPI_HANDLE handle;
110 	ACPI_OBJECT params_pkg, params_buf, *result_buf;
111 	ACPI_STATUS status;
112 	uint32_t params[2];
113 	off_t to_read;
114 	int error;
115 
116 	error = 0;
117 	handle = nvdimm_root_get_acpi_handle(nv->nv_dev);
118 	if (offset < 0 || length <= 0 ||
119 	    offset + length > nv->label_area_size ||
120 	    handle == NULL)
121 		return (ENODEV);
122 	params_pkg.Type = ACPI_TYPE_PACKAGE;
123 	params_pkg.Package.Count = 1;
124 	params_pkg.Package.Elements = &params_buf;
125 	params_buf.Type = ACPI_TYPE_BUFFER;
126 	params_buf.Buffer.Length = sizeof(params);
127 	params_buf.Buffer.Pointer = (UINT8 *)params;
128 	while (length > 0) {
129 		to_read = MIN(length, nv->max_label_xfer);
130 		params[0] = offset;
131 		params[1] = to_read;
132 		result.Length = ACPI_ALLOCATE_BUFFER;
133 		result.Pointer = NULL;
134 		status = acpi_EvaluateDSM(handle,
135 		    (uint8_t *)&intel_nvdimm_dsm_uuid, INTEL_NVDIMM_DSM_REV,
136 		    INTEL_NVDIMM_DSM_GET_LABEL_DATA, &params_pkg, &result);
137 		if (ACPI_FAILURE(status) ||
138 		    result.Length < sizeof(ACPI_OBJECT) ||
139 		    result.Pointer == NULL) {
140 			error = ENXIO;
141 			break;
142 		}
143 		result_buf = (ACPI_OBJECT *)result.Pointer;
144 		if (result_buf->Type != ACPI_TYPE_BUFFER ||
145 		    result_buf->Buffer.Pointer == NULL ||
146 		    result_buf->Buffer.Length != 4 + to_read ||
147 		    ((uint16_t *)result_buf->Buffer.Pointer)[0] != 0) {
148 			error = ENXIO;
149 			break;
150 		}
151 		bcopy(result_buf->Buffer.Pointer + 4, dest, to_read);
152 		dest += to_read;
153 		offset += to_read;
154 		length -= to_read;
155 		if (result.Pointer != NULL) {
156 			AcpiOsFree(result.Pointer);
157 			result.Pointer = NULL;
158 		}
159 	}
160 	if (result.Pointer != NULL)
161 		AcpiOsFree(result.Pointer);
162 	return (error);
163 }
164 
/*
 * Compute a 64-bit Fletcher-style checksum over `data'.
 *
 * The input is consumed as host-order 32-bit words; any trailing bytes
 * beyond a multiple of four are ignored.  Two 32-bit accumulators are kept,
 * both wrapping on overflow: the running sum of the words and the running
 * sum of those sums.  The result carries the sum-of-sums in its upper 32
 * bits and the plain sum in its lower 32 bits.
 */
static uint64_t
fletcher64(const void *data, size_t length)
{
	const uint32_t *word, *end;
	uint32_t sum, sum_of_sums;

	word = (const uint32_t *)data;
	end = word + length / sizeof(uint32_t);
	sum = 0;
	sum_of_sums = 0;
	while (word != end) {
		sum += *word++;
		sum_of_sums += sum;
	}
	return (((uint64_t)sum_of_sums << 32) | sum);
}
182 
183 static bool
184 label_index_is_valid(struct nvdimm_label_index *index, uint32_t max_labels,
185     size_t size, size_t offset)
186 {
187 	uint64_t checksum;
188 
189 	index = (struct nvdimm_label_index *)((uint8_t *)index + size * offset);
190 	if (strcmp(index->signature, NVDIMM_INDEX_BLOCK_SIGNATURE) != 0)
191 		return false;
192 	checksum = index->checksum;
193 	index->checksum = 0;
194 	if (checksum != fletcher64(index, size) ||
195 	    index->this_offset != size * offset || index->this_size != size ||
196 	    index->other_offset != size * (offset == 0 ? 1 : 0) ||
197 	    index->seq == 0 || index->seq > 3 || index->slot_cnt > max_labels ||
198 	    index->label_size != 1)
199 		return false;
200 	return true;
201 }
202 
203 static int
204 read_label(struct nvdimm_dev *nv, int num)
205 {
206 	struct nvdimm_label_entry *entry, *i, *next;
207 	uint64_t checksum;
208 	off_t offset;
209 	int error;
210 
211 	offset = nv->label_index->label_offset +
212 	    num * (128 << nv->label_index->label_size);
213 	entry = malloc(sizeof(*entry), M_NVDIMM, M_WAITOK);
214 	error = read_label_area(nv, (uint8_t *)&entry->label, offset,
215 	    sizeof(struct nvdimm_label));
216 	if (error != 0) {
217 		free(entry, M_NVDIMM);
218 		return (error);
219 	}
220 	checksum = entry->label.checksum;
221 	entry->label.checksum = 0;
222 	if (checksum != fletcher64(&entry->label, sizeof(entry->label)) ||
223 	    entry->label.slot != num) {
224 		free(entry, M_NVDIMM);
225 		return (ENXIO);
226 	}
227 
228 	/* Insertion ordered by dimm_phys_addr */
229 	if (SLIST_EMPTY(&nv->labels) ||
230 	    entry->label.dimm_phys_addr <=
231 	    SLIST_FIRST(&nv->labels)->label.dimm_phys_addr) {
232 		SLIST_INSERT_HEAD(&nv->labels, entry, link);
233 		return (0);
234 	}
235 	SLIST_FOREACH_SAFE(i, &nv->labels, link, next) {
236 		if (next == NULL ||
237 		    entry->label.dimm_phys_addr <= next->label.dimm_phys_addr) {
238 			SLIST_INSERT_AFTER(i, entry, link);
239 			return (0);
240 		}
241 	}
242 	__assert_unreachable();
243 }
244 
245 static int
246 read_labels(struct nvdimm_dev *nv)
247 {
248 	struct nvdimm_label_index *indices, *index1;
249 	size_t index_size, num_labels;
250 	int error, n;
251 	bool index_0_valid, index_1_valid;
252 
253 	for (index_size = 256; ; index_size += 256) {
254 		num_labels = 8 * (index_size -
255 		    sizeof(struct nvdimm_label_index));
256 		if (index_size + num_labels * sizeof(struct nvdimm_label) >=
257 		    nv->label_area_size)
258 			break;
259 	}
260 	num_labels = (nv->label_area_size - index_size) /
261 	    sizeof(struct nvdimm_label);
262 	indices = malloc(2 * index_size, M_NVDIMM, M_WAITOK);
263 	index1 = (void *)((uint8_t *)indices + index_size);
264 	error = read_label_area(nv, (void *)indices, 0, 2 * index_size);
265 	if (error != 0) {
266 		free(indices, M_NVDIMM);
267 		return (error);
268 	}
269 	index_0_valid = label_index_is_valid(indices, num_labels, index_size,
270 	    0);
271 	index_1_valid = label_index_is_valid(indices, num_labels, index_size,
272 	    1);
273 	if (!index_0_valid && !index_1_valid) {
274 		free(indices, M_NVDIMM);
275 		return (ENXIO);
276 	}
277 	if (index_0_valid && index_1_valid) {
278 		if (((int)indices->seq - (int)index1->seq + 3) % 3 == 1) {
279 			/* index 0 was more recently updated */
280 			index_1_valid = false;
281 		} else {
282 			/*
283 			 * either index 1 was more recently updated,
284 			 * or the sequence numbers are equal, in which
285 			 * case the specification says the block with
286 			 * the higher offset is to be treated as valid
287 			 */
288 			index_0_valid = false;
289 		}
290 	}
291 	nv->label_index = malloc(index_size, M_NVDIMM, M_WAITOK);
292 	bcopy(index_0_valid ? indices : index1, nv->label_index, index_size);
293 	free(indices, M_NVDIMM);
294 	bit_ffc_at((bitstr_t *)nv->label_index->free, 0,
295 	    nv->label_index->slot_cnt, &n);
296 	while (n >= 0) {
297 		read_label(nv, n);
298 		bit_ffc_at((bitstr_t *)nv->label_index->free, n + 1,
299 		    nv->label_index->slot_cnt, &n);
300 	}
301 	return (0);
302 }
303 
304 static int
305 nvdimm_probe(device_t dev)
306 {
307 
308 	return (BUS_PROBE_NOWILDCARD);
309 }
310 
311 static int
312 nvdimm_attach(device_t dev)
313 {
314 	struct nvdimm_dev *nv;
315 	struct sysctl_ctx_list *ctx;
316 	struct sysctl_oid *oid;
317 	struct sysctl_oid_list *children;
318 	struct sbuf *sb;
319 	ACPI_TABLE_NFIT *nfitbl;
320 	ACPI_STATUS status;
321 	ACPI_NFIT_MEMORY_MAP **maps;
322 	int error, i, num_maps;
323 	uint16_t flags;
324 
325 	nv = device_get_softc(dev);
326 	ctx = device_get_sysctl_ctx(dev);
327 	oid = device_get_sysctl_tree(dev);
328 	children = SYSCTL_CHILDREN(oid);
329 	MPASS(nvdimm_root_get_acpi_handle(dev) != NULL);
330 	nv->nv_dev = dev;
331 	nv->nv_handle = nvdimm_root_get_device_handle(dev);
332 
333 	status = AcpiGetTable(ACPI_SIG_NFIT, 1, (ACPI_TABLE_HEADER **)&nfitbl);
334 	if (ACPI_FAILURE(status)) {
335 		if (bootverbose)
336 			device_printf(dev, "cannot get NFIT\n");
337 		return (ENXIO);
338 	}
339 	acpi_nfit_get_flush_addrs(nfitbl, nv->nv_handle, &nv->nv_flush_addr,
340 	    &nv->nv_flush_addr_cnt);
341 
342 	/*
343 	 * Each NVDIMM should have at least one memory map associated with it.
344 	 * If any of the maps have one of the error flags set, reflect that in
345 	 * the overall status.
346 	 */
347 	acpi_nfit_get_memory_maps_by_dimm(nfitbl, nv->nv_handle, &maps,
348 	    &num_maps);
349 	if (num_maps == 0) {
350 		free(nv->nv_flush_addr, M_NVDIMM);
351 		free(maps, M_NVDIMM);
352 		device_printf(dev, "cannot find memory map\n");
353 		return (ENXIO);
354 	}
355 	flags = 0;
356 	for (i = 0; i < num_maps; i++) {
357 		flags |= maps[i]->Flags;
358 	}
359 	free(maps, M_NVDIMM);
360 
361 	/* sbuf_new_auto(9) is M_WAITOK; no need to check for NULL. */
362 	sb = sbuf_new_auto();
363 	(void) sbuf_printf(sb, "0x%b", flags,
364 	    "\20"
365 	    "\001SAVE_FAILED"
366 	    "\002RESTORE_FAILED"
367 	    "\003FLUSH_FAILED"
368 	    "\004NOT_ARMED"
369 	    "\005HEALTH_OBSERVED"
370 	    "\006HEALTH_ENABLED"
371 	    "\007MAP_FAILED");
372 	error = sbuf_finish(sb);
373 	if (error != 0) {
374 		sbuf_delete(sb);
375 		free(nv->nv_flush_addr, M_NVDIMM);
376 		device_printf(dev, "cannot convert flags to string\n");
377 		return (error);
378 	}
379 	/* strdup(9) is M_WAITOK; no need to check for NULL. */
380 	nv->nv_flags_str = strdup(sbuf_data(sb), M_NVDIMM);
381 	sbuf_delete(sb);
382 	SYSCTL_ADD_STRING(ctx, children, OID_AUTO, "flags",
383 	    CTLFLAG_RD | CTLFLAG_MPSAFE, nv->nv_flags_str, 0,
384 	    "NVDIMM State Flags");
385 	/*
386 	 * Anything other than HEALTH_ENABLED indicates a fault condition of
387 	 * some kind, so log if that's seen.
388 	 */
389 	if ((flags & ~ACPI_NFIT_MEM_HEALTH_ENABLED) != 0)
390 		device_printf(dev, "flags: %s\n", nv->nv_flags_str);
391 
392 	AcpiPutTable(&nfitbl->Header);
393 	error = read_label_area_size(nv);
394 	if (error == 0) {
395 		/*
396 		 * Ignoring errors reading labels. Not all NVDIMMs
397 		 * support labels and namespaces.
398 		 */
399 		read_labels(nv);
400 	}
401 	return (0);
402 }
403 
404 static int
405 nvdimm_detach(device_t dev)
406 {
407 	struct nvdimm_dev *nv;
408 	struct nvdimm_label_entry *label, *next;
409 
410 	nv = device_get_softc(dev);
411 	free(nv->nv_flags_str, M_NVDIMM);
412 	free(nv->nv_flush_addr, M_NVDIMM);
413 	free(nv->label_index, M_NVDIMM);
414 	SLIST_FOREACH_SAFE(label, &nv->labels, link, next) {
415 		SLIST_REMOVE_HEAD(&nv->labels, link);
416 		free(label, M_NVDIMM);
417 	}
418 	return (0);
419 }
420 
421 static int
422 nvdimm_suspend(device_t dev)
423 {
424 
425 	return (0);
426 }
427 
428 static int
429 nvdimm_resume(device_t dev)
430 {
431 
432 	return (0);
433 }
434 
/*
 * Device method table: binds the probe, attach, detach, suspend and resume
 * entry points to the handlers defined in this file.
 */
static device_method_t nvdimm_methods[] = {
	DEVMETHOD(device_probe, nvdimm_probe),
	DEVMETHOD(device_attach, nvdimm_attach),
	DEVMETHOD(device_detach, nvdimm_detach),
	DEVMETHOD(device_suspend, nvdimm_suspend),
	DEVMETHOD(device_resume, nvdimm_resume),
	DEVMETHOD_END
};
443 
/*
 * Driver description: the driver name, its method table, and
 * sizeof(struct nvdimm_dev), the type the device methods obtain from
 * device_get_softc().
 */
static driver_t	nvdimm_driver = {
	"nvdimm",
	nvdimm_methods,
	sizeof(struct nvdimm_dev),
};
449 
450 struct nvdimm_dev *
451 nvdimm_find_by_handle(nfit_handle_t nv_handle)
452 {
453 	struct nvdimm_dev *res;
454 	device_t *dimms;
455 	int i, error, num_dimms;
456 
457 	res = NULL;
458 	error = devclass_get_devices(devclass_find(nvdimm_driver.name), &dimms,
459 	    &num_dimms);
460 	if (error != 0)
461 		return (NULL);
462 	for (i = 0; i < num_dimms; i++) {
463 		if (nvdimm_root_get_device_handle(dimms[i]) == nv_handle) {
464 			res = device_get_softc(dimms[i]);
465 			break;
466 		}
467 	}
468 	free(dimms, M_TEMP);
469 	return (res);
470 }
471 
/*
 * Register the nvdimm driver on the nvdimm_acpi_root bus with no module
 * event handler, and declare the module's dependency on acpi.
 */
DRIVER_MODULE(nvdimm, nvdimm_acpi_root, nvdimm_driver, nvdimm_devclass, NULL,
    NULL);
MODULE_DEPEND(nvdimm, acpi, 1, 1, 1);
475