xref: /freebsd/usr.bin/mkimg/image.c (revision b2d48be1bc7df45ddd13b143a160d0acb5a383c5)
1 /*-
2  * Copyright (c) 2014 Juniper Networks, Inc.
3  * All rights reserved.
4  *
5  * Redistribution and use in source and binary forms, with or without
6  * modification, are permitted provided that the following conditions
7  * are met:
8  * 1. Redistributions of source code must retain the above copyright
9  *    notice, this list of conditions and the following disclaimer.
10  * 2. Redistributions in binary form must reproduce the above copyright
11  *    notice, this list of conditions and the following disclaimer in the
12  *    documentation and/or other materials provided with the distribution.
13  *
14  * THIS SOFTWARE IS PROVIDED BY THE AUTHOR AND CONTRIBUTORS ``AS IS'' AND
15  * ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
16  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE
17  * ARE DISCLAIMED.  IN NO EVENT SHALL THE AUTHOR OR CONTRIBUTORS BE LIABLE
18  * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL
19  * DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS
20  * OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION)
21  * HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
22  * LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY
23  * OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
24  * SUCH DAMAGE.
25  */
26 
27 #include <sys/cdefs.h>
28 __FBSDID("$FreeBSD$");
29 
30 #include <sys/mman.h>
31 #include <sys/queue.h>
32 #include <sys/stat.h>
33 #include <sys/types.h>
34 #include <assert.h>
35 #include <errno.h>
36 #include <limits.h>
37 #include <paths.h>
38 #include <stdint.h>
39 #include <stdio.h>
40 #include <stdlib.h>
41 #include <string.h>
42 #include <unistd.h>
43 
44 #include "image.h"
45 #include "mkimg.h"
46 
47 struct chunk {
48 	STAILQ_ENTRY(chunk) ch_list;
49 	size_t	ch_size;		/* Size of chunk in bytes. */
50 	lba_t	ch_block;		/* Block address in image. */
51 	union {
52 		struct {
53 			off_t	ofs;	/* Offset in backing file. */
54 			int	fd;	/* FD of backing file. */
55 		} file;
56 		struct {
57 			void	*ptr;	/* Pointer to data in memory */
58 		} mem;
59 	} ch_u;
60 	u_int	ch_type;
61 #define	CH_TYPE_ZEROES		0	/* Chunk is a gap (no data). */
62 #define	CH_TYPE_FILE		1	/* File-backed chunk. */
63 #define	CH_TYPE_MEMORY		2	/* Memory-backed chunk */
64 };
65 
66 static STAILQ_HEAD(chunk_head, chunk) image_chunks;
67 static u_int image_nchunks;
68 
69 static char image_swap_file[PATH_MAX];
70 static int image_swap_fd = -1;
71 static u_int image_swap_pgsz;
72 static off_t image_swap_size;
73 
74 static lba_t image_size;
75 
76 static int
77 is_empty_sector(void *buf)
78 {
79 	uint64_t *p = buf;
80 	size_t n, max;
81 
82 	assert(((uintptr_t)p & 3) == 0);
83 
84 	max = secsz / sizeof(uint64_t);
85 	for (n = 0; n < max; n++) {
86 		if (p[n] != 0UL)
87 			return (0);
88 	}
89 	return (1);
90 }
91 
92 /*
93  * Swap file handlng.
94  */
95 
96 static off_t
97 image_swap_alloc(size_t size)
98 {
99 	off_t ofs;
100 	size_t unit;
101 
102 	unit = (secsz > image_swap_pgsz) ? secsz : image_swap_pgsz;
103 	assert((unit & (unit - 1)) == 0);
104 
105 	size = (size + unit - 1) & ~(unit - 1);
106 
107 	ofs = image_swap_size;
108 	image_swap_size += size;
109 	if (ftruncate(image_swap_fd, image_swap_size) == -1) {
110 		image_swap_size = ofs;
111 		ofs = -1LL;
112 	}
113 	return (ofs);
114 }
115 
116 /*
117  * Image chunk handling.
118  */
119 
120 static struct chunk *
121 image_chunk_find(lba_t blk)
122 {
123 	static struct chunk *last = NULL;
124 	struct chunk *ch;
125 
126 	ch = (last != NULL && last->ch_block <= blk)
127 	    ? last : STAILQ_FIRST(&image_chunks);
128 	while (ch != NULL) {
129 		if (ch->ch_block <= blk &&
130 		    (lba_t)(ch->ch_block + (ch->ch_size / secsz)) > blk) {
131 			last = ch;
132 			break;
133 		}
134 		ch = STAILQ_NEXT(ch, ch_list);
135 	}
136 	return (ch);
137 }
138 
139 static size_t
140 image_chunk_grow(struct chunk *ch, size_t sz)
141 {
142 	size_t dsz, newsz;
143 
144 	newsz = ch->ch_size + sz;
145 	if (newsz > ch->ch_size) {
146 		ch->ch_size = newsz;
147 		return (0);
148 	}
149 	/* We would overflow -- create new chunk for remainder. */
150 	dsz = SIZE_MAX - ch->ch_size;
151 	assert(dsz < sz);
152 	ch->ch_size = SIZE_MAX;
153 	return (sz - dsz);
154 }
155 
156 static struct chunk *
157 image_chunk_memory(struct chunk *ch, lba_t blk)
158 {
159 	struct chunk *new;
160 	void *ptr;
161 
162 	ptr = calloc(1, secsz);
163 	if (ptr == NULL)
164 		return (NULL);
165 
166 	if (ch->ch_block < blk) {
167 		new = malloc(sizeof(*new));
168 		if (new == NULL) {
169 			free(ptr);
170 			return (NULL);
171 		}
172 		memcpy(new, ch, sizeof(*new));
173 		ch->ch_size = (blk - ch->ch_block) * secsz;
174 		new->ch_block = blk;
175 		new->ch_size -= ch->ch_size;
176 		STAILQ_INSERT_AFTER(&image_chunks, ch, new, ch_list);
177 		image_nchunks++;
178 		ch = new;
179 	}
180 
181 	if (ch->ch_size > secsz) {
182 		new = malloc(sizeof(*new));
183 		if (new == NULL) {
184 			free(ptr);
185 			return (NULL);
186 		}
187 		memcpy(new, ch, sizeof(*new));
188 		ch->ch_size = secsz;
189 		new->ch_block++;
190 		new->ch_size -= secsz;
191 		STAILQ_INSERT_AFTER(&image_chunks, ch, new, ch_list);
192 		image_nchunks++;
193 	}
194 
195 	ch->ch_type = CH_TYPE_MEMORY;
196 	ch->ch_u.mem.ptr = ptr;
197 	return (ch);
198 }
199 
200 static int
201 image_chunk_skipto(lba_t to)
202 {
203 	struct chunk *ch;
204 	lba_t from;
205 	size_t sz;
206 
207 	ch = STAILQ_LAST(&image_chunks, chunk, ch_list);
208 	from = (ch != NULL) ? ch->ch_block + (ch->ch_size / secsz) : 0LL;
209 
210 	assert(from <= to);
211 
212 	/* Nothing to do? */
213 	if (from == to)
214 		return (0);
215 	/* Avoid bugs due to overflows. */
216 	if ((uintmax_t)(to - from) > (uintmax_t)(SIZE_MAX / secsz))
217 		return (EFBIG);
218 	sz = (to - from) * secsz;
219 	if (ch != NULL && ch->ch_type == CH_TYPE_ZEROES) {
220 		sz = image_chunk_grow(ch, sz);
221 		if (sz == 0)
222 			return (0);
223 		from = ch->ch_block + (ch->ch_size / secsz);
224 	}
225 	ch = malloc(sizeof(*ch));
226 	if (ch == NULL)
227 		return (ENOMEM);
228 	memset(ch, 0, sizeof(*ch));
229 	ch->ch_block = from;
230 	ch->ch_size = sz;
231 	ch->ch_type = CH_TYPE_ZEROES;
232 	STAILQ_INSERT_TAIL(&image_chunks, ch, ch_list);
233 	image_nchunks++;
234 	return (0);
235 }
236 
237 static int
238 image_chunk_append(lba_t blk, size_t sz, off_t ofs, int fd)
239 {
240 	struct chunk *ch;
241 
242 	ch = STAILQ_LAST(&image_chunks, chunk, ch_list);
243 	if (ch != NULL && ch->ch_type == CH_TYPE_FILE) {
244 		if (fd == ch->ch_u.file.fd &&
245 		    blk == (lba_t)(ch->ch_block + (ch->ch_size / secsz)) &&
246 		    ofs == (off_t)(ch->ch_u.file.ofs + ch->ch_size)) {
247 			sz = image_chunk_grow(ch, sz);
248 			if (sz == 0)
249 				return (0);
250 			blk = ch->ch_block + (ch->ch_size / secsz);
251 			ofs = ch->ch_u.file.ofs + ch->ch_size;
252 		}
253 	}
254 	ch = malloc(sizeof(*ch));
255 	if (ch == NULL)
256 		return (ENOMEM);
257 	memset(ch, 0, sizeof(*ch));
258 	ch->ch_block = blk;
259 	ch->ch_size = sz;
260 	ch->ch_type = CH_TYPE_FILE;
261 	ch->ch_u.file.ofs = ofs;
262 	ch->ch_u.file.fd = fd;
263 	STAILQ_INSERT_TAIL(&image_chunks, ch, ch_list);
264 	image_nchunks++;
265 	return (0);
266 }
267 
268 static int
269 image_chunk_copyin(lba_t blk, void *buf, size_t sz, off_t ofs, int fd)
270 {
271 	uint8_t *p = buf;
272 	int error;
273 
274 	error = 0;
275 	sz = (sz + secsz - 1) & ~(secsz - 1);
276 	while (!error && sz > 0) {
277 		if (is_empty_sector(p))
278 			error = image_chunk_skipto(blk + 1);
279 		else
280 			error = image_chunk_append(blk, secsz, ofs, fd);
281 		blk++;
282 		p += secsz;
283 		sz -= secsz;
284 		ofs += secsz;
285 	}
286 	return (error);
287 }
288 
289 /*
290  * File mapping support.
291  */
292 
293 static void *
294 image_file_map(int fd, off_t ofs, size_t sz)
295 {
296 	void *ptr;
297 	size_t unit;
298 	int flags, prot;
299 
300 	unit = (secsz > image_swap_pgsz) ? secsz : image_swap_pgsz;
301 	assert((unit & (unit - 1)) == 0);
302 
303 	flags = MAP_NOCORE | MAP_NOSYNC | MAP_SHARED;
304 	/* Allow writing to our swap file only. */
305 	prot = PROT_READ | ((fd == image_swap_fd) ? PROT_WRITE : 0);
306 	sz = (sz + unit - 1) & ~(unit - 1);
307 	ptr = mmap(NULL, sz, prot, flags, fd, ofs);
308 	return ((ptr == MAP_FAILED) ? NULL : ptr);
309 }
310 
311 static int
312 image_file_unmap(void *buffer, size_t sz)
313 {
314 	size_t unit;
315 
316 	unit = (secsz > image_swap_pgsz) ? secsz : image_swap_pgsz;
317 	sz = (sz + unit - 1) & ~(unit - 1);
318 	munmap(buffer, sz);
319 	return (0);
320 }
321 
322 /*
323  * Input/source file handling.
324  */
325 
326 static int
327 image_copyin_stream(lba_t blk, int fd, uint64_t *sizep)
328 {
329 	char *buffer;
330 	uint64_t bytesize;
331 	off_t swofs;
332 	size_t iosz;
333 	ssize_t rdsz;
334 	int error;
335 
336 	/*
337 	 * This makes sure we're doing I/O in multiples of the page
338 	 * size as well as of the sector size. 2MB is the minimum
339 	 * by virtue of secsz at least 512 bytes and the page size
340 	 * at least 4K bytes.
341 	 */
342 	iosz = secsz * image_swap_pgsz;
343 
344 	bytesize = 0;
345 	do {
346 		swofs = image_swap_alloc(iosz);
347 		if (swofs == -1LL)
348 			return (errno);
349 		buffer = image_file_map(image_swap_fd, swofs, iosz);
350 		if (buffer == NULL)
351 			return (errno);
352 		rdsz = read(fd, buffer, iosz);
353 		if (rdsz > 0)
354 			error = image_chunk_copyin(blk, buffer, rdsz, swofs,
355 			    image_swap_fd);
356 		else if (rdsz < 0)
357 			error = errno;
358 		else
359 			error = 0;
360 		image_file_unmap(buffer, iosz);
361 		/* XXX should we relinguish unused swap space? */
362 		if (error)
363 			return (error);
364 
365 		bytesize += rdsz;
366 		blk += (rdsz + secsz - 1) / secsz;
367 	} while (rdsz > 0);
368 
369 	if (sizep != NULL)
370 		*sizep = bytesize;
371 	return (0);
372 }
373 
374 static int
375 image_copyin_mapped(lba_t blk, int fd, uint64_t *sizep)
376 {
377 	off_t cur, data, end, hole, pos;
378 	void *buf;
379 	uint64_t bytesize;
380 	size_t iosz, sz;
381 	int error;
382 
383 	/*
384 	 * We'd like to know the size of the file and we must
385 	 * be able to seek in order to mmap(2). If this isn't
386 	 * possible, then treat the file as a stream/pipe.
387 	 */
388 	end = lseek(fd, 0L, SEEK_END);
389 	if (end == -1L)
390 		return (image_copyin_stream(blk, fd, sizep));
391 
392 	/*
393 	 * We need the file opened for the duration and our
394 	 * caller is going to close the file. Make a dup(2)
395 	 * so that control the faith of the descriptor.
396 	 */
397 	fd = dup(fd);
398 	if (fd == -1)
399 		return (errno);
400 
401 	iosz = secsz * image_swap_pgsz;
402 
403 	bytesize = 0;
404 	cur = pos = 0;
405 	error = 0;
406 	while (!error && cur < end) {
407 		hole = lseek(fd, cur, SEEK_HOLE);
408 		if (hole == -1)
409 			hole = end;
410 		data = lseek(fd, cur, SEEK_DATA);
411 		if (data == -1)
412 			data = end;
413 
414 		/*
415 		 * Treat the entire file as data if sparse files
416 		 * are not supported by the underlying file system.
417 		 */
418 		if (hole == end && data == end)
419 			data = cur;
420 
421 		if (cur == hole && data > hole) {
422 			hole = pos;
423 			pos = data & ~((uint64_t)secsz - 1);
424 
425 			blk += (pos - hole) / secsz;
426 			error = image_chunk_skipto(blk);
427 
428 			bytesize += pos - hole;
429 			cur = data;
430 		} else if (cur == data && hole > data) {
431 			data = pos;
432 			pos = (hole + secsz - 1) & ~((uint64_t)secsz - 1);
433 
434 			while (data < pos) {
435 				sz = (pos - data > (off_t)iosz)
436 				    ? iosz : (size_t)(pos - data);
437 
438 				buf = image_file_map(fd, data, sz);
439 				if (buf != NULL) {
440 					error = image_chunk_copyin(blk, buf,
441 					    sz, data, fd);
442 					image_file_unmap(buf, sz);
443 				} else
444 					error = errno;
445 
446 				blk += sz / secsz;
447 				bytesize += sz;
448 				data += sz;
449 			}
450 			cur = hole;
451 		} else {
452 			/*
453 			 * I don't know what this means or whether it
454 			 * can happen at all...
455 			 */
456 			error = EDOOFUS;
457 			break;
458 		}
459 	}
460 	if (error)
461 		close(fd);
462 	if (!error && sizep != NULL)
463 		*sizep = bytesize;
464 	return (error);
465 }
466 
467 int
468 image_copyin(lba_t blk, int fd, uint64_t *sizep)
469 {
470 	struct stat sb;
471 	int error;
472 
473 	error = image_chunk_skipto(blk);
474 	if (!error) {
475 		if (fstat(fd, &sb) == -1 || !S_ISREG(sb.st_mode))
476 			error = image_copyin_stream(blk, fd, sizep);
477 		else
478 			error = image_copyin_mapped(blk, fd, sizep);
479 	}
480 	return (error);
481 }
482 
483 /*
484  * Output/sink file handling.
485  */
486 
487 int
488 image_copyout(int fd)
489 {
490 	int error;
491 
492 	error = image_copyout_region(fd, 0, image_size);
493 	if (!error)
494 		error = image_copyout_done(fd);
495 	return (error);
496 }
497 
498 int
499 image_copyout_done(int fd)
500 {
501 	off_t ofs;
502 	int error;
503 
504 	ofs = lseek(fd, 0L, SEEK_CUR);
505 	if (ofs == -1)
506 		return (0);
507 	error = (ftruncate(fd, ofs) == -1) ? errno : 0;
508 	return (error);
509 }
510 
511 static int
512 image_copyout_memory(int fd, size_t size, void *ptr)
513 {
514 
515 	if (write(fd, ptr, size) == -1)
516 		return (errno);
517 	return (0);
518 }
519 
520 int
521 image_copyout_zeroes(int fd, size_t count)
522 {
523 	static uint8_t *zeroes = NULL;
524 	size_t sz;
525 	int error;
526 
527 	if (lseek(fd, (off_t)count, SEEK_CUR) != -1)
528 		return (0);
529 
530 	/*
531 	 * If we can't seek, we must write.
532 	 */
533 
534 	if (zeroes == NULL) {
535 		zeroes = calloc(1, secsz);
536 		if (zeroes == NULL)
537 			return (ENOMEM);
538 	}
539 
540 	while (count > 0) {
541 		sz = (count > secsz) ? secsz : count;
542 		error = image_copyout_memory(fd, sz, zeroes);
543 		if (error)
544 			return (error);
545 		count -= sz;
546 	}
547 	return (0);
548 }
549 
550 static int
551 image_copyout_file(int fd, size_t size, int ifd, off_t iofs)
552 {
553 	void *buf;
554 	size_t iosz, sz;
555 	int error;
556 
557 	iosz = secsz * image_swap_pgsz;
558 
559 	while (size > 0) {
560 		sz = (size > iosz) ? iosz : size;
561 		buf = image_file_map(ifd, iofs, sz);
562 		if (buf == NULL)
563 			return (errno);
564 		error = image_copyout_memory(fd, sz, buf);
565 		image_file_unmap(buf, sz);
566 		if (error)
567 			return (error);
568 		size -= sz;
569 		iofs += sz;
570 	}
571 	return (0);
572 }
573 
574 int
575 image_copyout_region(int fd, lba_t blk, lba_t size)
576 {
577 	struct chunk *ch;
578 	size_t ofs, sz;
579 	int error;
580 
581 	size *= secsz;
582 
583 	while (size > 0) {
584 		ch = image_chunk_find(blk);
585 		if (ch == NULL)
586 			return (EINVAL);
587 		ofs = (blk - ch->ch_block) * secsz;
588 		sz = ch->ch_size - ofs;
589 		sz = ((lba_t)sz < size) ? sz : (size_t)size;
590 		switch (ch->ch_type) {
591 		case CH_TYPE_ZEROES:
592 			error = image_copyout_zeroes(fd, sz);
593 			break;
594 		case CH_TYPE_FILE:
595 			error = image_copyout_file(fd, sz, ch->ch_u.file.fd,
596 			    ch->ch_u.file.ofs + ofs);
597 			break;
598 		case CH_TYPE_MEMORY:
599 			error = image_copyout_memory(fd, sz, ch->ch_u.mem.ptr);
600 			break;
601 		default:
602 			return (EDOOFUS);
603 		}
604 		size -= sz;
605 		blk += sz / secsz;
606 	}
607 	return (0);
608 }
609 
610 int
611 image_data(lba_t blk, lba_t size)
612 {
613 	struct chunk *ch;
614 	lba_t lim;
615 
616 	while (1) {
617 		ch = image_chunk_find(blk);
618 		if (ch == NULL)
619 			return (0);
620 		if (ch->ch_type != CH_TYPE_ZEROES)
621 			return (1);
622 		lim = ch->ch_block + (ch->ch_size / secsz);
623 		if (lim >= blk + size)
624 			return (0);
625 		size -= lim - blk;
626 		blk = lim;
627 	}
628 	/*NOTREACHED*/
629 }
630 
631 lba_t
632 image_get_size(void)
633 {
634 
635 	return (image_size);
636 }
637 
638 int
639 image_set_size(lba_t blk)
640 {
641 	int error;
642 
643 	error = image_chunk_skipto(blk);
644 	if (!error)
645 		image_size = blk;
646 	return (error);
647 }
648 
649 int
650 image_write(lba_t blk, void *buf, ssize_t len)
651 {
652 	struct chunk *ch;
653 
654 	while (len > 0) {
655 		if (!is_empty_sector(buf)) {
656 			ch = image_chunk_find(blk);
657 			if (ch == NULL)
658 				return (ENXIO);
659 			/* We may not be able to write to files. */
660 			if (ch->ch_type == CH_TYPE_FILE)
661 				return (EINVAL);
662 			if (ch->ch_type == CH_TYPE_ZEROES) {
663 				ch = image_chunk_memory(ch, blk);
664 				if (ch == NULL)
665 					return (ENOMEM);
666 			}
667 			assert(ch->ch_type == CH_TYPE_MEMORY);
668 			memcpy(ch->ch_u.mem.ptr, buf, secsz);
669 		}
670 		blk++;
671 		buf = (char *)buf + secsz;
672 		len--;
673 	}
674 	return (0);
675 }
676 
677 static void
678 image_cleanup(void)
679 {
680 	struct chunk *ch;
681 
682 	while ((ch = STAILQ_FIRST(&image_chunks)) != NULL) {
683 		switch (ch->ch_type) {
684 		case CH_TYPE_FILE:
685 			/* We may be closing the same file multiple times. */
686 			if (ch->ch_u.file.fd != -1)
687 				close(ch->ch_u.file.fd);
688 			break;
689 		case CH_TYPE_MEMORY:
690 			free(ch->ch_u.mem.ptr);
691 			break;
692 		default:
693 			break;
694 		}
695 		STAILQ_REMOVE_HEAD(&image_chunks, ch_list);
696 		free(ch);
697 	}
698 	if (image_swap_fd != -1)
699 		close(image_swap_fd);
700 	unlink(image_swap_file);
701 }
702 
703 int
704 image_init(void)
705 {
706 	const char *tmpdir;
707 
708 	STAILQ_INIT(&image_chunks);
709 	image_nchunks = 0;
710 
711 	image_swap_size = 0;
712 	image_swap_pgsz = getpagesize();
713 
714 	if (atexit(image_cleanup) == -1)
715 		return (errno);
716 	if ((tmpdir = getenv("TMPDIR")) == NULL || *tmpdir == '\0')
717 		tmpdir = _PATH_TMP;
718 	snprintf(image_swap_file, sizeof(image_swap_file), "%s/mkimg-XXXXXX",
719 	    tmpdir);
720 	image_swap_fd = mkstemp(image_swap_file);
721 	if (image_swap_fd == -1)
722 		return (errno);
723 	return (0);
724 }
725