xref: /freebsd/contrib/xz/src/liblzma/common/auto_decoder.c (revision 3b35e7ee8de9b0260149a2b77e87a2b9c7a36244)
1*3b35e7eeSXin LI // SPDX-License-Identifier: 0BSD
2*3b35e7eeSXin LI 
381ad8388SMartin Matuska ///////////////////////////////////////////////////////////////////////////////
481ad8388SMartin Matuska //
581ad8388SMartin Matuska /// \file       auto_decoder.c
673ed8e77SXin LI /// \brief      Autodetect between .xz, .lzma (LZMA_Alone), and .lz (lzip)
781ad8388SMartin Matuska //
881ad8388SMartin Matuska //  Author:     Lasse Collin
981ad8388SMartin Matuska //
1081ad8388SMartin Matuska ///////////////////////////////////////////////////////////////////////////////
1181ad8388SMartin Matuska 
1281ad8388SMartin Matuska #include "stream_decoder.h"
1381ad8388SMartin Matuska #include "alone_decoder.h"
1473ed8e77SXin LI #ifdef HAVE_LZIP_DECODER
1573ed8e77SXin LI #	include "lzip_decoder.h"
1673ed8e77SXin LI #endif
1781ad8388SMartin Matuska 
1881ad8388SMartin Matuska 
191456f0f9SXin LI typedef struct {
2073ed8e77SXin LI 	/// .xz Stream decoder, LZMA_Alone decoder, or lzip decoder
2181ad8388SMartin Matuska 	lzma_next_coder next;
2281ad8388SMartin Matuska 
2381ad8388SMartin Matuska 	uint64_t memlimit;
2481ad8388SMartin Matuska 	uint32_t flags;
2581ad8388SMartin Matuska 
2681ad8388SMartin Matuska 	enum {
2781ad8388SMartin Matuska 		SEQ_INIT,
2881ad8388SMartin Matuska 		SEQ_CODE,
2981ad8388SMartin Matuska 		SEQ_FINISH,
3081ad8388SMartin Matuska 	} sequence;
311456f0f9SXin LI } lzma_auto_coder;
3281ad8388SMartin Matuska 
3381ad8388SMartin Matuska 
3481ad8388SMartin Matuska static lzma_ret
351456f0f9SXin LI auto_decode(void *coder_ptr, const lzma_allocator *allocator,
3681ad8388SMartin Matuska 		const uint8_t *restrict in, size_t *restrict in_pos,
3781ad8388SMartin Matuska 		size_t in_size, uint8_t *restrict out,
3881ad8388SMartin Matuska 		size_t *restrict out_pos, size_t out_size, lzma_action action)
3981ad8388SMartin Matuska {
401456f0f9SXin LI 	lzma_auto_coder *coder = coder_ptr;
411456f0f9SXin LI 
4281ad8388SMartin Matuska 	switch (coder->sequence) {
4381ad8388SMartin Matuska 	case SEQ_INIT:
4481ad8388SMartin Matuska 		if (*in_pos >= in_size)
4581ad8388SMartin Matuska 			return LZMA_OK;
4681ad8388SMartin Matuska 
4781ad8388SMartin Matuska 		// Update the sequence now, because we want to continue from
4881ad8388SMartin Matuska 		// SEQ_CODE even if we return some LZMA_*_CHECK.
4981ad8388SMartin Matuska 		coder->sequence = SEQ_CODE;
5081ad8388SMartin Matuska 
5173ed8e77SXin LI 		// Detect the file format. .xz files start with 0xFD which
5273ed8e77SXin LI 		// cannot be the first byte of .lzma (LZMA_Alone) format.
5373ed8e77SXin LI 		// The .lz format starts with 0x4C which could be the
5473ed8e77SXin LI 		// first byte of a .lzma file but luckily it would mean
5573ed8e77SXin LI 		// lc/lp/pb being 4/3/1 which liblzma doesn't support because
5673ed8e77SXin LI 		// lc + lp > 4. So using just 0x4C to detect .lz is OK here.
5781ad8388SMartin Matuska 		if (in[*in_pos] == 0xFD) {
5881ad8388SMartin Matuska 			return_if_error(lzma_stream_decoder_init(
5981ad8388SMartin Matuska 					&coder->next, allocator,
6081ad8388SMartin Matuska 					coder->memlimit, coder->flags));
6173ed8e77SXin LI #ifdef HAVE_LZIP_DECODER
6273ed8e77SXin LI 		} else if (in[*in_pos] == 0x4C) {
6373ed8e77SXin LI 			return_if_error(lzma_lzip_decoder_init(
6473ed8e77SXin LI 					&coder->next, allocator,
6573ed8e77SXin LI 					coder->memlimit, coder->flags));
6673ed8e77SXin LI #endif
6781ad8388SMartin Matuska 		} else {
6881ad8388SMartin Matuska 			return_if_error(lzma_alone_decoder_init(&coder->next,
6942b10a37SXin LI 					allocator, coder->memlimit, true));
7081ad8388SMartin Matuska 
7181ad8388SMartin Matuska 			// If the application wants to know about missing
7281ad8388SMartin Matuska 			// integrity check or about the check in general, we
7381ad8388SMartin Matuska 			// need to handle it here, because LZMA_Alone decoder
7481ad8388SMartin Matuska 			// doesn't accept any flags.
7581ad8388SMartin Matuska 			if (coder->flags & LZMA_TELL_NO_CHECK)
7681ad8388SMartin Matuska 				return LZMA_NO_CHECK;
7781ad8388SMartin Matuska 
7881ad8388SMartin Matuska 			if (coder->flags & LZMA_TELL_ANY_CHECK)
7981ad8388SMartin Matuska 				return LZMA_GET_CHECK;
8081ad8388SMartin Matuska 		}
8181ad8388SMartin Matuska 
8281ad8388SMartin Matuska 	// Fall through
8381ad8388SMartin Matuska 
8481ad8388SMartin Matuska 	case SEQ_CODE: {
8581ad8388SMartin Matuska 		const lzma_ret ret = coder->next.code(
8681ad8388SMartin Matuska 				coder->next.coder, allocator,
8781ad8388SMartin Matuska 				in, in_pos, in_size,
8881ad8388SMartin Matuska 				out, out_pos, out_size, action);
8981ad8388SMartin Matuska 		if (ret != LZMA_STREAM_END
9081ad8388SMartin Matuska 				|| (coder->flags & LZMA_CONCATENATED) == 0)
9181ad8388SMartin Matuska 			return ret;
9281ad8388SMartin Matuska 
9381ad8388SMartin Matuska 		coder->sequence = SEQ_FINISH;
9481ad8388SMartin Matuska 	}
9581ad8388SMartin Matuska 
9681ad8388SMartin Matuska 	// Fall through
9781ad8388SMartin Matuska 
9881ad8388SMartin Matuska 	case SEQ_FINISH:
999e6bbe47SXin LI 		// When LZMA_CONCATENATED was used and we were decoding
1009e6bbe47SXin LI 		// a LZMA_Alone file, we need to check that there is no
10181ad8388SMartin Matuska 		// trailing garbage and wait for LZMA_FINISH.
10281ad8388SMartin Matuska 		if (*in_pos < in_size)
10381ad8388SMartin Matuska 			return LZMA_DATA_ERROR;
10481ad8388SMartin Matuska 
10581ad8388SMartin Matuska 		return action == LZMA_FINISH ? LZMA_STREAM_END : LZMA_OK;
10681ad8388SMartin Matuska 
10781ad8388SMartin Matuska 	default:
10881ad8388SMartin Matuska 		assert(0);
10981ad8388SMartin Matuska 		return LZMA_PROG_ERROR;
11081ad8388SMartin Matuska 	}
11181ad8388SMartin Matuska }
11281ad8388SMartin Matuska 
11381ad8388SMartin Matuska 
11481ad8388SMartin Matuska static void
1151456f0f9SXin LI auto_decoder_end(void *coder_ptr, const lzma_allocator *allocator)
11681ad8388SMartin Matuska {
1171456f0f9SXin LI 	lzma_auto_coder *coder = coder_ptr;
11881ad8388SMartin Matuska 	lzma_next_end(&coder->next, allocator);
11981ad8388SMartin Matuska 	lzma_free(coder, allocator);
12081ad8388SMartin Matuska 	return;
12181ad8388SMartin Matuska }
12281ad8388SMartin Matuska 
12381ad8388SMartin Matuska 
12481ad8388SMartin Matuska static lzma_check
1251456f0f9SXin LI auto_decoder_get_check(const void *coder_ptr)
12681ad8388SMartin Matuska {
1271456f0f9SXin LI 	const lzma_auto_coder *coder = coder_ptr;
1281456f0f9SXin LI 
12981ad8388SMartin Matuska 	// It is LZMA_Alone if get_check is NULL.
13081ad8388SMartin Matuska 	return coder->next.get_check == NULL ? LZMA_CHECK_NONE
13181ad8388SMartin Matuska 			: coder->next.get_check(coder->next.coder);
13281ad8388SMartin Matuska }
13381ad8388SMartin Matuska 
13481ad8388SMartin Matuska 
13581ad8388SMartin Matuska static lzma_ret
1361456f0f9SXin LI auto_decoder_memconfig(void *coder_ptr, uint64_t *memusage,
13781ad8388SMartin Matuska 		uint64_t *old_memlimit, uint64_t new_memlimit)
13881ad8388SMartin Matuska {
1391456f0f9SXin LI 	lzma_auto_coder *coder = coder_ptr;
1401456f0f9SXin LI 
14181ad8388SMartin Matuska 	lzma_ret ret;
14281ad8388SMartin Matuska 
14381ad8388SMartin Matuska 	if (coder->next.memconfig != NULL) {
14481ad8388SMartin Matuska 		ret = coder->next.memconfig(coder->next.coder,
14581ad8388SMartin Matuska 				memusage, old_memlimit, new_memlimit);
14681ad8388SMartin Matuska 		assert(*old_memlimit == coder->memlimit);
14781ad8388SMartin Matuska 	} else {
14881ad8388SMartin Matuska 		// No coder is configured yet. Use the base value as
14981ad8388SMartin Matuska 		// the current memory usage.
15081ad8388SMartin Matuska 		*memusage = LZMA_MEMUSAGE_BASE;
15181ad8388SMartin Matuska 		*old_memlimit = coder->memlimit;
152b71a5db3SXin LI 
15381ad8388SMartin Matuska 		ret = LZMA_OK;
154b71a5db3SXin LI 		if (new_memlimit != 0 && new_memlimit < *memusage)
155b71a5db3SXin LI 			ret = LZMA_MEMLIMIT_ERROR;
15681ad8388SMartin Matuska 	}
15781ad8388SMartin Matuska 
15881ad8388SMartin Matuska 	if (ret == LZMA_OK && new_memlimit != 0)
15981ad8388SMartin Matuska 		coder->memlimit = new_memlimit;
16081ad8388SMartin Matuska 
16181ad8388SMartin Matuska 	return ret;
16281ad8388SMartin Matuska }
16381ad8388SMartin Matuska 
16481ad8388SMartin Matuska 
16581ad8388SMartin Matuska static lzma_ret
16653200025SRui Paulo auto_decoder_init(lzma_next_coder *next, const lzma_allocator *allocator,
16781ad8388SMartin Matuska 		uint64_t memlimit, uint32_t flags)
16881ad8388SMartin Matuska {
16981ad8388SMartin Matuska 	lzma_next_coder_init(&auto_decoder_init, next, allocator);
17081ad8388SMartin Matuska 
17181ad8388SMartin Matuska 	if (flags & ~LZMA_SUPPORTED_FLAGS)
17281ad8388SMartin Matuska 		return LZMA_OPTIONS_ERROR;
17381ad8388SMartin Matuska 
1741456f0f9SXin LI 	lzma_auto_coder *coder = next->coder;
1751456f0f9SXin LI 	if (coder == NULL) {
1761456f0f9SXin LI 		coder = lzma_alloc(sizeof(lzma_auto_coder), allocator);
1771456f0f9SXin LI 		if (coder == NULL)
17881ad8388SMartin Matuska 			return LZMA_MEM_ERROR;
17981ad8388SMartin Matuska 
1801456f0f9SXin LI 		next->coder = coder;
18181ad8388SMartin Matuska 		next->code = &auto_decode;
18281ad8388SMartin Matuska 		next->end = &auto_decoder_end;
18381ad8388SMartin Matuska 		next->get_check = &auto_decoder_get_check;
18481ad8388SMartin Matuska 		next->memconfig = &auto_decoder_memconfig;
1851456f0f9SXin LI 		coder->next = LZMA_NEXT_CODER_INIT;
18681ad8388SMartin Matuska 	}
18781ad8388SMartin Matuska 
188b71a5db3SXin LI 	coder->memlimit = my_max(1, memlimit);
1891456f0f9SXin LI 	coder->flags = flags;
1901456f0f9SXin LI 	coder->sequence = SEQ_INIT;
19181ad8388SMartin Matuska 
19281ad8388SMartin Matuska 	return LZMA_OK;
19381ad8388SMartin Matuska }
19481ad8388SMartin Matuska 
19581ad8388SMartin Matuska 
19681ad8388SMartin Matuska extern LZMA_API(lzma_ret)
19781ad8388SMartin Matuska lzma_auto_decoder(lzma_stream *strm, uint64_t memlimit, uint32_t flags)
19881ad8388SMartin Matuska {
19981ad8388SMartin Matuska 	lzma_next_strm_init(auto_decoder_init, strm, memlimit, flags);
20081ad8388SMartin Matuska 
20181ad8388SMartin Matuska 	strm->internal->supported_actions[LZMA_RUN] = true;
20281ad8388SMartin Matuska 	strm->internal->supported_actions[LZMA_FINISH] = true;
20381ad8388SMartin Matuska 
20481ad8388SMartin Matuska 	return LZMA_OK;
20581ad8388SMartin Matuska }
206