xref: /freebsd/contrib/xz/src/liblzma/common/auto_decoder.c (revision b71a5db306ab1ad1e23c7f9e3c949c6218f43455)
181ad8388SMartin Matuska ///////////////////////////////////////////////////////////////////////////////
281ad8388SMartin Matuska //
381ad8388SMartin Matuska /// \file       auto_decoder.c
481ad8388SMartin Matuska /// \brief      Autodetect between .xz Stream and .lzma (LZMA_Alone) formats
581ad8388SMartin Matuska //
681ad8388SMartin Matuska //  Author:     Lasse Collin
781ad8388SMartin Matuska //
881ad8388SMartin Matuska //  This file has been put into the public domain.
981ad8388SMartin Matuska //  You can do whatever you want with this file.
1081ad8388SMartin Matuska //
1181ad8388SMartin Matuska ///////////////////////////////////////////////////////////////////////////////
1281ad8388SMartin Matuska 
1381ad8388SMartin Matuska #include "stream_decoder.h"
1481ad8388SMartin Matuska #include "alone_decoder.h"
1581ad8388SMartin Matuska 
1681ad8388SMartin Matuska 
171456f0f9SXin LI typedef struct {
1881ad8388SMartin Matuska 	/// Stream decoder or LZMA_Alone decoder
1981ad8388SMartin Matuska 	lzma_next_coder next;
2081ad8388SMartin Matuska 
2181ad8388SMartin Matuska 	uint64_t memlimit;
2281ad8388SMartin Matuska 	uint32_t flags;
2381ad8388SMartin Matuska 
2481ad8388SMartin Matuska 	enum {
2581ad8388SMartin Matuska 		SEQ_INIT,
2681ad8388SMartin Matuska 		SEQ_CODE,
2781ad8388SMartin Matuska 		SEQ_FINISH,
2881ad8388SMartin Matuska 	} sequence;
291456f0f9SXin LI } lzma_auto_coder;
3081ad8388SMartin Matuska 
3181ad8388SMartin Matuska 
3281ad8388SMartin Matuska static lzma_ret
331456f0f9SXin LI auto_decode(void *coder_ptr, const lzma_allocator *allocator,
3481ad8388SMartin Matuska 		const uint8_t *restrict in, size_t *restrict in_pos,
3581ad8388SMartin Matuska 		size_t in_size, uint8_t *restrict out,
3681ad8388SMartin Matuska 		size_t *restrict out_pos, size_t out_size, lzma_action action)
3781ad8388SMartin Matuska {
381456f0f9SXin LI 	lzma_auto_coder *coder = coder_ptr;
391456f0f9SXin LI 
4081ad8388SMartin Matuska 	switch (coder->sequence) {
4181ad8388SMartin Matuska 	case SEQ_INIT:
4281ad8388SMartin Matuska 		if (*in_pos >= in_size)
4381ad8388SMartin Matuska 			return LZMA_OK;
4481ad8388SMartin Matuska 
4581ad8388SMartin Matuska 		// Update the sequence now, because we want to continue from
4681ad8388SMartin Matuska 		// SEQ_CODE even if we return some LZMA_*_CHECK.
4781ad8388SMartin Matuska 		coder->sequence = SEQ_CODE;
4881ad8388SMartin Matuska 
4981ad8388SMartin Matuska 		// Detect the file format. For now this is simple, since if
5081ad8388SMartin Matuska 		// it doesn't start with 0xFD (the first magic byte of the
5181ad8388SMartin Matuska 		// new format), it has to be LZMA_Alone, or something that
5281ad8388SMartin Matuska 		// we don't support at all.
5381ad8388SMartin Matuska 		if (in[*in_pos] == 0xFD) {
5481ad8388SMartin Matuska 			return_if_error(lzma_stream_decoder_init(
5581ad8388SMartin Matuska 					&coder->next, allocator,
5681ad8388SMartin Matuska 					coder->memlimit, coder->flags));
5781ad8388SMartin Matuska 		} else {
5881ad8388SMartin Matuska 			return_if_error(lzma_alone_decoder_init(&coder->next,
5942b10a37SXin LI 					allocator, coder->memlimit, true));
6081ad8388SMartin Matuska 
6181ad8388SMartin Matuska 			// If the application wants to know about missing
6281ad8388SMartin Matuska 			// integrity check or about the check in general, we
6381ad8388SMartin Matuska 			// need to handle it here, because LZMA_Alone decoder
6481ad8388SMartin Matuska 			// doesn't accept any flags.
6581ad8388SMartin Matuska 			if (coder->flags & LZMA_TELL_NO_CHECK)
6681ad8388SMartin Matuska 				return LZMA_NO_CHECK;
6781ad8388SMartin Matuska 
6881ad8388SMartin Matuska 			if (coder->flags & LZMA_TELL_ANY_CHECK)
6981ad8388SMartin Matuska 				return LZMA_GET_CHECK;
7081ad8388SMartin Matuska 		}
7181ad8388SMartin Matuska 
7281ad8388SMartin Matuska 	// Fall through
7381ad8388SMartin Matuska 
7481ad8388SMartin Matuska 	case SEQ_CODE: {
7581ad8388SMartin Matuska 		const lzma_ret ret = coder->next.code(
7681ad8388SMartin Matuska 				coder->next.coder, allocator,
7781ad8388SMartin Matuska 				in, in_pos, in_size,
7881ad8388SMartin Matuska 				out, out_pos, out_size, action);
7981ad8388SMartin Matuska 		if (ret != LZMA_STREAM_END
8081ad8388SMartin Matuska 				|| (coder->flags & LZMA_CONCATENATED) == 0)
8181ad8388SMartin Matuska 			return ret;
8281ad8388SMartin Matuska 
8381ad8388SMartin Matuska 		coder->sequence = SEQ_FINISH;
8481ad8388SMartin Matuska 	}
8581ad8388SMartin Matuska 
8681ad8388SMartin Matuska 	// Fall through
8781ad8388SMartin Matuska 
8881ad8388SMartin Matuska 	case SEQ_FINISH:
8981ad8388SMartin Matuska 		// When LZMA_DECODE_CONCATENATED was used and we were decoding
9081ad8388SMartin Matuska 		// LZMA_Alone file, we need to check check that there is no
9181ad8388SMartin Matuska 		// trailing garbage and wait for LZMA_FINISH.
9281ad8388SMartin Matuska 		if (*in_pos < in_size)
9381ad8388SMartin Matuska 			return LZMA_DATA_ERROR;
9481ad8388SMartin Matuska 
9581ad8388SMartin Matuska 		return action == LZMA_FINISH ? LZMA_STREAM_END : LZMA_OK;
9681ad8388SMartin Matuska 
9781ad8388SMartin Matuska 	default:
9881ad8388SMartin Matuska 		assert(0);
9981ad8388SMartin Matuska 		return LZMA_PROG_ERROR;
10081ad8388SMartin Matuska 	}
10181ad8388SMartin Matuska }
10281ad8388SMartin Matuska 
10381ad8388SMartin Matuska 
10481ad8388SMartin Matuska static void
1051456f0f9SXin LI auto_decoder_end(void *coder_ptr, const lzma_allocator *allocator)
10681ad8388SMartin Matuska {
1071456f0f9SXin LI 	lzma_auto_coder *coder = coder_ptr;
10881ad8388SMartin Matuska 	lzma_next_end(&coder->next, allocator);
10981ad8388SMartin Matuska 	lzma_free(coder, allocator);
11081ad8388SMartin Matuska 	return;
11181ad8388SMartin Matuska }
11281ad8388SMartin Matuska 
11381ad8388SMartin Matuska 
11481ad8388SMartin Matuska static lzma_check
1151456f0f9SXin LI auto_decoder_get_check(const void *coder_ptr)
11681ad8388SMartin Matuska {
1171456f0f9SXin LI 	const lzma_auto_coder *coder = coder_ptr;
1181456f0f9SXin LI 
11981ad8388SMartin Matuska 	// It is LZMA_Alone if get_check is NULL.
12081ad8388SMartin Matuska 	return coder->next.get_check == NULL ? LZMA_CHECK_NONE
12181ad8388SMartin Matuska 			: coder->next.get_check(coder->next.coder);
12281ad8388SMartin Matuska }
12381ad8388SMartin Matuska 
12481ad8388SMartin Matuska 
12581ad8388SMartin Matuska static lzma_ret
1261456f0f9SXin LI auto_decoder_memconfig(void *coder_ptr, uint64_t *memusage,
12781ad8388SMartin Matuska 		uint64_t *old_memlimit, uint64_t new_memlimit)
12881ad8388SMartin Matuska {
1291456f0f9SXin LI 	lzma_auto_coder *coder = coder_ptr;
1301456f0f9SXin LI 
13181ad8388SMartin Matuska 	lzma_ret ret;
13281ad8388SMartin Matuska 
13381ad8388SMartin Matuska 	if (coder->next.memconfig != NULL) {
13481ad8388SMartin Matuska 		ret = coder->next.memconfig(coder->next.coder,
13581ad8388SMartin Matuska 				memusage, old_memlimit, new_memlimit);
13681ad8388SMartin Matuska 		assert(*old_memlimit == coder->memlimit);
13781ad8388SMartin Matuska 	} else {
13881ad8388SMartin Matuska 		// No coder is configured yet. Use the base value as
13981ad8388SMartin Matuska 		// the current memory usage.
14081ad8388SMartin Matuska 		*memusage = LZMA_MEMUSAGE_BASE;
14181ad8388SMartin Matuska 		*old_memlimit = coder->memlimit;
142*b71a5db3SXin LI 
14381ad8388SMartin Matuska 		ret = LZMA_OK;
144*b71a5db3SXin LI 		if (new_memlimit != 0 && new_memlimit < *memusage)
145*b71a5db3SXin LI 			ret = LZMA_MEMLIMIT_ERROR;
14681ad8388SMartin Matuska 	}
14781ad8388SMartin Matuska 
14881ad8388SMartin Matuska 	if (ret == LZMA_OK && new_memlimit != 0)
14981ad8388SMartin Matuska 		coder->memlimit = new_memlimit;
15081ad8388SMartin Matuska 
15181ad8388SMartin Matuska 	return ret;
15281ad8388SMartin Matuska }
15381ad8388SMartin Matuska 
15481ad8388SMartin Matuska 
15581ad8388SMartin Matuska static lzma_ret
15653200025SRui Paulo auto_decoder_init(lzma_next_coder *next, const lzma_allocator *allocator,
15781ad8388SMartin Matuska 		uint64_t memlimit, uint32_t flags)
15881ad8388SMartin Matuska {
15981ad8388SMartin Matuska 	lzma_next_coder_init(&auto_decoder_init, next, allocator);
16081ad8388SMartin Matuska 
16181ad8388SMartin Matuska 	if (flags & ~LZMA_SUPPORTED_FLAGS)
16281ad8388SMartin Matuska 		return LZMA_OPTIONS_ERROR;
16381ad8388SMartin Matuska 
1641456f0f9SXin LI 	lzma_auto_coder *coder = next->coder;
1651456f0f9SXin LI 	if (coder == NULL) {
1661456f0f9SXin LI 		coder = lzma_alloc(sizeof(lzma_auto_coder), allocator);
1671456f0f9SXin LI 		if (coder == NULL)
16881ad8388SMartin Matuska 			return LZMA_MEM_ERROR;
16981ad8388SMartin Matuska 
1701456f0f9SXin LI 		next->coder = coder;
17181ad8388SMartin Matuska 		next->code = &auto_decode;
17281ad8388SMartin Matuska 		next->end = &auto_decoder_end;
17381ad8388SMartin Matuska 		next->get_check = &auto_decoder_get_check;
17481ad8388SMartin Matuska 		next->memconfig = &auto_decoder_memconfig;
1751456f0f9SXin LI 		coder->next = LZMA_NEXT_CODER_INIT;
17681ad8388SMartin Matuska 	}
17781ad8388SMartin Matuska 
178*b71a5db3SXin LI 	coder->memlimit = my_max(1, memlimit);
1791456f0f9SXin LI 	coder->flags = flags;
1801456f0f9SXin LI 	coder->sequence = SEQ_INIT;
18181ad8388SMartin Matuska 
18281ad8388SMartin Matuska 	return LZMA_OK;
18381ad8388SMartin Matuska }
18481ad8388SMartin Matuska 
18581ad8388SMartin Matuska 
18681ad8388SMartin Matuska extern LZMA_API(lzma_ret)
18781ad8388SMartin Matuska lzma_auto_decoder(lzma_stream *strm, uint64_t memlimit, uint32_t flags)
18881ad8388SMartin Matuska {
18981ad8388SMartin Matuska 	lzma_next_strm_init(auto_decoder_init, strm, memlimit, flags);
19081ad8388SMartin Matuska 
19181ad8388SMartin Matuska 	strm->internal->supported_actions[LZMA_RUN] = true;
19281ad8388SMartin Matuska 	strm->internal->supported_actions[LZMA_FINISH] = true;
19381ad8388SMartin Matuska 
19481ad8388SMartin Matuska 	return LZMA_OK;
19581ad8388SMartin Matuska }
196