xref: /freebsd/contrib/xz/src/liblzma/common/auto_decoder.c (revision 42b10a37c6580e4fa7afe04e16a7a6e82188215f)
181ad8388SMartin Matuska ///////////////////////////////////////////////////////////////////////////////
281ad8388SMartin Matuska //
381ad8388SMartin Matuska /// \file       auto_decoder.c
481ad8388SMartin Matuska /// \brief      Autodetect between .xz Stream and .lzma (LZMA_Alone) formats
581ad8388SMartin Matuska //
681ad8388SMartin Matuska //  Author:     Lasse Collin
781ad8388SMartin Matuska //
881ad8388SMartin Matuska //  This file has been put into the public domain.
981ad8388SMartin Matuska //  You can do whatever you want with this file.
1081ad8388SMartin Matuska //
1181ad8388SMartin Matuska ///////////////////////////////////////////////////////////////////////////////
1281ad8388SMartin Matuska 
1381ad8388SMartin Matuska #include "stream_decoder.h"
1481ad8388SMartin Matuska #include "alone_decoder.h"
1581ad8388SMartin Matuska 
1681ad8388SMartin Matuska 
1781ad8388SMartin Matuska struct lzma_coder_s {
1881ad8388SMartin Matuska 	/// Stream decoder or LZMA_Alone decoder
1981ad8388SMartin Matuska 	lzma_next_coder next;
2081ad8388SMartin Matuska 
2181ad8388SMartin Matuska 	uint64_t memlimit;
2281ad8388SMartin Matuska 	uint32_t flags;
2381ad8388SMartin Matuska 
2481ad8388SMartin Matuska 	enum {
2581ad8388SMartin Matuska 		SEQ_INIT,
2681ad8388SMartin Matuska 		SEQ_CODE,
2781ad8388SMartin Matuska 		SEQ_FINISH,
2881ad8388SMartin Matuska 	} sequence;
2981ad8388SMartin Matuska };
3081ad8388SMartin Matuska 
3181ad8388SMartin Matuska 
3281ad8388SMartin Matuska static lzma_ret
3381ad8388SMartin Matuska auto_decode(lzma_coder *coder, lzma_allocator *allocator,
3481ad8388SMartin Matuska 		const uint8_t *restrict in, size_t *restrict in_pos,
3581ad8388SMartin Matuska 		size_t in_size, uint8_t *restrict out,
3681ad8388SMartin Matuska 		size_t *restrict out_pos, size_t out_size, lzma_action action)
3781ad8388SMartin Matuska {
3881ad8388SMartin Matuska 	switch (coder->sequence) {
3981ad8388SMartin Matuska 	case SEQ_INIT:
4081ad8388SMartin Matuska 		if (*in_pos >= in_size)
4181ad8388SMartin Matuska 			return LZMA_OK;
4281ad8388SMartin Matuska 
4381ad8388SMartin Matuska 		// Update the sequence now, because we want to continue from
4481ad8388SMartin Matuska 		// SEQ_CODE even if we return some LZMA_*_CHECK.
4581ad8388SMartin Matuska 		coder->sequence = SEQ_CODE;
4681ad8388SMartin Matuska 
4781ad8388SMartin Matuska 		// Detect the file format. For now this is simple, since if
4881ad8388SMartin Matuska 		// it doesn't start with 0xFD (the first magic byte of the
4981ad8388SMartin Matuska 		// new format), it has to be LZMA_Alone, or something that
5081ad8388SMartin Matuska 		// we don't support at all.
5181ad8388SMartin Matuska 		if (in[*in_pos] == 0xFD) {
5281ad8388SMartin Matuska 			return_if_error(lzma_stream_decoder_init(
5381ad8388SMartin Matuska 					&coder->next, allocator,
5481ad8388SMartin Matuska 					coder->memlimit, coder->flags));
5581ad8388SMartin Matuska 		} else {
5681ad8388SMartin Matuska 			return_if_error(lzma_alone_decoder_init(&coder->next,
57*42b10a37SXin LI 					allocator, coder->memlimit, true));
5881ad8388SMartin Matuska 
5981ad8388SMartin Matuska 			// If the application wants to know about missing
6081ad8388SMartin Matuska 			// integrity check or about the check in general, we
6181ad8388SMartin Matuska 			// need to handle it here, because LZMA_Alone decoder
6281ad8388SMartin Matuska 			// doesn't accept any flags.
6381ad8388SMartin Matuska 			if (coder->flags & LZMA_TELL_NO_CHECK)
6481ad8388SMartin Matuska 				return LZMA_NO_CHECK;
6581ad8388SMartin Matuska 
6681ad8388SMartin Matuska 			if (coder->flags & LZMA_TELL_ANY_CHECK)
6781ad8388SMartin Matuska 				return LZMA_GET_CHECK;
6881ad8388SMartin Matuska 		}
6981ad8388SMartin Matuska 
7081ad8388SMartin Matuska 	// Fall through
7181ad8388SMartin Matuska 
7281ad8388SMartin Matuska 	case SEQ_CODE: {
7381ad8388SMartin Matuska 		const lzma_ret ret = coder->next.code(
7481ad8388SMartin Matuska 				coder->next.coder, allocator,
7581ad8388SMartin Matuska 				in, in_pos, in_size,
7681ad8388SMartin Matuska 				out, out_pos, out_size, action);
7781ad8388SMartin Matuska 		if (ret != LZMA_STREAM_END
7881ad8388SMartin Matuska 				|| (coder->flags & LZMA_CONCATENATED) == 0)
7981ad8388SMartin Matuska 			return ret;
8081ad8388SMartin Matuska 
8181ad8388SMartin Matuska 		coder->sequence = SEQ_FINISH;
8281ad8388SMartin Matuska 	}
8381ad8388SMartin Matuska 
8481ad8388SMartin Matuska 	// Fall through
8581ad8388SMartin Matuska 
8681ad8388SMartin Matuska 	case SEQ_FINISH:
8781ad8388SMartin Matuska 		// When LZMA_DECODE_CONCATENATED was used and we were decoding
8881ad8388SMartin Matuska 		// LZMA_Alone file, we need to check check that there is no
8981ad8388SMartin Matuska 		// trailing garbage and wait for LZMA_FINISH.
9081ad8388SMartin Matuska 		if (*in_pos < in_size)
9181ad8388SMartin Matuska 			return LZMA_DATA_ERROR;
9281ad8388SMartin Matuska 
9381ad8388SMartin Matuska 		return action == LZMA_FINISH ? LZMA_STREAM_END : LZMA_OK;
9481ad8388SMartin Matuska 
9581ad8388SMartin Matuska 	default:
9681ad8388SMartin Matuska 		assert(0);
9781ad8388SMartin Matuska 		return LZMA_PROG_ERROR;
9881ad8388SMartin Matuska 	}
9981ad8388SMartin Matuska }
10081ad8388SMartin Matuska 
10181ad8388SMartin Matuska 
10281ad8388SMartin Matuska static void
10381ad8388SMartin Matuska auto_decoder_end(lzma_coder *coder, lzma_allocator *allocator)
10481ad8388SMartin Matuska {
10581ad8388SMartin Matuska 	lzma_next_end(&coder->next, allocator);
10681ad8388SMartin Matuska 	lzma_free(coder, allocator);
10781ad8388SMartin Matuska 	return;
10881ad8388SMartin Matuska }
10981ad8388SMartin Matuska 
11081ad8388SMartin Matuska 
11181ad8388SMartin Matuska static lzma_check
11281ad8388SMartin Matuska auto_decoder_get_check(const lzma_coder *coder)
11381ad8388SMartin Matuska {
11481ad8388SMartin Matuska 	// It is LZMA_Alone if get_check is NULL.
11581ad8388SMartin Matuska 	return coder->next.get_check == NULL ? LZMA_CHECK_NONE
11681ad8388SMartin Matuska 			: coder->next.get_check(coder->next.coder);
11781ad8388SMartin Matuska }
11881ad8388SMartin Matuska 
11981ad8388SMartin Matuska 
12081ad8388SMartin Matuska static lzma_ret
12181ad8388SMartin Matuska auto_decoder_memconfig(lzma_coder *coder, uint64_t *memusage,
12281ad8388SMartin Matuska 		uint64_t *old_memlimit, uint64_t new_memlimit)
12381ad8388SMartin Matuska {
12481ad8388SMartin Matuska 	lzma_ret ret;
12581ad8388SMartin Matuska 
12681ad8388SMartin Matuska 	if (coder->next.memconfig != NULL) {
12781ad8388SMartin Matuska 		ret = coder->next.memconfig(coder->next.coder,
12881ad8388SMartin Matuska 				memusage, old_memlimit, new_memlimit);
12981ad8388SMartin Matuska 		assert(*old_memlimit == coder->memlimit);
13081ad8388SMartin Matuska 	} else {
13181ad8388SMartin Matuska 		// No coder is configured yet. Use the base value as
13281ad8388SMartin Matuska 		// the current memory usage.
13381ad8388SMartin Matuska 		*memusage = LZMA_MEMUSAGE_BASE;
13481ad8388SMartin Matuska 		*old_memlimit = coder->memlimit;
13581ad8388SMartin Matuska 		ret = LZMA_OK;
13681ad8388SMartin Matuska 	}
13781ad8388SMartin Matuska 
13881ad8388SMartin Matuska 	if (ret == LZMA_OK && new_memlimit != 0)
13981ad8388SMartin Matuska 		coder->memlimit = new_memlimit;
14081ad8388SMartin Matuska 
14181ad8388SMartin Matuska 	return ret;
14281ad8388SMartin Matuska }
14381ad8388SMartin Matuska 
14481ad8388SMartin Matuska 
14581ad8388SMartin Matuska static lzma_ret
14681ad8388SMartin Matuska auto_decoder_init(lzma_next_coder *next, lzma_allocator *allocator,
14781ad8388SMartin Matuska 		uint64_t memlimit, uint32_t flags)
14881ad8388SMartin Matuska {
14981ad8388SMartin Matuska 	lzma_next_coder_init(&auto_decoder_init, next, allocator);
15081ad8388SMartin Matuska 
15181ad8388SMartin Matuska 	if (memlimit == 0)
15281ad8388SMartin Matuska 		return LZMA_PROG_ERROR;
15381ad8388SMartin Matuska 
15481ad8388SMartin Matuska 	if (flags & ~LZMA_SUPPORTED_FLAGS)
15581ad8388SMartin Matuska 		return LZMA_OPTIONS_ERROR;
15681ad8388SMartin Matuska 
15781ad8388SMartin Matuska 	if (next->coder == NULL) {
15881ad8388SMartin Matuska 		next->coder = lzma_alloc(sizeof(lzma_coder), allocator);
15981ad8388SMartin Matuska 		if (next->coder == NULL)
16081ad8388SMartin Matuska 			return LZMA_MEM_ERROR;
16181ad8388SMartin Matuska 
16281ad8388SMartin Matuska 		next->code = &auto_decode;
16381ad8388SMartin Matuska 		next->end = &auto_decoder_end;
16481ad8388SMartin Matuska 		next->get_check = &auto_decoder_get_check;
16581ad8388SMartin Matuska 		next->memconfig = &auto_decoder_memconfig;
16681ad8388SMartin Matuska 		next->coder->next = LZMA_NEXT_CODER_INIT;
16781ad8388SMartin Matuska 	}
16881ad8388SMartin Matuska 
16981ad8388SMartin Matuska 	next->coder->memlimit = memlimit;
17081ad8388SMartin Matuska 	next->coder->flags = flags;
17181ad8388SMartin Matuska 	next->coder->sequence = SEQ_INIT;
17281ad8388SMartin Matuska 
17381ad8388SMartin Matuska 	return LZMA_OK;
17481ad8388SMartin Matuska }
17581ad8388SMartin Matuska 
17681ad8388SMartin Matuska 
17781ad8388SMartin Matuska extern LZMA_API(lzma_ret)
17881ad8388SMartin Matuska lzma_auto_decoder(lzma_stream *strm, uint64_t memlimit, uint32_t flags)
17981ad8388SMartin Matuska {
18081ad8388SMartin Matuska 	lzma_next_strm_init(auto_decoder_init, strm, memlimit, flags);
18181ad8388SMartin Matuska 
18281ad8388SMartin Matuska 	strm->internal->supported_actions[LZMA_RUN] = true;
18381ad8388SMartin Matuska 	strm->internal->supported_actions[LZMA_FINISH] = true;
18481ad8388SMartin Matuska 
18581ad8388SMartin Matuska 	return LZMA_OK;
18681ad8388SMartin Matuska }
187