1*3b35e7eeSXin LI // SPDX-License-Identifier: 0BSD 2*3b35e7eeSXin LI 381ad8388SMartin Matuska /////////////////////////////////////////////////////////////////////////////// 481ad8388SMartin Matuska // 581ad8388SMartin Matuska /// \file auto_decoder.c 673ed8e77SXin LI /// \brief Autodetect between .xz, .lzma (LZMA_Alone), and .lz (lzip) 781ad8388SMartin Matuska // 881ad8388SMartin Matuska // Author: Lasse Collin 981ad8388SMartin Matuska // 1081ad8388SMartin Matuska /////////////////////////////////////////////////////////////////////////////// 1181ad8388SMartin Matuska 1281ad8388SMartin Matuska #include "stream_decoder.h" 1381ad8388SMartin Matuska #include "alone_decoder.h" 1473ed8e77SXin LI #ifdef HAVE_LZIP_DECODER 1573ed8e77SXin LI # include "lzip_decoder.h" 1673ed8e77SXin LI #endif 1781ad8388SMartin Matuska 1881ad8388SMartin Matuska 191456f0f9SXin LI typedef struct { 2073ed8e77SXin LI /// .xz Stream decoder, LZMA_Alone decoder, or lzip decoder 2181ad8388SMartin Matuska lzma_next_coder next; 2281ad8388SMartin Matuska 2381ad8388SMartin Matuska uint64_t memlimit; 2481ad8388SMartin Matuska uint32_t flags; 2581ad8388SMartin Matuska 2681ad8388SMartin Matuska enum { 2781ad8388SMartin Matuska SEQ_INIT, 2881ad8388SMartin Matuska SEQ_CODE, 2981ad8388SMartin Matuska SEQ_FINISH, 3081ad8388SMartin Matuska } sequence; 311456f0f9SXin LI } lzma_auto_coder; 3281ad8388SMartin Matuska 3381ad8388SMartin Matuska 3481ad8388SMartin Matuska static lzma_ret 351456f0f9SXin LI auto_decode(void *coder_ptr, const lzma_allocator *allocator, 3681ad8388SMartin Matuska const uint8_t *restrict in, size_t *restrict in_pos, 3781ad8388SMartin Matuska size_t in_size, uint8_t *restrict out, 3881ad8388SMartin Matuska size_t *restrict out_pos, size_t out_size, lzma_action action) 3981ad8388SMartin Matuska { 401456f0f9SXin LI lzma_auto_coder *coder = coder_ptr; 411456f0f9SXin LI 4281ad8388SMartin Matuska switch (coder->sequence) { 4381ad8388SMartin Matuska case SEQ_INIT: 4481ad8388SMartin Matuska if (*in_pos >= in_size) 4581ad8388SMartin Matuska return LZMA_OK; 4681ad8388SMartin Matuska 4781ad8388SMartin Matuska // Update the sequence now, because we want to continue from 4881ad8388SMartin Matuska // SEQ_CODE even if we return some LZMA_*_CHECK. 4981ad8388SMartin Matuska coder->sequence = SEQ_CODE; 5081ad8388SMartin Matuska 5173ed8e77SXin LI // Detect the file format. .xz files start with 0xFD which 5273ed8e77SXin LI // cannot be the first byte of .lzma (LZMA_Alone) format. 5373ed8e77SXin LI // The .lz format starts with 0x4C which could be the 5473ed8e77SXin LI // first byte of a .lzma file but luckily it would mean 5573ed8e77SXin LI // lc/lp/pb being 4/3/1 which liblzma doesn't support because 5673ed8e77SXin LI // lc + lp > 4. So using just 0x4C to detect .lz is OK here. 5781ad8388SMartin Matuska if (in[*in_pos] == 0xFD) { 5881ad8388SMartin Matuska return_if_error(lzma_stream_decoder_init( 5981ad8388SMartin Matuska &coder->next, allocator, 6081ad8388SMartin Matuska coder->memlimit, coder->flags)); 6173ed8e77SXin LI #ifdef HAVE_LZIP_DECODER 6273ed8e77SXin LI } else if (in[*in_pos] == 0x4C) { 6373ed8e77SXin LI return_if_error(lzma_lzip_decoder_init( 6473ed8e77SXin LI &coder->next, allocator, 6573ed8e77SXin LI coder->memlimit, coder->flags)); 6673ed8e77SXin LI #endif 6781ad8388SMartin Matuska } else { 6881ad8388SMartin Matuska return_if_error(lzma_alone_decoder_init(&coder->next, 6942b10a37SXin LI allocator, coder->memlimit, true)); 7081ad8388SMartin Matuska 7181ad8388SMartin Matuska // If the application wants to know about missing 7281ad8388SMartin Matuska // integrity check or about the check in general, we 7381ad8388SMartin Matuska // need to handle it here, because LZMA_Alone decoder 7481ad8388SMartin Matuska // doesn't accept any flags. 7581ad8388SMartin Matuska if (coder->flags & LZMA_TELL_NO_CHECK) 7681ad8388SMartin Matuska return LZMA_NO_CHECK; 7781ad8388SMartin Matuska 7881ad8388SMartin Matuska if (coder->flags & LZMA_TELL_ANY_CHECK) 7981ad8388SMartin Matuska return LZMA_GET_CHECK; 8081ad8388SMartin Matuska } 8181ad8388SMartin Matuska 8281ad8388SMartin Matuska // Fall through 8381ad8388SMartin Matuska 8481ad8388SMartin Matuska case SEQ_CODE: { 8581ad8388SMartin Matuska const lzma_ret ret = coder->next.code( 8681ad8388SMartin Matuska coder->next.coder, allocator, 8781ad8388SMartin Matuska in, in_pos, in_size, 8881ad8388SMartin Matuska out, out_pos, out_size, action); 8981ad8388SMartin Matuska if (ret != LZMA_STREAM_END 9081ad8388SMartin Matuska || (coder->flags & LZMA_CONCATENATED) == 0) 9181ad8388SMartin Matuska return ret; 9281ad8388SMartin Matuska 9381ad8388SMartin Matuska coder->sequence = SEQ_FINISH; 9481ad8388SMartin Matuska } 9581ad8388SMartin Matuska 9681ad8388SMartin Matuska // Fall through 9781ad8388SMartin Matuska 9881ad8388SMartin Matuska case SEQ_FINISH: 999e6bbe47SXin LI // When LZMA_CONCATENATED was used and we were decoding 1009e6bbe47SXin LI // a LZMA_Alone file, we need to check that there is no 10181ad8388SMartin Matuska // trailing garbage and wait for LZMA_FINISH. 10281ad8388SMartin Matuska if (*in_pos < in_size) 10381ad8388SMartin Matuska return LZMA_DATA_ERROR; 10481ad8388SMartin Matuska 10581ad8388SMartin Matuska return action == LZMA_FINISH ? LZMA_STREAM_END : LZMA_OK; 10681ad8388SMartin Matuska 10781ad8388SMartin Matuska default: 10881ad8388SMartin Matuska assert(0); 10981ad8388SMartin Matuska return LZMA_PROG_ERROR; 11081ad8388SMartin Matuska } 11181ad8388SMartin Matuska } 11281ad8388SMartin Matuska 11381ad8388SMartin Matuska 11481ad8388SMartin Matuska static void 1151456f0f9SXin LI auto_decoder_end(void *coder_ptr, const lzma_allocator *allocator) 11681ad8388SMartin Matuska { 1171456f0f9SXin LI lzma_auto_coder *coder = coder_ptr; 11881ad8388SMartin Matuska lzma_next_end(&coder->next, allocator); 11981ad8388SMartin Matuska lzma_free(coder, allocator); 12081ad8388SMartin Matuska return; 12181ad8388SMartin Matuska } 12281ad8388SMartin Matuska 12381ad8388SMartin Matuska 12481ad8388SMartin Matuska static lzma_check 1251456f0f9SXin LI auto_decoder_get_check(const void *coder_ptr) 12681ad8388SMartin Matuska { 1271456f0f9SXin LI const lzma_auto_coder *coder = coder_ptr; 1281456f0f9SXin LI 12981ad8388SMartin Matuska // It is LZMA_Alone if get_check is NULL. 13081ad8388SMartin Matuska return coder->next.get_check == NULL ? LZMA_CHECK_NONE 13181ad8388SMartin Matuska : coder->next.get_check(coder->next.coder); 13281ad8388SMartin Matuska } 13381ad8388SMartin Matuska 13481ad8388SMartin Matuska 13581ad8388SMartin Matuska static lzma_ret 1361456f0f9SXin LI auto_decoder_memconfig(void *coder_ptr, uint64_t *memusage, 13781ad8388SMartin Matuska uint64_t *old_memlimit, uint64_t new_memlimit) 13881ad8388SMartin Matuska { 1391456f0f9SXin LI lzma_auto_coder *coder = coder_ptr; 1401456f0f9SXin LI 14181ad8388SMartin Matuska lzma_ret ret; 14281ad8388SMartin Matuska 14381ad8388SMartin Matuska if (coder->next.memconfig != NULL) { 14481ad8388SMartin Matuska ret = coder->next.memconfig(coder->next.coder, 14581ad8388SMartin Matuska memusage, old_memlimit, new_memlimit); 14681ad8388SMartin Matuska assert(*old_memlimit == coder->memlimit); 14781ad8388SMartin Matuska } else { 14881ad8388SMartin Matuska // No coder is configured yet. Use the base value as 14981ad8388SMartin Matuska // the current memory usage. 15081ad8388SMartin Matuska *memusage = LZMA_MEMUSAGE_BASE; 15181ad8388SMartin Matuska *old_memlimit = coder->memlimit; 152b71a5db3SXin LI 15381ad8388SMartin Matuska ret = LZMA_OK; 154b71a5db3SXin LI if (new_memlimit != 0 && new_memlimit < *memusage) 155b71a5db3SXin LI ret = LZMA_MEMLIMIT_ERROR; 15681ad8388SMartin Matuska } 15781ad8388SMartin Matuska 15881ad8388SMartin Matuska if (ret == LZMA_OK && new_memlimit != 0) 15981ad8388SMartin Matuska coder->memlimit = new_memlimit; 16081ad8388SMartin Matuska 16181ad8388SMartin Matuska return ret; 16281ad8388SMartin Matuska } 16381ad8388SMartin Matuska 16481ad8388SMartin Matuska 16581ad8388SMartin Matuska static lzma_ret 16653200025SRui Paulo auto_decoder_init(lzma_next_coder *next, const lzma_allocator *allocator, 16781ad8388SMartin Matuska uint64_t memlimit, uint32_t flags) 16881ad8388SMartin Matuska { 16981ad8388SMartin Matuska lzma_next_coder_init(&auto_decoder_init, next, allocator); 17081ad8388SMartin Matuska 17181ad8388SMartin Matuska if (flags & ~LZMA_SUPPORTED_FLAGS) 17281ad8388SMartin Matuska return LZMA_OPTIONS_ERROR; 17381ad8388SMartin Matuska 1741456f0f9SXin LI lzma_auto_coder *coder = next->coder; 1751456f0f9SXin LI if (coder == NULL) { 1761456f0f9SXin LI coder = lzma_alloc(sizeof(lzma_auto_coder), allocator); 1771456f0f9SXin LI if (coder == NULL) 17881ad8388SMartin Matuska return LZMA_MEM_ERROR; 17981ad8388SMartin Matuska 1801456f0f9SXin LI next->coder = coder; 18181ad8388SMartin Matuska next->code = &auto_decode; 18281ad8388SMartin Matuska next->end = &auto_decoder_end; 18381ad8388SMartin Matuska next->get_check = &auto_decoder_get_check; 18481ad8388SMartin Matuska next->memconfig = &auto_decoder_memconfig; 1851456f0f9SXin LI coder->next = LZMA_NEXT_CODER_INIT; 18681ad8388SMartin Matuska } 18781ad8388SMartin Matuska 188b71a5db3SXin LI coder->memlimit = my_max(1, memlimit); 1891456f0f9SXin LI coder->flags = flags; 1901456f0f9SXin LI coder->sequence = SEQ_INIT; 19181ad8388SMartin Matuska 19281ad8388SMartin Matuska return LZMA_OK; 19381ad8388SMartin Matuska } 19481ad8388SMartin Matuska 19581ad8388SMartin Matuska 19681ad8388SMartin Matuska extern LZMA_API(lzma_ret) 19781ad8388SMartin Matuska lzma_auto_decoder(lzma_stream *strm, uint64_t memlimit, uint32_t flags) 19881ad8388SMartin Matuska { 19981ad8388SMartin Matuska lzma_next_strm_init(auto_decoder_init, strm, memlimit, flags); 20081ad8388SMartin Matuska 20181ad8388SMartin Matuska strm->internal->supported_actions[LZMA_RUN] = true; 20281ad8388SMartin Matuska strm->internal->supported_actions[LZMA_FINISH] = true; 20381ad8388SMartin Matuska 20481ad8388SMartin Matuska return LZMA_OK; 20581ad8388SMartin Matuska } 206