1*3b35e7eeSXin LI // SPDX-License-Identifier: 0BSD 2*3b35e7eeSXin LI 381ad8388SMartin Matuska /////////////////////////////////////////////////////////////////////////////// 481ad8388SMartin Matuska // 581ad8388SMartin Matuska /// \file lz_encoder_hash.h 681ad8388SMartin Matuska /// \brief Hash macros for match finders 781ad8388SMartin Matuska // 881ad8388SMartin Matuska // Author: Igor Pavlov 981ad8388SMartin Matuska // 1081ad8388SMartin Matuska /////////////////////////////////////////////////////////////////////////////// 1181ad8388SMartin Matuska 1281ad8388SMartin Matuska #ifndef LZMA_LZ_ENCODER_HASH_H 1381ad8388SMartin Matuska #define LZMA_LZ_ENCODER_HASH_H 1481ad8388SMartin Matuska 1581ad8388SMartin Matuska #if defined(WORDS_BIGENDIAN) && !defined(HAVE_SMALL) 1681ad8388SMartin Matuska // This is to make liblzma produce the same output on big endian 1781ad8388SMartin Matuska // systems that it does on little endian systems. lz_encoder.c 1881ad8388SMartin Matuska // takes care of including the actual table. 
19ca6a6373SXin LI lzma_attr_visibility_hidden 2081ad8388SMartin Matuska extern const uint32_t lzma_lz_hash_table[256]; 2181ad8388SMartin Matuska # define hash_table lzma_lz_hash_table 2281ad8388SMartin Matuska #else 2381ad8388SMartin Matuska # include "check.h" 2481ad8388SMartin Matuska # define hash_table lzma_crc32_table[0] 2581ad8388SMartin Matuska #endif 2681ad8388SMartin Matuska 2781ad8388SMartin Matuska #define HASH_2_SIZE (UINT32_C(1) << 10) 2881ad8388SMartin Matuska #define HASH_3_SIZE (UINT32_C(1) << 16) 2981ad8388SMartin Matuska #define HASH_4_SIZE (UINT32_C(1) << 20) 3081ad8388SMartin Matuska 3181ad8388SMartin Matuska #define HASH_2_MASK (HASH_2_SIZE - 1) 3281ad8388SMartin Matuska #define HASH_3_MASK (HASH_3_SIZE - 1) 3381ad8388SMartin Matuska #define HASH_4_MASK (HASH_4_SIZE - 1) 3481ad8388SMartin Matuska 3581ad8388SMartin Matuska #define FIX_3_HASH_SIZE (HASH_2_SIZE) 3681ad8388SMartin Matuska #define FIX_4_HASH_SIZE (HASH_2_SIZE + HASH_3_SIZE) 3781ad8388SMartin Matuska #define FIX_5_HASH_SIZE (HASH_2_SIZE + HASH_3_SIZE + HASH_4_SIZE) 3881ad8388SMartin Matuska 3981ad8388SMartin Matuska // Endianness doesn't matter in hash_2_calc() (no effect on the output). 
// hash_2_calc(): declares hash_value built from the two bytes cur[0] and
// cur[1]. The portable variant places cur[0] in the low byte; the fast
// variant delegates to read16ne(), which is defined elsewhere.
//
// All of the *_calc() macros in this file expand to declarations in the
// invoking scope, so at most one of them can be used per block. They
// expect a byte pointer (or array) named cur to be in scope; the macros
// that use mf->hash_mask also expect a pointer named mf.
#ifdef TUKLIB_FAST_UNALIGNED_ACCESS
#	define hash_2_calc() \
		const uint32_t hash_value = read16ne(cur)
#else
#	define hash_2_calc() \
		const uint32_t hash_value \
			= (uint32_t)(cur[0]) | ((uint32_t)(cur[1]) << 8)
#endif

// hash_3_calc(): declares
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp limited with HASH_2_MASK
//   hash_value    temp XOR (cur[2] << 8), limited with mf->hash_mask
#define hash_3_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & mf->hash_mask

// hash_4_calc(): declares temp and hash_2_value as in hash_3_calc(), plus
//   hash_3_value  temp XOR (cur[2] << 8), limited with HASH_3_MASK
//   hash_value    the unmasked 3-byte value XOR (hash_table[cur[3]] << 5),
//                 limited with mf->hash_mask
#define hash_4_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	const uint32_t hash_value = (temp ^ ((uint32_t)(cur[2]) << 8) \
			^ (hash_table[cur[3]] << 5)) & mf->hash_mask


// The following are not currently used.

// hash_5_calc(): declares
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp limited with HASH_2_MASK
//   hash_3_value  temp XOR (cur[2] << 8), limited with HASH_3_MASK
//   hash_4_value  the unmasked 3-byte value XOR (hash_table[cur[3]] << 5),
//                 limited with HASH_4_MASK
//   hash_value    the unmasked 4-byte value XOR (hash_table[cur[4]] << 3),
//                 limited with mf->hash_mask
//
// hash_4_value is deliberately non-const: hash_value has to be derived
// from its unmasked form, so the HASH_4_MASK is applied last.
//
// Like every *_calc() macro here, this expands to declarations in the
// invoking scope and expects cur (bytes), mf (pointer with a hash_mask
// member), and hash_table to be visible there.
#define hash_5_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	uint32_t hash_4_value = (temp ^ ((uint32_t)(cur[2]) << 8) \
			^ (hash_table[cur[3]] << 5)); \
	const uint32_t hash_value \
			= (hash_4_value ^ (hash_table[cur[4]] << 3)) \
				& mf->hash_mask; \
	hash_4_value &= HASH_4_MASK

// Disabled variant of hash_zip_calc() that combines the three input bytes
// in a different order than the active definition below.
/*
#define hash_zip_calc() \
	const uint32_t hash_value \
			= (((uint32_t)(cur[0]) | ((uint32_t)(cur[1]) << 8)) \
				^ hash_table[cur[2]]) & 0xFFFF
*/

// hash_zip_calc(): declares a 16-bit hash_value computed from cur[0..2]:
// (cur[2] | cur[0] << 8) XOR hash_table[cur[1]], keeping the low 16 bits.
#define hash_zip_calc() \
	const uint32_t hash_value \
			= (((uint32_t)(cur[2]) | ((uint32_t)(cur[0]) << 8)) \
				^ hash_table[cur[1]]) & 0xFFFF

// mt_hash_2_calc(): declares only hash_2_value, computed exactly like the
// hash_2_value of hash_3_calc().
#define mt_hash_2_calc() \
	const uint32_t hash_2_value \
			= (hash_table[cur[0]] ^ cur[1]) & HASH_2_MASK

// mt_hash_3_calc(): declares temp, hash_2_value, and hash_3_value; unlike
// hash_3_calc() it does not use mf->hash_mask.
#define mt_hash_3_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK

// mt_hash_4_calc(): declares temp, hash_2_value, hash_3_value, and
// hash_4_value; every result is limited with a fixed HASH_n_MASK.
#define mt_hash_4_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	const uint32_t hash_4_value = (temp ^ ((uint32_t)(cur[2]) << 8) ^ \
			(hash_table[cur[3]] << 5)) & HASH_4_MASK

#endif