181ad8388SMartin Matuska /////////////////////////////////////////////////////////////////////////////// 281ad8388SMartin Matuska // 381ad8388SMartin Matuska /// \file lz_encoder_hash.h 481ad8388SMartin Matuska /// \brief Hash macros for match finders 581ad8388SMartin Matuska // 681ad8388SMartin Matuska // Author: Igor Pavlov 781ad8388SMartin Matuska // 82f9cd13dSXin LI // This file has been put into the public domain. 92f9cd13dSXin LI // You can do whatever you want with this file. 102f9cd13dSXin LI // 1181ad8388SMartin Matuska /////////////////////////////////////////////////////////////////////////////// 1281ad8388SMartin Matuska 1381ad8388SMartin Matuska #ifndef LZMA_LZ_ENCODER_HASH_H 1481ad8388SMartin Matuska #define LZMA_LZ_ENCODER_HASH_H 1581ad8388SMartin Matuska 1681ad8388SMartin Matuska #if defined(WORDS_BIGENDIAN) && !defined(HAVE_SMALL) 1781ad8388SMartin Matuska // This is to make liblzma produce the same output on big endian 1881ad8388SMartin Matuska // systems that it does on little endian systems. lz_encoder.c 1981ad8388SMartin Matuska // takes care of including the actual table. 
20ca6a6373SXin LI lzma_attr_visibility_hidden 2181ad8388SMartin Matuska extern const uint32_t lzma_lz_hash_table[256]; 2281ad8388SMartin Matuska # define hash_table lzma_lz_hash_table 2381ad8388SMartin Matuska #else 2481ad8388SMartin Matuska # include "check.h" 2581ad8388SMartin Matuska # define hash_table lzma_crc32_table[0] 2681ad8388SMartin Matuska #endif 2781ad8388SMartin Matuska 2881ad8388SMartin Matuska #define HASH_2_SIZE (UINT32_C(1) << 10) 2981ad8388SMartin Matuska #define HASH_3_SIZE (UINT32_C(1) << 16) 3081ad8388SMartin Matuska #define HASH_4_SIZE (UINT32_C(1) << 20) 3181ad8388SMartin Matuska 3281ad8388SMartin Matuska #define HASH_2_MASK (HASH_2_SIZE - 1) 3381ad8388SMartin Matuska #define HASH_3_MASK (HASH_3_SIZE - 1) 3481ad8388SMartin Matuska #define HASH_4_MASK (HASH_4_SIZE - 1) 3581ad8388SMartin Matuska 3681ad8388SMartin Matuska #define FIX_3_HASH_SIZE (HASH_2_SIZE) 3781ad8388SMartin Matuska #define FIX_4_HASH_SIZE (HASH_2_SIZE + HASH_3_SIZE) 3881ad8388SMartin Matuska #define FIX_5_HASH_SIZE (HASH_2_SIZE + HASH_3_SIZE + HASH_4_SIZE) 3981ad8388SMartin Matuska 4081ad8388SMartin Matuska // Endianness doesn't matter in hash_2_calc() (no effect on the output). 
// hash_2_calc() declares hash_value in the expanding scope as a 16-bit
// value built from cur[0] and cur[1]. With TUKLIB_FAST_UNALIGNED_ACCESS
// the two bytes are fetched with read16ne(); otherwise cur[0] becomes the
// low byte and cur[1] the high byte.
#ifdef TUKLIB_FAST_UNALIGNED_ACCESS
#	define hash_2_calc() \
		const uint32_t hash_value = read16ne(cur)
#else
#	define hash_2_calc() \
		const uint32_t hash_value \
			= (uint32_t)(cur[0]) | ((uint32_t)(cur[1]) << 8)
#endif

// hash_3_calc() declares temp, hash_2_value and hash_value in the
// expanding scope. It reads cur[0..2], hash_table and mf->hash_mask.
// hash_2_value is limited with HASH_2_MASK and hash_value with
// mf->hash_mask.
#define hash_3_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & mf->hash_mask

// hash_4_calc() declares temp, hash_2_value, hash_3_value and hash_value
// in the expanding scope. It reads cur[0..3], hash_table and
// mf->hash_mask. hash_2_value and hash_3_value are limited with
// HASH_2_MASK and HASH_3_MASK; hash_value is limited with mf->hash_mask.
#define hash_4_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	const uint32_t hash_value = (temp ^ ((uint32_t)(cur[2]) << 8) \
			^ (hash_table[cur[3]] << 5)) & mf->hash_mask


// The following are not currently used.
6681ad8388SMartin Matuska 6781ad8388SMartin Matuska #define hash_5_calc() \ 6881ad8388SMartin Matuska const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \ 6981ad8388SMartin Matuska const uint32_t hash_2_value = temp & HASH_2_MASK; \ 7081ad8388SMartin Matuska const uint32_t hash_3_value \ 7181ad8388SMartin Matuska = (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \ 7281ad8388SMartin Matuska uint32_t hash_4_value = (temp ^ ((uint32_t)(cur[2]) << 8) ^ \ 7381ad8388SMartin Matuska ^ hash_table[cur[3]] << 5); \ 7481ad8388SMartin Matuska const uint32_t hash_value \ 7581ad8388SMartin Matuska = (hash_4_value ^ (hash_table[cur[4]] << 3)) \ 7681ad8388SMartin Matuska & mf->hash_mask; \ 7781ad8388SMartin Matuska hash_4_value &= HASH_4_MASK 7881ad8388SMartin Matuska 7981ad8388SMartin Matuska /* 8081ad8388SMartin Matuska #define hash_zip_calc() \ 8181ad8388SMartin Matuska const uint32_t hash_value \ 8281ad8388SMartin Matuska = (((uint32_t)(cur[0]) | ((uint32_t)(cur[1]) << 8)) \ 8381ad8388SMartin Matuska ^ hash_table[cur[2]]) & 0xFFFF 8481ad8388SMartin Matuska */ 8581ad8388SMartin Matuska 8681ad8388SMartin Matuska #define hash_zip_calc() \ 8781ad8388SMartin Matuska const uint32_t hash_value \ 8881ad8388SMartin Matuska = (((uint32_t)(cur[2]) | ((uint32_t)(cur[0]) << 8)) \ 8981ad8388SMartin Matuska ^ hash_table[cur[1]]) & 0xFFFF 9081ad8388SMartin Matuska 9181ad8388SMartin Matuska #define mt_hash_2_calc() \ 9281ad8388SMartin Matuska const uint32_t hash_2_value \ 9381ad8388SMartin Matuska = (hash_table[cur[0]] ^ cur[1]) & HASH_2_MASK 9481ad8388SMartin Matuska 9581ad8388SMartin Matuska #define mt_hash_3_calc() \ 9681ad8388SMartin Matuska const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \ 9781ad8388SMartin Matuska const uint32_t hash_2_value = temp & HASH_2_MASK; \ 9881ad8388SMartin Matuska const uint32_t hash_3_value \ 9981ad8388SMartin Matuska = (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK 10081ad8388SMartin Matuska 10181ad8388SMartin Matuska #define mt_hash_4_calc() \ 
10281ad8388SMartin Matuska const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \ 10381ad8388SMartin Matuska const uint32_t hash_2_value = temp & HASH_2_MASK; \ 10481ad8388SMartin Matuska const uint32_t hash_3_value \ 10581ad8388SMartin Matuska = (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \ 10681ad8388SMartin Matuska const uint32_t hash_4_value = (temp ^ ((uint32_t)(cur[2]) << 8) ^ \ 10781ad8388SMartin Matuska (hash_table[cur[3]] << 5)) & HASH_4_MASK 10881ad8388SMartin Matuska 10981ad8388SMartin Matuska #endif 110