///////////////////////////////////////////////////////////////////////////////
//
/// \file       lz_encoder_hash.h
/// \brief      Hash macros for match finders
//
//  Author:     Igor Pavlov
//
//  This file has been put into the public domain.
//  You can do whatever you want with this file.
//
///////////////////////////////////////////////////////////////////////////////
1281ad8388SMartin Matuska 
1381ad8388SMartin Matuska #ifndef LZMA_LZ_ENCODER_HASH_H
1481ad8388SMartin Matuska #define LZMA_LZ_ENCODER_HASH_H
1581ad8388SMartin Matuska 
1681ad8388SMartin Matuska #if defined(WORDS_BIGENDIAN) && !defined(HAVE_SMALL)
1781ad8388SMartin Matuska 	// This is to make liblzma produce the same output on big endian
1881ad8388SMartin Matuska 	// systems that it does on little endian systems. lz_encoder.c
1981ad8388SMartin Matuska 	// takes care of including the actual table.
20ca6a6373SXin LI 	lzma_attr_visibility_hidden
2181ad8388SMartin Matuska 	extern const uint32_t lzma_lz_hash_table[256];
2281ad8388SMartin Matuska #	define hash_table lzma_lz_hash_table
2381ad8388SMartin Matuska #else
2481ad8388SMartin Matuska #	include "check.h"
2581ad8388SMartin Matuska #	define hash_table lzma_crc32_table[0]
2681ad8388SMartin Matuska #endif
2781ad8388SMartin Matuska 
// Number of entries in the 2-, 3- and 4-byte hash levels. Each one is a
// power of two so that the matching mask below can be used to reduce a
// hash to a valid index.
#define HASH_2_SIZE (UINT32_C(1) << 10)
#define HASH_3_SIZE (UINT32_C(1) << 16)
#define HASH_4_SIZE (UINT32_C(1) << 20)

// Index masks: size minus one, i.e. all bits below the size bit set.
#define HASH_2_MASK (HASH_2_SIZE - 1)
#define HASH_3_MASK (HASH_3_SIZE - 1)
#define HASH_4_MASK (HASH_4_SIZE - 1)

// Cumulative sizes: FIX_N_HASH_SIZE is the sum of HASH_k_SIZE for
// k = 2 .. N-1.
// NOTE(review): presumably the offset of the main N-byte hash behind the
// smaller fixed-size levels -- confirm against the match finders.
#define FIX_3_HASH_SIZE (HASH_2_SIZE)
#define FIX_4_HASH_SIZE (HASH_2_SIZE + HASH_3_SIZE)
#define FIX_5_HASH_SIZE (HASH_2_SIZE + HASH_3_SIZE + HASH_4_SIZE)
3981ad8388SMartin Matuska 
// hash_2_calc() declares `const uint32_t hash_value` in the scope where it
// is expanded. It expects `cur` to be in scope and to give access to at
// least two bytes. The portable variant combines cur[0] (low byte) and
// cur[1] (high byte) into a 16-bit value.
//
// Endianness doesn't matter in hash_2_calc() (no effect on the output).
//
// NOTE(review): read16ne() is defined elsewhere; presumably it is a
// native-endian 16-bit load from `cur` -- confirm.
#ifdef TUKLIB_FAST_UNALIGNED_ACCESS
#	define hash_2_calc() \
		const uint32_t hash_value = read16ne(cur)
#else
#	define hash_2_calc() \
		const uint32_t hash_value \
			= (uint32_t)(cur[0]) | ((uint32_t)(cur[1]) << 8)
#endif
4981ad8388SMartin Matuska 
// hash_3_calc() declares three variables in the scope where it is expanded:
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp reduced with HASH_2_MASK
//   hash_value    temp XOR (cur[2] << 8), reduced with mf->hash_mask
//
// It expects `cur` (access to at least three bytes), `hash_table` and
// `mf` (pointer to an object with a `hash_mask` member) to be in scope.
// The expansion is a sequence of declarations, so it cannot be wrapped in
// do { } while (0) and may be used only once per scope.
#define hash_3_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & mf->hash_mask
5581ad8388SMartin Matuska 
// hash_4_calc() declares four variables in the scope where it is expanded:
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp reduced with HASH_2_MASK
//   hash_3_value  temp XOR (cur[2] << 8), reduced with HASH_3_MASK
//   hash_value    temp XOR (cur[2] << 8) XOR (hash_table[cur[3]] << 5),
//                 reduced with mf->hash_mask
//
// It expects `cur` (access to at least four bytes), `hash_table` and
// `mf` (pointer to an object with a `hash_mask` member) to be in scope.
// The expansion is a sequence of declarations, so it may be used only
// once per scope.
#define hash_4_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	const uint32_t hash_value = (temp ^ ((uint32_t)(cur[2]) << 8) \
			^ (hash_table[cur[3]] << 5)) & mf->hash_mask
6381ad8388SMartin Matuska 
6481ad8388SMartin Matuska 
// The following are not currently used.
6681ad8388SMartin Matuska 
// hash_5_calc() declares five variables in the scope where it is expanded:
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp reduced with HASH_2_MASK
//   hash_3_value  temp XOR (cur[2] << 8), reduced with HASH_3_MASK
//   hash_4_value  temp XOR (cur[2] << 8) XOR (hash_table[cur[3]] << 5),
//                 reduced with HASH_4_MASK
//   hash_value    the unreduced hash_4_value XOR (hash_table[cur[4]] << 3),
//                 reduced with mf->hash_mask
//
// hash_4_value is deliberately non-const: hash_value has to be derived
// from it before it is masked, so the masking is the last statement.
//
// It expects `cur` (access to at least five bytes), `hash_table` and
// `mf` (pointer to an object with a `hash_mask` member) to be in scope.
// The expansion is a sequence of declarations, so it may be used only
// once per scope.
//
// The hash_4_value expression used to contain a doubled XOR operator
// ("^ ^") across a line continuation, which made every expansion of this
// macro a syntax error. The term is now written the same way as in
// hash_4_calc() and mt_hash_4_calc().
#define hash_5_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	uint32_t hash_4_value = (temp ^ ((uint32_t)(cur[2]) << 8) \
			^ (hash_table[cur[3]] << 5)); \
	const uint32_t hash_value \
			= (hash_4_value ^ (hash_table[cur[4]] << 3)) \
				& mf->hash_mask; \
	hash_4_value &= HASH_4_MASK
7881ad8388SMartin Matuska 
/*
#define hash_zip_calc() \
	const uint32_t hash_value \
			= (((uint32_t)(cur[0]) | ((uint32_t)(cur[1]) << 8)) \
				^ hash_table[cur[2]]) & 0xFFFF
*/
8581ad8388SMartin Matuska 
// hash_zip_calc() declares `const uint32_t hash_value` in the scope where
// it is expanded: cur[2] in the low byte and cur[0] in the next byte,
// XORed with hash_table[cur[1]], keeping only the low 16 bits.
//
// It expects `cur` (access to at least three bytes) and `hash_table` to
// be in scope.
#define hash_zip_calc() \
	const uint32_t hash_value \
			= (((uint32_t)(cur[2]) | ((uint32_t)(cur[0]) << 8)) \
				^ hash_table[cur[1]]) & 0xFFFF
9081ad8388SMartin Matuska 
// mt_hash_2_calc() declares `const uint32_t hash_2_value` in the scope
// where it is expanded: hash_table[cur[0]] XOR cur[1], reduced with
// HASH_2_MASK.
//
// It expects `cur` (access to at least two bytes) and `hash_table` to be
// in scope.
#define mt_hash_2_calc() \
	const uint32_t hash_2_value \
			= (hash_table[cur[0]] ^ cur[1]) & HASH_2_MASK
9481ad8388SMartin Matuska 
// mt_hash_3_calc() declares three variables in the scope where it is
// expanded:
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp reduced with HASH_2_MASK
//   hash_3_value  temp XOR (cur[2] << 8), reduced with HASH_3_MASK
//
// Unlike hash_3_calc(), nothing is read through `mf`; only `cur` (access
// to at least three bytes) and `hash_table` have to be in scope.
#define mt_hash_3_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK
10081ad8388SMartin Matuska 
// mt_hash_4_calc() declares four variables in the scope where it is
// expanded:
//   temp          hash_table[cur[0]] XOR cur[1]
//   hash_2_value  temp reduced with HASH_2_MASK
//   hash_3_value  temp XOR (cur[2] << 8), reduced with HASH_3_MASK
//   hash_4_value  temp XOR (cur[2] << 8) XOR (hash_table[cur[3]] << 5),
//                 reduced with HASH_4_MASK
//
// Unlike hash_4_calc(), nothing is read through `mf`; only `cur` (access
// to at least four bytes) and `hash_table` have to be in scope.
#define mt_hash_4_calc() \
	const uint32_t temp = hash_table[cur[0]] ^ cur[1]; \
	const uint32_t hash_2_value = temp & HASH_2_MASK; \
	const uint32_t hash_3_value \
			= (temp ^ ((uint32_t)(cur[2]) << 8)) & HASH_3_MASK; \
	const uint32_t hash_4_value = (temp ^ ((uint32_t)(cur[2]) << 8) ^ \
			(hash_table[cur[3]] << 5)) & HASH_4_MASK
10881ad8388SMartin Matuska 
10981ad8388SMartin Matuska #endif
110