p7zip/CPP/7zip/Compress/Lzham/lzhamcomp/lzham_match_accel.h
2017-10-11 12:35:36 +02:00

165 lines
5.7 KiB
C++

// File: lzham_match_accel.h
// See Copyright Notice and license at the end of include/lzham.h
#pragma once
#include "lzham_lzbase.h"
#include "lzham_threading.h"
namespace lzham
{
const uint cMatchAccelMaxSupportedProbes = 128;
const uint cMatchAccelMaxSupportedThreads = 32;
struct node
{
uint m_left;
uint m_right;
};
LZHAM_DEFINE_BITWISE_MOVABLE(node);
#pragma pack(push, 1)
struct dict_match
{
uint m_dist;
uint16 m_len;
inline uint get_dist() const { return m_dist & 0x7FFFFFFF; }
inline uint get_len() const { return m_len + 2; }
inline bool is_last() const { return (int)m_dist < 0; }
};
#pragma pack(pop)
LZHAM_DEFINE_BITWISE_MOVABLE(dict_match);
class search_accelerator
{
LZHAM_NO_COPY_OR_ASSIGNMENT_OP(search_accelerator);
public:
search_accelerator(lzham_malloc_context malloc_context);
lzham_malloc_context get_malloc_context() const { return m_malloc_context; }
// If all_matches is true, the match finder returns all found matches with no filtering.
// Otherwise, the finder will tend to return lists of matches with mostly unique lengths.
// For each length, it will discard matches with worse distances (in the coding sense).
enum
{
cFlagDeterministic = 1,
cFlagLen2Matches = 2,
cFlagHash24 = 4
};
bool init(CLZBase* pLZBase, task_pool* pPool, uint max_helper_threads, uint max_dict_size, uint max_matches, bool all_matches, uint max_probes, uint flags);
void reset();
void flush();
inline uint get_max_dict_size() const { return m_max_dict_size; }
inline uint get_max_dict_size_mask() const { return m_max_dict_size_mask; }
inline uint get_cur_dict_size() const { return m_cur_dict_size; }
inline uint get_lookahead_pos() const { return m_lookahead_pos; }
inline uint get_lookahead_size() const { return m_lookahead_size; }
inline uint get_char(int delta_pos) const { return m_dict[(m_lookahead_pos + delta_pos) & m_max_dict_size_mask]; }
inline uint get_char(uint cur_dict_pos, int delta_pos) const { return m_dict[(cur_dict_pos + delta_pos) & m_max_dict_size_mask]; }
inline const uint8* get_ptr(uint pos) const { return &m_dict[pos]; }
uint get_max_helper_threads() const { return m_max_helper_threads; }
inline uint operator[](uint pos) const { return m_dict[pos]; }
uint get_max_add_bytes() const;
bool add_bytes_begin(uint num_bytes, const uint8* pBytes);
inline atomic32_t get_num_completed_helper_threads() const { return m_num_completed_helper_threads; }
void add_bytes_end();
// Returns the lookahead's raw position/size/dict_size at the time add_bytes_begin() is called.
inline uint get_fill_lookahead_pos() const { return m_fill_lookahead_pos; }
inline uint get_fill_lookahead_size() const { return m_fill_lookahead_size; }
inline uint get_fill_dict_size() const { return m_fill_dict_size; }
uint get_len2_match(uint lookahead_ofs);
dict_match* find_matches(uint lookahead_ofs, bool spin = true);
void advance_bytes(uint num_bytes);
LZHAM_FORCE_INLINE uint get_match_len(uint lookahead_ofs, int dist, uint max_match_len, uint start_match_len = 0) const
{
LZHAM_ASSERT(lookahead_ofs < m_lookahead_size);
LZHAM_ASSERT(start_match_len <= max_match_len);
LZHAM_ASSERT(max_match_len <= (get_lookahead_size() - lookahead_ofs));
const int find_dict_size = m_cur_dict_size + lookahead_ofs;
if (dist > find_dict_size)
return 0;
const uint comp_pos = static_cast<uint>((m_lookahead_pos + lookahead_ofs - dist) & m_max_dict_size_mask);
const uint lookahead_pos = (m_lookahead_pos + lookahead_ofs) & m_max_dict_size_mask;
const uint8* pComp = &m_dict[comp_pos];
const uint8* pLookahead = &m_dict[lookahead_pos];
uint match_len;
for (match_len = start_match_len; match_len < max_match_len; match_len++)
if (pComp[match_len] != pLookahead[match_len])
break;
return match_len;
}
public:
lzham_malloc_context m_malloc_context;
CLZBase* m_pLZBase;
task_pool* m_pTask_pool;
uint m_max_helper_threads;
uint m_max_dict_size;
uint m_max_dict_size_mask;
uint m_lookahead_pos;
uint m_lookahead_size;
uint m_cur_dict_size;
lzham::vector<uint8> m_dict;
lzham::vector<uint> m_hash;
lzham::vector<node> m_nodes;
lzham::vector<dict_match> m_matches;
lzham::vector<atomic32_t> m_match_refs;
enum { cDigramHashSize = 4096 };
lzham::vector<uint> m_digram_hash;
lzham::vector<uint> m_digram_next;
lzham::vector<uint> m_thread_dict_offsets[cMatchAccelMaxSupportedThreads];
uint m_fill_lookahead_pos;
uint m_fill_lookahead_size;
uint m_fill_dict_size;
uint m_max_probes;
uint m_max_matches;
bool m_all_matches;
bool m_deterministic;
bool m_len2_matches;
bool m_hash24;
volatile atomic32_t m_next_match_ref;
volatile atomic32_t m_num_completed_helper_threads;
void find_all_matches_callback_st(uint64 data, void* pData_ptr);
void find_all_matches_callback_mt(uint64 data, void* pData_ptr);
bool find_all_matches(uint num_bytes);
bool find_len2_matches();
};
} // namespace lzham