2017-06-10 02:03:41 +02:00
|
|
|
#include "igzip_lib.h"
|
|
|
|
#include "huffman.h"
|
|
|
|
#include "encode_df.h"
|
|
|
|
#include "igzip_level_buf_structs.h"
|
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
extern uint64_t gen_icf_map_lh1(struct isal_zstream *, struct deflate_icf *, uint32_t);
|
2018-10-02 23:01:57 +02:00
|
|
|
extern void set_long_icf_fg(uint8_t *, uint64_t, uint64_t, struct deflate_icf *);
|
2017-06-10 02:03:41 +02:00
|
|
|
extern void isal_deflate_icf_body_lvl1(struct isal_zstream *);
|
2017-12-05 15:43:04 +01:00
|
|
|
extern void isal_deflate_icf_body_lvl2(struct isal_zstream *);
|
2018-02-08 22:59:36 +01:00
|
|
|
extern void isal_deflate_icf_body_lvl3(struct isal_zstream *);
|
2017-06-10 02:03:41 +02:00
|
|
|
/*
|
|
|
|
*************************************************************
|
|
|
|
* Helper functions
|
|
|
|
************************************************************
|
|
|
|
*/
|
|
|
|
static inline void write_deflate_icf(struct deflate_icf *icf, uint32_t lit_len,
|
|
|
|
uint32_t lit_dist, uint32_t extra_bits)
|
|
|
|
{
|
|
|
|
/* icf->lit_len = lit_len; */
|
|
|
|
/* icf->lit_dist = lit_dist; */
|
|
|
|
/* icf->dist_extra = extra_bits; */
|
|
|
|
|
|
|
|
*(uint32_t *) icf = lit_len | (lit_dist << LIT_LEN_BIT_COUNT)
|
|
|
|
| (extra_bits << (LIT_LEN_BIT_COUNT + DIST_LIT_BIT_COUNT));
|
|
|
|
}
|
|
|
|
|
2018-10-02 23:01:57 +02:00
|
|
|
void set_long_icf_fg_base(uint8_t * next_in, uint64_t processed, uint64_t input_size,
|
|
|
|
struct deflate_icf *match_lookup)
|
2017-06-10 02:03:41 +02:00
|
|
|
{
|
2018-10-02 23:01:57 +02:00
|
|
|
uint8_t *end_processed = next_in + processed;
|
|
|
|
uint8_t *end_in = next_in + input_size;
|
2017-06-10 02:03:41 +02:00
|
|
|
uint32_t dist_code, dist_extra, dist, len;
|
|
|
|
uint32_t match_len;
|
|
|
|
uint32_t dist_start[] = {
|
|
|
|
0x0001, 0x0002, 0x0003, 0x0004, 0x0005, 0x0007, 0x0009, 0x000d,
|
|
|
|
0x0011, 0x0019, 0x0021, 0x0031, 0x0041, 0x0061, 0x0081, 0x00c1,
|
|
|
|
0x0101, 0x0181, 0x0201, 0x0301, 0x0401, 0x0601, 0x0801, 0x0c01,
|
|
|
|
0x1001, 0x1801, 0x2001, 0x3001, 0x4001, 0x6001, 0x0000, 0x0000
|
|
|
|
};
|
|
|
|
|
2018-10-02 23:01:57 +02:00
|
|
|
if (end_in > end_processed + ISAL_LOOK_AHEAD)
|
|
|
|
end_in = end_processed + ISAL_LOOK_AHEAD;
|
|
|
|
|
|
|
|
while (next_in < end_processed) {
|
2017-06-10 02:03:41 +02:00
|
|
|
dist_code = match_lookup->lit_dist;
|
|
|
|
dist_extra = match_lookup->dist_extra;
|
|
|
|
dist = dist_start[dist_code] + dist_extra;
|
|
|
|
len = match_lookup->lit_len;
|
|
|
|
if (len >= 8 + LEN_OFFSET) {
|
2018-10-02 23:01:57 +02:00
|
|
|
match_len = compare((next_in + 8) - dist, next_in + 8,
|
|
|
|
end_in - (next_in + 8)) + LEN_OFFSET + 8;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
while (match_len > match_lookup->lit_len
|
|
|
|
&& match_len >= LEN_OFFSET + SHORTEST_MATCH) {
|
2018-09-27 22:20:13 +02:00
|
|
|
write_deflate_icf(match_lookup,
|
|
|
|
match_len > LEN_MAX ? LEN_MAX : match_len,
|
|
|
|
dist_code, dist_extra);
|
2017-06-10 02:03:41 +02:00
|
|
|
match_lookup++;
|
|
|
|
next_in++;
|
|
|
|
match_len--;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
match_lookup++;
|
|
|
|
next_in++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
*************************************************************
|
|
|
|
* Methods for generating one pass match lookup table
|
|
|
|
************************************************************
|
|
|
|
*/
|
2018-08-17 02:02:59 +02:00
|
|
|
uint64_t gen_icf_map_h1_base(struct isal_zstream *stream,
|
|
|
|
struct deflate_icf *matches_icf_lookup, uint64_t input_size)
|
2017-06-10 02:03:41 +02:00
|
|
|
{
|
|
|
|
|
|
|
|
uint32_t dist, len, extra_bits;
|
|
|
|
uint8_t *next_in = stream->next_in, *end_in = stream->next_in + input_size;
|
|
|
|
uint8_t *file_start = stream->next_in - stream->total_in;
|
|
|
|
uint32_t hash;
|
|
|
|
uint64_t next_bytes, match_bytes;
|
|
|
|
uint64_t match;
|
|
|
|
struct level_buf *level_buf = (struct level_buf *)stream->level_buf;
|
2017-11-30 21:07:22 +01:00
|
|
|
uint16_t *hash_table = level_buf->hash_map.hash_table;
|
2018-06-07 00:48:40 +02:00
|
|
|
uint32_t hist_size = stream->internal_state.dist_mask;
|
2018-06-07 01:33:19 +02:00
|
|
|
uint32_t hash_mask = stream->internal_state.hash_mask;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
if (input_size < ISAL_LOOK_AHEAD)
|
2018-08-17 02:02:59 +02:00
|
|
|
return 0;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-08-17 20:31:50 +02:00
|
|
|
if (stream->internal_state.has_hist == IGZIP_NO_HIST) {
|
|
|
|
matches_icf_lookup->lit_len = *next_in;
|
|
|
|
matches_icf_lookup->lit_dist = 0x1e;
|
|
|
|
matches_icf_lookup->dist_extra = 0;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-06-07 01:33:19 +02:00
|
|
|
hash = compute_hash(*(uint32_t *) next_in) & hash_mask;
|
2018-08-17 20:31:50 +02:00
|
|
|
hash_table[hash] = (uint64_t) (next_in - file_start);
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-08-17 20:31:50 +02:00
|
|
|
next_in++;
|
|
|
|
matches_icf_lookup++;
|
|
|
|
stream->internal_state.has_hist = IGZIP_HIST;
|
|
|
|
}
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
while (next_in < end_in - ISAL_LOOK_AHEAD) {
|
2018-06-07 01:33:19 +02:00
|
|
|
hash = compute_hash(*(uint32_t *) next_in) & hash_mask;
|
2017-06-10 02:03:41 +02:00
|
|
|
dist = (next_in - file_start - hash_table[hash]);
|
2018-06-07 00:48:40 +02:00
|
|
|
dist = ((dist - 1) & hist_size) + 1;
|
2017-06-10 02:03:41 +02:00
|
|
|
hash_table[hash] = (uint64_t) (next_in - file_start);
|
|
|
|
|
|
|
|
match_bytes = *(uint64_t *) (next_in - dist);
|
|
|
|
next_bytes = *(uint64_t *) next_in;
|
|
|
|
match = next_bytes ^ match_bytes;
|
|
|
|
|
2018-05-23 22:36:39 +02:00
|
|
|
len = tzbytecnt(match);
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
if (len >= SHORTEST_MATCH) {
|
|
|
|
len += LEN_OFFSET;
|
|
|
|
get_dist_icf_code(dist, &dist, &extra_bits);
|
|
|
|
write_deflate_icf(matches_icf_lookup, len, dist, extra_bits);
|
|
|
|
} else {
|
|
|
|
write_deflate_icf(matches_icf_lookup, *next_in, 0x1e, 0);
|
|
|
|
}
|
|
|
|
|
|
|
|
next_in++;
|
|
|
|
matches_icf_lookup++;
|
|
|
|
}
|
2018-08-17 02:02:59 +02:00
|
|
|
return next_in - stream->next_in;
|
2017-06-10 02:03:41 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
*************************************************************
|
|
|
|
* One pass methods for parsing provided match lookup table
|
|
|
|
************************************************************
|
|
|
|
*/
|
2018-03-12 17:28:34 +01:00
|
|
|
static struct deflate_icf *compress_icf_map_g(struct isal_zstream *stream,
|
|
|
|
struct deflate_icf *matches_next,
|
|
|
|
struct deflate_icf *matches_end)
|
2017-06-10 02:03:41 +02:00
|
|
|
{
|
|
|
|
uint32_t lit_len, lit_len2, dist;
|
|
|
|
uint64_t code;
|
|
|
|
struct isal_zstate *state = &stream->internal_state;
|
|
|
|
struct level_buf *level_buf = (struct level_buf *)stream->level_buf;
|
|
|
|
struct deflate_icf *matches_start = matches_next;
|
|
|
|
struct deflate_icf *icf_buf_end =
|
|
|
|
level_buf->icf_buf_next +
|
|
|
|
level_buf->icf_buf_avail_out / sizeof(struct deflate_icf);
|
|
|
|
|
|
|
|
while (matches_next < matches_end - 1 && level_buf->icf_buf_next < icf_buf_end - 1) {
|
|
|
|
code = *(uint64_t *) matches_next;
|
|
|
|
lit_len = code & LIT_LEN_MASK;
|
|
|
|
lit_len2 = (code >> ICF_CODE_LEN) & LIT_LEN_MASK;
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.ll_hist[lit_len]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
if (lit_len >= LEN_START) {
|
|
|
|
*(uint32_t *) level_buf->icf_buf_next = code;
|
|
|
|
level_buf->icf_buf_next++;
|
|
|
|
|
|
|
|
dist = (code >> ICF_DIST_OFFSET) & DIST_LIT_MASK;
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.d_hist[dist]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
lit_len -= LEN_OFFSET;
|
|
|
|
matches_next += lit_len;
|
|
|
|
|
|
|
|
} else if (lit_len2 >= LEN_START) {
|
|
|
|
*(uint64_t *) level_buf->icf_buf_next = code;
|
|
|
|
level_buf->icf_buf_next += 2;
|
|
|
|
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.ll_hist[lit_len2]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
dist = (code >> (ICF_CODE_LEN + ICF_DIST_OFFSET)) & DIST_LIT_MASK;
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.d_hist[dist]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
lit_len2 -= LEN_OFFSET - 1;
|
|
|
|
matches_next += lit_len2;
|
|
|
|
|
|
|
|
} else {
|
|
|
|
code = ((lit_len2 + LIT_START) << ICF_DIST_OFFSET) | lit_len;
|
|
|
|
*(uint32_t *) level_buf->icf_buf_next = code;
|
|
|
|
level_buf->icf_buf_next++;
|
|
|
|
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.ll_hist[lit_len2]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
matches_next += 2;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
while (matches_next < matches_end && level_buf->icf_buf_next < icf_buf_end) {
|
|
|
|
code = *(uint32_t *) matches_next;
|
|
|
|
lit_len = code & LIT_LEN_MASK;
|
|
|
|
*(uint32_t *) level_buf->icf_buf_next = code;
|
|
|
|
level_buf->icf_buf_next++;
|
|
|
|
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.ll_hist[lit_len]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
if (lit_len >= LEN_START) {
|
|
|
|
dist = (code >> 10) & 0x1ff;
|
2017-11-30 17:58:30 +01:00
|
|
|
level_buf->hist.d_hist[dist]++;
|
2017-06-10 02:03:41 +02:00
|
|
|
lit_len -= LEN_OFFSET;
|
|
|
|
matches_next += lit_len;
|
|
|
|
} else {
|
|
|
|
matches_next++;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
level_buf->icf_buf_avail_out =
|
|
|
|
(icf_buf_end - level_buf->icf_buf_next) * sizeof(struct deflate_icf);
|
|
|
|
|
|
|
|
state->block_end += matches_next - matches_start;
|
|
|
|
if (matches_next > matches_end && matches_start < matches_end) {
|
|
|
|
stream->next_in += matches_next - matches_end;
|
|
|
|
stream->avail_in -= matches_next - matches_end;
|
|
|
|
stream->total_in += matches_next - matches_end;
|
|
|
|
}
|
|
|
|
|
|
|
|
return matches_next;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
/*
|
|
|
|
*************************************************************
|
|
|
|
* Compression functions combining different methods
|
|
|
|
************************************************************
|
|
|
|
*/
|
|
|
|
static inline void icf_body_next_state(struct isal_zstream *stream)
|
|
|
|
{
|
|
|
|
struct level_buf *level_buf = (struct level_buf *)stream->level_buf;
|
|
|
|
struct isal_zstate *state = &stream->internal_state;
|
|
|
|
|
|
|
|
if (level_buf->icf_buf_avail_out <= 0)
|
|
|
|
state->state = ZSTATE_CREATE_HDR;
|
|
|
|
|
|
|
|
else if (stream->avail_in <= ISAL_LOOK_AHEAD
|
|
|
|
&& (stream->end_of_stream || stream->flush != NO_FLUSH))
|
|
|
|
state->state = ZSTATE_FLUSH_READ_BUFFER;
|
|
|
|
}
|
|
|
|
|
|
|
|
void icf_body_hash1_fillgreedy_lazy(struct isal_zstream *stream)
|
|
|
|
{
|
|
|
|
struct deflate_icf *matches_icf, *matches_next_icf, *matches_end_icf;
|
|
|
|
struct deflate_icf *matches_icf_lookup;
|
|
|
|
struct level_buf *level_buf = (struct level_buf *)stream->level_buf;
|
2018-08-17 02:02:59 +02:00
|
|
|
uint32_t input_size, processed;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2017-11-30 21:07:22 +01:00
|
|
|
matches_icf = level_buf->hash_map.matches;
|
2017-06-10 02:03:41 +02:00
|
|
|
matches_icf_lookup = matches_icf;
|
2017-11-30 21:07:22 +01:00
|
|
|
matches_next_icf = level_buf->hash_map.matches_next;
|
|
|
|
matches_end_icf = level_buf->hash_map.matches_end;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
matches_next_icf = compress_icf_map_g(stream, matches_next_icf, matches_end_icf);
|
|
|
|
|
|
|
|
while (matches_next_icf >= matches_end_icf) {
|
|
|
|
input_size = MATCH_BUF_SIZE;
|
|
|
|
input_size = (input_size > stream->avail_in) ? stream->avail_in : input_size;
|
|
|
|
|
|
|
|
if (input_size <= ISAL_LOOK_AHEAD)
|
|
|
|
break;
|
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
processed = gen_icf_map_h1_base(stream, matches_icf_lookup, input_size);
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-10-02 23:01:57 +02:00
|
|
|
set_long_icf_fg(stream->next_in, processed, input_size, matches_icf_lookup);
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
stream->next_in += processed;
|
|
|
|
stream->avail_in -= processed;
|
|
|
|
stream->total_in += processed;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
matches_end_icf = matches_icf + processed;
|
2017-06-10 02:03:41 +02:00
|
|
|
matches_next_icf = compress_icf_map_g(stream, matches_icf, matches_end_icf);
|
|
|
|
}
|
|
|
|
|
2017-11-30 21:07:22 +01:00
|
|
|
level_buf->hash_map.matches_next = matches_next_icf;
|
|
|
|
level_buf->hash_map.matches_end = matches_end_icf;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
icf_body_next_state(stream);
|
|
|
|
}
|
|
|
|
|
|
|
|
void icf_body_lazyhash1_fillgreedy_greedy(struct isal_zstream *stream)
|
|
|
|
{
|
|
|
|
struct deflate_icf *matches_icf, *matches_next_icf, *matches_end_icf;
|
|
|
|
struct deflate_icf *matches_icf_lookup;
|
|
|
|
struct level_buf *level_buf = (struct level_buf *)stream->level_buf;
|
2018-08-17 02:02:59 +02:00
|
|
|
uint32_t input_size, processed;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2017-11-30 21:07:22 +01:00
|
|
|
matches_icf = level_buf->hash_map.matches;
|
2017-06-10 02:03:41 +02:00
|
|
|
matches_icf_lookup = matches_icf;
|
2017-11-30 21:07:22 +01:00
|
|
|
matches_next_icf = level_buf->hash_map.matches_next;
|
|
|
|
matches_end_icf = level_buf->hash_map.matches_end;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
matches_next_icf = compress_icf_map_g(stream, matches_next_icf, matches_end_icf);
|
|
|
|
|
|
|
|
while (matches_next_icf >= matches_end_icf) {
|
|
|
|
input_size = MATCH_BUF_SIZE;
|
|
|
|
input_size = (input_size > stream->avail_in) ? stream->avail_in : input_size;
|
|
|
|
|
|
|
|
if (input_size <= ISAL_LOOK_AHEAD)
|
|
|
|
break;
|
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
processed = gen_icf_map_lh1(stream, matches_icf_lookup, input_size);
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-10-02 23:01:57 +02:00
|
|
|
set_long_icf_fg(stream->next_in, processed, input_size, matches_icf_lookup);
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
stream->next_in += processed;
|
|
|
|
stream->avail_in -= processed;
|
|
|
|
stream->total_in += processed;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
2018-08-17 02:02:59 +02:00
|
|
|
matches_end_icf = matches_icf + processed;
|
2017-06-10 02:03:41 +02:00
|
|
|
matches_next_icf = compress_icf_map_g(stream, matches_icf, matches_end_icf);
|
|
|
|
}
|
|
|
|
|
2017-11-30 21:07:22 +01:00
|
|
|
level_buf->hash_map.matches_next = matches_next_icf;
|
|
|
|
level_buf->hash_map.matches_end = matches_end_icf;
|
2017-06-10 02:03:41 +02:00
|
|
|
|
|
|
|
icf_body_next_state(stream);
|
|
|
|
}
|
|
|
|
|
2018-02-08 22:59:36 +01:00
|
|
|
void isal_deflate_icf_body(struct isal_zstream *stream)
|
2017-06-10 02:03:41 +02:00
|
|
|
{
|
|
|
|
switch (stream->level) {
|
2017-12-05 15:43:04 +01:00
|
|
|
case 3:
|
2018-02-08 22:59:36 +01:00
|
|
|
isal_deflate_icf_body_lvl3(stream);
|
2017-06-10 02:03:41 +02:00
|
|
|
break;
|
2017-12-05 15:43:04 +01:00
|
|
|
case 2:
|
|
|
|
isal_deflate_icf_body_lvl2(stream);
|
|
|
|
break;
|
2017-06-10 02:03:41 +02:00
|
|
|
case 1:
|
|
|
|
default:
|
|
|
|
isal_deflate_icf_body_lvl1(stream);
|
|
|
|
}
|
|
|
|
}
|