2016-06-02 13:52:23 -07:00
|
|
|
#include <stdint.h>
|
|
|
|
#include "igzip_lib.h"
|
|
|
|
#include "huffman.h"
|
|
|
|
#include "huff_codes.h"
|
|
|
|
#include "bitbuf2.h"
|
|
|
|
|
|
|
|
extern const struct isal_hufftables hufftables_default;
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
static inline void update_state(struct isal_zstream *stream, uint8_t * start_in,
|
|
|
|
uint8_t * next_in, uint8_t * end_in)
|
2016-06-02 13:52:23 -07:00
|
|
|
{
|
|
|
|
struct isal_zstate *state = &stream->internal_state;
|
|
|
|
uint32_t bytes_written;
|
|
|
|
|
2017-06-09 17:03:41 -07:00
|
|
|
if (next_in - start_in > 0)
|
|
|
|
state->has_hist = IGZIP_HIST;
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
stream->next_in = next_in;
|
|
|
|
stream->total_in += next_in - start_in;
|
|
|
|
stream->avail_in = end_in - next_in;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
|
|
|
bytes_written = buffer_used(&state->bitbuf);
|
|
|
|
stream->total_out += bytes_written;
|
|
|
|
stream->next_out += bytes_written;
|
|
|
|
stream->avail_out -= bytes_written;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
void isal_deflate_body_base(struct isal_zstream *stream)
|
|
|
|
{
|
|
|
|
uint32_t literal, hash;
|
|
|
|
uint8_t *start_in, *next_in, *end_in, *end, *next_hash;
|
|
|
|
uint16_t match_length;
|
2016-09-12 13:15:32 -07:00
|
|
|
uint32_t dist;
|
2016-06-02 13:52:23 -07:00
|
|
|
uint64_t code, code_len, code2, code_len2;
|
|
|
|
struct isal_zstate *state = &stream->internal_state;
|
|
|
|
uint16_t *last_seen = state->head;
|
2019-01-08 08:49:23 -07:00
|
|
|
uint8_t *file_start = (uint8_t *) ((uintptr_t) stream->next_in - stream->total_in);
|
2018-06-06 18:48:40 -04:00
|
|
|
uint32_t hist_size = state->dist_mask;
|
2018-06-06 16:33:19 -07:00
|
|
|
uint32_t hash_mask = state->hash_mask;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
|
|
|
if (stream->avail_in == 0) {
|
|
|
|
if (stream->end_of_stream || stream->flush != NO_FLUSH)
|
|
|
|
state->state = ZSTATE_FLUSH_READ_BUFFER;
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
set_buf(&state->bitbuf, stream->next_out, stream->avail_out);
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
start_in = stream->next_in;
|
|
|
|
end_in = start_in + stream->avail_in;
|
|
|
|
next_in = start_in;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-13 15:32:57 -07:00
|
|
|
while (next_in + ISAL_LOOK_AHEAD < end_in) {
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
if (is_full(&state->bitbuf)) {
|
|
|
|
update_state(stream, start_in, next_in, end_in);
|
|
|
|
return;
|
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2021-11-11 12:53:38 +01:00
|
|
|
literal = load_le_u32(next_in);
|
2018-06-06 16:33:19 -07:00
|
|
|
hash = compute_hash(literal) & hash_mask;
|
2017-10-20 15:58:49 -07:00
|
|
|
dist = (next_in - file_start - last_seen[hash]) & 0xFFFF;
|
|
|
|
last_seen[hash] = (uint64_t) (next_in - file_start);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
/* The -1 are to handle the case when dist = 0 */
|
2018-06-06 18:48:40 -04:00
|
|
|
if (dist - 1 < hist_size) {
|
2016-09-12 13:15:32 -07:00
|
|
|
assert(dist != 0);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
match_length = compare258(next_in - dist, next_in, 258);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
if (match_length >= SHORTEST_MATCH) {
|
|
|
|
next_hash = next_in;
|
2016-08-05 14:11:25 -04:00
|
|
|
#ifdef ISAL_LIMIT_HASH_UPDATE
|
2016-09-12 13:15:32 -07:00
|
|
|
end = next_hash + 3;
|
2016-06-02 13:52:23 -07:00
|
|
|
#else
|
2016-09-12 13:15:32 -07:00
|
|
|
end = next_hash + match_length;
|
2016-06-02 13:52:23 -07:00
|
|
|
#endif
|
2016-09-12 13:15:32 -07:00
|
|
|
next_hash++;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
for (; next_hash < end; next_hash++) {
|
2021-11-11 12:53:38 +01:00
|
|
|
literal = load_le_u32(next_hash);
|
2018-06-06 16:33:19 -07:00
|
|
|
hash = compute_hash(literal) & hash_mask;
|
2017-10-20 15:58:49 -07:00
|
|
|
last_seen[hash] = (uint64_t) (next_hash - file_start);
|
2016-09-12 13:15:32 -07:00
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
get_len_code(stream->hufftables, match_length, &code,
|
|
|
|
&code_len);
|
|
|
|
get_dist_code(stream->hufftables, dist, &code2, &code_len2);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
code |= code2 << code_len;
|
|
|
|
code_len += code_len2;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
write_bits(&state->bitbuf, code, code_len);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
next_in += match_length;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
continue;
|
2016-06-02 13:52:23 -07:00
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
get_lit_code(stream->hufftables, literal & 0xFF, &code, &code_len);
|
|
|
|
write_bits(&state->bitbuf, code, code_len);
|
|
|
|
next_in++;
|
2016-06-02 13:52:23 -07:00
|
|
|
}
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
update_state(stream, start_in, next_in, end_in);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
assert(stream->avail_in <= ISAL_LOOK_AHEAD);
|
|
|
|
if (stream->end_of_stream || stream->flush != NO_FLUSH)
|
|
|
|
state->state = ZSTATE_FLUSH_READ_BUFFER;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
|
|
|
return;
|
|
|
|
|
|
|
|
}
|
|
|
|
|
|
|
|
void isal_deflate_finish_base(struct isal_zstream *stream)
|
|
|
|
{
|
|
|
|
uint32_t literal = 0, hash;
|
2016-09-12 13:15:32 -07:00
|
|
|
uint8_t *start_in, *next_in, *end_in, *end, *next_hash;
|
2016-06-02 13:52:23 -07:00
|
|
|
uint16_t match_length;
|
|
|
|
uint32_t dist;
|
|
|
|
uint64_t code, code_len, code2, code_len2;
|
|
|
|
struct isal_zstate *state = &stream->internal_state;
|
|
|
|
uint16_t *last_seen = state->head;
|
2019-01-08 08:49:23 -07:00
|
|
|
uint8_t *file_start = (uint8_t *) ((uintptr_t) stream->next_in - stream->total_in);
|
2018-06-06 18:48:40 -04:00
|
|
|
uint32_t hist_size = state->dist_mask;
|
2018-06-06 16:33:19 -07:00
|
|
|
uint32_t hash_mask = state->hash_mask;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
|
|
|
set_buf(&state->bitbuf, stream->next_out, stream->avail_out);
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
start_in = stream->next_in;
|
|
|
|
end_in = start_in + stream->avail_in;
|
|
|
|
next_in = start_in;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
if (stream->avail_in != 0) {
|
|
|
|
while (next_in + 3 < end_in) {
|
|
|
|
if (is_full(&state->bitbuf)) {
|
|
|
|
update_state(stream, start_in, next_in, end_in);
|
|
|
|
return;
|
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2021-11-11 12:53:38 +01:00
|
|
|
literal = load_le_u32(next_in);
|
2018-06-06 16:33:19 -07:00
|
|
|
hash = compute_hash(literal) & hash_mask;
|
2017-10-20 15:58:49 -07:00
|
|
|
dist = (next_in - file_start - last_seen[hash]) & 0xFFFF;
|
|
|
|
last_seen[hash] = (uint64_t) (next_in - file_start);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2018-06-06 18:48:40 -04:00
|
|
|
if (dist - 1 < hist_size) { /* The -1 are to handle the case when dist = 0 */
|
2017-03-20 10:48:58 -07:00
|
|
|
match_length =
|
|
|
|
compare258(next_in - dist, next_in, end_in - next_in);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
if (match_length >= SHORTEST_MATCH) {
|
|
|
|
next_hash = next_in;
|
2016-08-05 14:11:25 -04:00
|
|
|
#ifdef ISAL_LIMIT_HASH_UPDATE
|
2017-03-20 10:48:58 -07:00
|
|
|
end = next_hash + 3;
|
2016-06-02 13:52:23 -07:00
|
|
|
#else
|
2017-03-20 10:48:58 -07:00
|
|
|
end = next_hash + match_length;
|
2016-06-02 13:52:23 -07:00
|
|
|
#endif
|
2017-03-20 10:48:58 -07:00
|
|
|
next_hash++;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
for (; next_hash < end - 3; next_hash++) {
|
2021-11-11 12:53:38 +01:00
|
|
|
literal = load_le_u32(next_hash);
|
2018-06-06 16:33:19 -07:00
|
|
|
hash = compute_hash(literal) & hash_mask;
|
2017-03-20 10:48:58 -07:00
|
|
|
last_seen[hash] =
|
2017-10-20 15:58:49 -07:00
|
|
|
(uint64_t) (next_hash - file_start);
|
2017-03-20 10:48:58 -07:00
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
get_len_code(stream->hufftables, match_length, &code,
|
|
|
|
&code_len);
|
|
|
|
get_dist_code(stream->hufftables, dist, &code2,
|
|
|
|
&code_len2);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
code |= code2 << code_len;
|
|
|
|
code_len += code_len2;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
write_bits(&state->bitbuf, code, code_len);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
next_in += match_length;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
continue;
|
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
}
|
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
get_lit_code(stream->hufftables, literal & 0xFF, &code, &code_len);
|
|
|
|
write_bits(&state->bitbuf, code, code_len);
|
|
|
|
next_in++;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
}
|
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
while (next_in < end_in) {
|
|
|
|
if (is_full(&state->bitbuf)) {
|
|
|
|
update_state(stream, start_in, next_in, end_in);
|
|
|
|
return;
|
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2017-03-20 10:48:58 -07:00
|
|
|
literal = *next_in;
|
|
|
|
get_lit_code(stream->hufftables, literal & 0xFF, &code, &code_len);
|
|
|
|
write_bits(&state->bitbuf, code, code_len);
|
|
|
|
next_in++;
|
|
|
|
|
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
}
|
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
if (!is_full(&state->bitbuf)) {
|
|
|
|
get_lit_code(stream->hufftables, 256, &code, &code_len);
|
|
|
|
write_bits(&state->bitbuf, code, code_len);
|
|
|
|
state->has_eob = 1;
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
if (stream->end_of_stream == 1)
|
|
|
|
state->state = ZSTATE_TRL;
|
|
|
|
else
|
|
|
|
state->state = ZSTATE_SYNC_FLUSH;
|
|
|
|
}
|
2016-06-02 13:52:23 -07:00
|
|
|
|
2016-09-12 13:15:32 -07:00
|
|
|
update_state(stream, start_in, next_in, end_in);
|
2016-06-02 13:52:23 -07:00
|
|
|
|
|
|
|
return;
|
|
|
|
}
|
2017-06-07 13:40:34 -07:00
|
|
|
|
2017-11-17 10:22:18 -07:00
|
|
|
void isal_deflate_hash_base(uint16_t * hash_table, uint32_t hash_mask,
|
|
|
|
uint32_t current_index, uint8_t * dict, uint32_t dict_len)
|
2017-06-07 13:40:34 -07:00
|
|
|
{
|
|
|
|
uint8_t *next_in = dict;
|
|
|
|
uint8_t *end_in = dict + dict_len - SHORTEST_MATCH;
|
|
|
|
uint32_t literal;
|
|
|
|
uint32_t hash;
|
2017-11-17 10:22:18 -07:00
|
|
|
uint16_t index = current_index - dict_len;
|
2017-06-07 13:40:34 -07:00
|
|
|
|
|
|
|
while (next_in <= end_in) {
|
2021-11-11 12:53:38 +01:00
|
|
|
literal = load_le_u32(next_in);
|
2017-11-17 10:22:18 -07:00
|
|
|
hash = compute_hash(literal) & hash_mask;
|
|
|
|
hash_table[hash] = index;
|
|
|
|
index++;
|
2017-06-07 13:40:34 -07:00
|
|
|
next_in++;
|
|
|
|
}
|
|
|
|
}
|