Multi-thread the lossless cruncher.
BUG=webp:336 Change-Id: I8e861d6a61d51a5cdc4bbd00cd4f17d4ff006d2f
This commit is contained in:
parent
a88c6522f6
commit
f8c2ac15af
@ -364,20 +364,16 @@ typedef struct {
|
|||||||
|
|
||||||
#define CRUNCH_CONFIGS_MAX (kNumEntropyIx * 2)
|
#define CRUNCH_CONFIGS_MAX (kNumEntropyIx * 2)
|
||||||
|
|
||||||
static int AnalyzeAndInit(VP8LEncoder* const enc,
|
static int EncoderAnalyze(VP8LEncoder* const enc,
|
||||||
CrunchConfig crunch_configs[CRUNCH_CONFIGS_MAX],
|
CrunchConfig crunch_configs[CRUNCH_CONFIGS_MAX],
|
||||||
int* const crunch_configs_size,
|
int* const crunch_configs_size,
|
||||||
int* const red_and_blue_always_zero) {
|
int* const red_and_blue_always_zero) {
|
||||||
const WebPPicture* const pic = enc->pic_;
|
const WebPPicture* const pic = enc->pic_;
|
||||||
const int width = pic->width;
|
const int width = pic->width;
|
||||||
const int height = pic->height;
|
const int height = pic->height;
|
||||||
const int pix_cnt = width * height;
|
|
||||||
const WebPConfig* const config = enc->config_;
|
const WebPConfig* const config = enc->config_;
|
||||||
const int method = config->method;
|
const int method = config->method;
|
||||||
const int low_effort = (config->method == 0);
|
const int low_effort = (config->method == 0);
|
||||||
// we round the block size up, so we're guaranteed to have
|
|
||||||
// at max MAX_REFS_BLOCK_PER_IMAGE blocks used:
|
|
||||||
int refs_block_size = (pix_cnt - 1) / MAX_REFS_BLOCK_PER_IMAGE + 1;
|
|
||||||
int i;
|
int i;
|
||||||
int use_palette;
|
int use_palette;
|
||||||
assert(pic != NULL && pic->argb != NULL);
|
assert(pic != NULL && pic->argb != NULL);
|
||||||
@ -428,7 +424,18 @@ static int AnalyzeAndInit(VP8LEncoder* const enc,
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
|
||||||
|
static int EncoderInit(VP8LEncoder* const enc) {
|
||||||
|
const WebPPicture* const pic = enc->pic_;
|
||||||
|
const int width = pic->width;
|
||||||
|
const int height = pic->height;
|
||||||
|
const int pix_cnt = width * height;
|
||||||
|
// we round the block size up, so we're guaranteed to have
|
||||||
|
// at most MAX_REFS_BLOCK_PER_IMAGE blocks used:
|
||||||
|
const int refs_block_size = (pix_cnt - 1) / MAX_REFS_BLOCK_PER_IMAGE + 1;
|
||||||
|
int i;
|
||||||
if (!VP8LHashChainInit(&enc->hash_chain_, pix_cnt)) return 0;
|
if (!VP8LHashChainInit(&enc->hash_chain_, pix_cnt)) return 0;
|
||||||
|
|
||||||
for (i = 0; i < 3; ++i) VP8LBackwardRefsInit(&enc->refs_[i], refs_block_size);
|
for (i = 0; i < 3; ++i) VP8LBackwardRefsInit(&enc->refs_[i], refs_block_size);
|
||||||
@ -1506,37 +1513,47 @@ static void VP8LEncoderDelete(VP8LEncoder* enc) {
|
|||||||
// -----------------------------------------------------------------------------
|
// -----------------------------------------------------------------------------
|
||||||
// Main call
|
// Main call
|
||||||
|
|
||||||
WebPEncodingError VP8LEncodeStream(const WebPConfig* const config,
|
typedef struct {
|
||||||
const WebPPicture* const picture,
|
const WebPConfig* config_;
|
||||||
VP8LBitWriter* const bw, int use_cache) {
|
const WebPPicture* picture_;
|
||||||
|
VP8LBitWriter* bw_;
|
||||||
|
VP8LEncoder* enc_;
|
||||||
|
int use_cache_;
|
||||||
|
CrunchConfig crunch_configs_[CRUNCH_CONFIGS_MAX];
|
||||||
|
int num_crunch_configs_;
|
||||||
|
int red_and_blue_always_zero_;
|
||||||
|
WebPEncodingError err_;
|
||||||
|
WebPAuxStats* stats_;
|
||||||
|
} StreamEncodeContext;
|
||||||
|
|
||||||
|
static int EncodeStreamHook(void* input, void* data2) {
|
||||||
|
StreamEncodeContext* const params = (StreamEncodeContext*)input;
|
||||||
|
const WebPConfig* const config = params->config_;
|
||||||
|
const WebPPicture* const picture = params->picture_;
|
||||||
|
VP8LBitWriter* const bw = params->bw_;
|
||||||
|
VP8LEncoder* const enc = params->enc_;
|
||||||
|
const int use_cache = params->use_cache_;
|
||||||
|
const CrunchConfig* const crunch_configs = params->crunch_configs_;
|
||||||
|
const int num_crunch_configs = params->num_crunch_configs_;
|
||||||
|
const int red_and_blue_always_zero = params->red_and_blue_always_zero_;
|
||||||
|
WebPAuxStats* const stats = params->stats_;
|
||||||
WebPEncodingError err = VP8_ENC_OK;
|
WebPEncodingError err = VP8_ENC_OK;
|
||||||
const int quality = (int)config->quality;
|
const int quality = (int)config->quality;
|
||||||
const int low_effort = (config->method == 0);
|
const int low_effort = (config->method == 0);
|
||||||
const int width = picture->width;
|
const int width = picture->width;
|
||||||
const int height = picture->height;
|
const int height = picture->height;
|
||||||
VP8LEncoder* const enc = VP8LEncoderNew(config, picture);
|
|
||||||
const size_t byte_position = VP8LBitWriterNumBytes(bw);
|
const size_t byte_position = VP8LBitWriterNumBytes(bw);
|
||||||
int use_near_lossless = 0;
|
int use_near_lossless = 0;
|
||||||
int hdr_size = 0;
|
int hdr_size = 0;
|
||||||
int data_size = 0;
|
int data_size = 0;
|
||||||
int use_delta_palette = 0;
|
int use_delta_palette = 0;
|
||||||
CrunchConfig crunch_configs[CRUNCH_CONFIGS_MAX];
|
|
||||||
int num_crunch_configs = 0;
|
|
||||||
int idx;
|
int idx;
|
||||||
int red_and_blue_always_zero = 0;
|
|
||||||
size_t best_size = 0;
|
size_t best_size = 0;
|
||||||
VP8LBitWriter bw_init = *bw, bw_best;
|
VP8LBitWriter bw_init = *bw, bw_best;
|
||||||
|
(void)data2;
|
||||||
|
|
||||||
if (enc == NULL || !VP8LBitWriterClone(bw, &bw_best)) {
|
if (!VP8LBitWriterInit(&bw_best, 0) ||
|
||||||
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
(num_crunch_configs > 1 && !VP8LBitWriterClone(bw, &bw_best))) {
|
||||||
goto Error;
|
|
||||||
}
|
|
||||||
|
|
||||||
// ---------------------------------------------------------------------------
|
|
||||||
// Analyze image (entropy, num_palettes etc)
|
|
||||||
|
|
||||||
if (!AnalyzeAndInit(enc, crunch_configs, &num_crunch_configs,
|
|
||||||
&red_and_blue_always_zero)) {
|
|
||||||
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
||||||
goto Error;
|
goto Error;
|
||||||
}
|
}
|
||||||
@ -1654,8 +1671,7 @@ WebPEncodingError VP8LEncodeStream(const WebPConfig* const config,
|
|||||||
// Store the BitWriter.
|
// Store the BitWriter.
|
||||||
VP8LBitWriterSwap(bw, &bw_best);
|
VP8LBitWriterSwap(bw, &bw_best);
|
||||||
// Update the stats.
|
// Update the stats.
|
||||||
if (picture->stats != NULL) {
|
if (stats != NULL) {
|
||||||
WebPAuxStats* const stats = picture->stats;
|
|
||||||
stats->lossless_features = 0;
|
stats->lossless_features = 0;
|
||||||
if (enc->use_predict_) stats->lossless_features |= 1;
|
if (enc->use_predict_) stats->lossless_features |= 1;
|
||||||
if (enc->use_cross_color_) stats->lossless_features |= 2;
|
if (enc->use_cross_color_) stats->lossless_features |= 2;
|
||||||
@ -1676,10 +1692,147 @@ WebPEncodingError VP8LEncodeStream(const WebPConfig* const config,
|
|||||||
VP8LBitWriterSwap(&bw_best, bw);
|
VP8LBitWriterSwap(&bw_best, bw);
|
||||||
|
|
||||||
Error:
|
Error:
|
||||||
VP8LEncoderDelete(enc);
|
|
||||||
VP8LBitWriterWipeOut(&bw_best);
|
VP8LBitWriterWipeOut(&bw_best);
|
||||||
|
params->err_ = err;
|
||||||
|
// The hook should return false in case of error.
|
||||||
|
return (err == VP8_ENC_OK);
|
||||||
|
}
|
||||||
|
|
||||||
|
WebPEncodingError VP8LEncodeStream(const WebPConfig* const config,
|
||||||
|
const WebPPicture* const picture,
|
||||||
|
VP8LBitWriter* const bw_main,
|
||||||
|
int use_cache) {
|
||||||
|
WebPEncodingError err = VP8_ENC_OK;
|
||||||
|
VP8LEncoder* const enc_main = VP8LEncoderNew(config, picture);
|
||||||
|
VP8LEncoder* enc_side = NULL;
|
||||||
|
CrunchConfig crunch_configs[CRUNCH_CONFIGS_MAX];
|
||||||
|
int num_crunch_configs_main, num_crunch_configs_side = 0;
|
||||||
|
int idx;
|
||||||
|
int red_and_blue_always_zero = 0;
|
||||||
|
WebPWorker worker_main, worker_side;
|
||||||
|
StreamEncodeContext params_main, params_side;
|
||||||
|
// The main thread uses picture->stats, the side thread uses stats_side.
|
||||||
|
WebPAuxStats stats_side;
|
||||||
|
VP8LBitWriter bw_side;
|
||||||
|
const WebPWorkerInterface* const worker_interface = WebPGetWorkerInterface();
|
||||||
|
int ok_main;
|
||||||
|
|
||||||
|
// Analyze image (entropy, num_palettes etc)
|
||||||
|
if (enc_main == NULL ||
|
||||||
|
!EncoderAnalyze(enc_main, crunch_configs, &num_crunch_configs_main,
|
||||||
|
&red_and_blue_always_zero) ||
|
||||||
|
!EncoderInit(enc_main) || !VP8LBitWriterInit(&bw_side, 0)) {
|
||||||
|
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
||||||
|
goto Error;
|
||||||
|
}
|
||||||
|
|
||||||
|
// Split the configs between the main and side threads (if any).
|
||||||
|
if (config->thread_level > 0) {
|
||||||
|
num_crunch_configs_side = num_crunch_configs_main / 2;
|
||||||
|
for (idx = 0; idx < num_crunch_configs_side; ++idx) {
|
||||||
|
params_side.crunch_configs_[idx] =
|
||||||
|
crunch_configs[num_crunch_configs_main - num_crunch_configs_side +
|
||||||
|
idx];
|
||||||
|
}
|
||||||
|
params_side.num_crunch_configs_ = num_crunch_configs_side;
|
||||||
|
}
|
||||||
|
num_crunch_configs_main -= num_crunch_configs_side;
|
||||||
|
for (idx = 0; idx < num_crunch_configs_main; ++idx) {
|
||||||
|
params_main.crunch_configs_[idx] = crunch_configs[idx];
|
||||||
|
}
|
||||||
|
params_main.num_crunch_configs_ = num_crunch_configs_main;
|
||||||
|
|
||||||
|
// Fill in the parameters for the thread workers.
|
||||||
|
{
|
||||||
|
const int params_size = (num_crunch_configs_side > 0) ? 2 : 1;
|
||||||
|
for (idx = 0; idx < params_size; ++idx) {
|
||||||
|
// Create the parameters for each worker.
|
||||||
|
WebPWorker* const worker = (idx == 0) ? &worker_main : &worker_side;
|
||||||
|
StreamEncodeContext* const param =
|
||||||
|
(idx == 0) ? ¶ms_main : ¶ms_side;
|
||||||
|
param->config_ = config;
|
||||||
|
param->picture_ = picture;
|
||||||
|
param->use_cache_ = use_cache;
|
||||||
|
param->red_and_blue_always_zero_ = red_and_blue_always_zero;
|
||||||
|
if (idx == 0) {
|
||||||
|
param->stats_ = picture->stats;
|
||||||
|
param->bw_ = bw_main;
|
||||||
|
param->enc_ = enc_main;
|
||||||
|
} else {
|
||||||
|
param->stats_ = (picture->stats == NULL) ? NULL : &stats_side;
|
||||||
|
// Create a side bit writer.
|
||||||
|
if (!VP8LBitWriterClone(bw_main, &bw_side)) {
|
||||||
|
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
||||||
|
goto Error;
|
||||||
|
}
|
||||||
|
param->bw_ = &bw_side;
|
||||||
|
// Create a side encoder.
|
||||||
|
enc_side = VP8LEncoderNew(config, picture);
|
||||||
|
if (enc_side == NULL || !EncoderInit(enc_side)) {
|
||||||
|
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
||||||
|
goto Error;
|
||||||
|
}
|
||||||
|
// Copy the values that were computed for the main encoder.
|
||||||
|
enc_side->histo_bits_ = enc_main->histo_bits_;
|
||||||
|
enc_side->transform_bits_ = enc_main->transform_bits_;
|
||||||
|
enc_side->palette_size_ = enc_main->palette_size_;
|
||||||
|
memcpy(enc_side->palette_, enc_main->palette_,
|
||||||
|
sizeof(enc_main->palette_));
|
||||||
|
param->enc_ = enc_side;
|
||||||
|
}
|
||||||
|
// Create the workers.
|
||||||
|
worker_interface->Init(worker);
|
||||||
|
worker->data1 = param;
|
||||||
|
worker->data2 = NULL;
|
||||||
|
worker->hook = (WebPWorkerHook)EncodeStreamHook;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
// Start the second thread if needed.
|
||||||
|
if (num_crunch_configs_side != 0) {
|
||||||
|
if (!worker_interface->Reset(&worker_side)) {
|
||||||
|
err = VP8_ENC_ERROR_OUT_OF_MEMORY;
|
||||||
|
goto Error;
|
||||||
|
}
|
||||||
|
// This line is here and not in the param initialization above to remove a
|
||||||
|
// Clang static analyzer warning.
|
||||||
|
memcpy(&stats_side, picture->stats, sizeof(stats_side));
|
||||||
|
// This line is only useful to remove a Clang static analyzer warning.
|
||||||
|
params_side.err_ = VP8_ENC_OK;
|
||||||
|
worker_interface->Launch(&worker_side);
|
||||||
|
}
|
||||||
|
// Execute the main thread.
|
||||||
|
worker_interface->Execute(&worker_main);
|
||||||
|
ok_main = worker_interface->Sync(&worker_main);
|
||||||
|
worker_interface->End(&worker_main);
|
||||||
|
if (num_crunch_configs_side != 0) {
|
||||||
|
// Wait for the second thread.
|
||||||
|
const int ok_side = worker_interface->Sync(&worker_side);
|
||||||
|
worker_interface->End(&worker_side);
|
||||||
|
if (!ok_main || !ok_side) {
|
||||||
|
err = ok_main ? params_side.err_ : params_main.err_;
|
||||||
|
goto Error;
|
||||||
|
}
|
||||||
|
if (VP8LBitWriterNumBytes(&bw_side) < VP8LBitWriterNumBytes(bw_main)) {
|
||||||
|
VP8LBitWriterSwap(bw_main, &bw_side);
|
||||||
|
if (picture->stats != NULL) {
|
||||||
|
memcpy(picture->stats, &stats_side, sizeof(*picture->stats));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
} else {
|
||||||
|
if (!ok_main) {
|
||||||
|
err = params_main.err_;
|
||||||
|
goto Error;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
Error:
|
||||||
|
VP8LBitWriterWipeOut(&bw_side);
|
||||||
|
VP8LEncoderDelete(enc_main);
|
||||||
|
VP8LEncoderDelete(enc_side);
|
||||||
return err;
|
return err;
|
||||||
}
|
}
|
||||||
|
|
||||||
#undef CRUNCH_CONFIGS_MAX
|
#undef CRUNCH_CONFIGS_MAX
|
||||||
|
|
||||||
int VP8LEncodeImage(const WebPConfig* const config,
|
int VP8LEncodeImage(const WebPConfig* const config,
|
||||||
|
@ -243,7 +243,6 @@ int VP8LBitWriterClone(const VP8LBitWriter* const src,
|
|||||||
VP8LBitWriter* const dst) {
|
VP8LBitWriter* const dst) {
|
||||||
const size_t current_size = src->cur_ - src->buf_;
|
const size_t current_size = src->cur_ - src->buf_;
|
||||||
assert(src->cur_ >= src->buf_ && src->cur_ <= src->end_);
|
assert(src->cur_ >= src->buf_ && src->cur_ <= src->end_);
|
||||||
memset(dst, 0, sizeof(*dst));
|
|
||||||
if (!VP8LBitWriterResize(dst, current_size)) return 0;
|
if (!VP8LBitWriterResize(dst, current_size)) return 0;
|
||||||
memcpy(dst->buf_, src->buf_, current_size);
|
memcpy(dst->buf_, src->buf_, current_size);
|
||||||
dst->bits_ = src->bits_;
|
dst->bits_ = src->bits_;
|
||||||
|
@ -100,7 +100,7 @@ typedef struct {
|
|||||||
int error_;
|
int error_;
|
||||||
} VP8LBitWriter;
|
} VP8LBitWriter;
|
||||||
|
|
||||||
static WEBP_INLINE size_t VP8LBitWriterNumBytes(VP8LBitWriter* const bw) {
|
static WEBP_INLINE size_t VP8LBitWriterNumBytes(const VP8LBitWriter* const bw) {
|
||||||
return (bw->cur_ - bw->buf_) + ((bw->used_ + 7) >> 3);
|
return (bw->cur_ - bw->buf_) + ((bw->used_ + 7) >> 3);
|
||||||
}
|
}
|
||||||
|
|
||||||
|
Loading…
x
Reference in New Issue
Block a user