9ce3a7d76c
Using 4 threads, frame parallel decode is ~3x faster than single thread decode and around 30% faster than tile parallel decode for frame parallel encoded video on both Android and desktop with 4 threads. Decode speed is scalable to threads too which means decode could be even faster with more threads. Change-Id: Ia0a549aaa3e83b5a17b31d8299aa496ea4f21e3e
96 lines
2.6 KiB
C
96 lines
2.6 KiB
C
/*
|
|
* Copyright (c) 2010 The WebM project authors. All Rights Reserved.
|
|
*
|
|
* Use of this source code is governed by a BSD-style license
|
|
* that can be found in the LICENSE file in the root of the source
|
|
* tree. An additional intellectual property rights grant can be found
|
|
* in the file PATENTS. All contributing project authors may
|
|
* be found in the AUTHORS file in the root of the source tree.
|
|
*/
|
|
|
|
#ifndef VP9_DECODER_VP9_DECODER_H_
|
|
#define VP9_DECODER_VP9_DECODER_H_
|
|
|
|
#include "./vpx_config.h"
|
|
|
|
#include "vpx/vpx_codec.h"
|
|
#include "vpx_scale/yv12config.h"
|
|
|
|
#include "vp9/common/vp9_onyxc_int.h"
|
|
#include "vp9/common/vp9_ppflags.h"
|
|
#include "vp9/common/vp9_thread.h"
|
|
|
|
#include "vp9/decoder/vp9_decoder.h"
|
|
#include "vp9/decoder/vp9_dthread.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
// TODO(hkuang): combine this with TileWorkerData.
|
|
typedef struct TileData {
|
|
VP9_COMMON *cm;
|
|
vp9_reader bit_reader;
|
|
DECLARE_ALIGNED(16, MACROBLOCKD, xd);
|
|
} TileData;
|
|
|
|
typedef struct VP9Decoder {
|
|
DECLARE_ALIGNED(16, MACROBLOCKD, mb);
|
|
|
|
DECLARE_ALIGNED(16, VP9_COMMON, common);
|
|
|
|
int ready_for_new_data;
|
|
|
|
int refresh_frame_flags;
|
|
|
|
int frame_parallel_decode; // frame-based threading.
|
|
|
|
// TODO(hkuang): Combine this with cur_buf in macroblockd as they are
|
|
// the same.
|
|
RefCntBuffer *cur_buf; // Current decoding frame buffer.
|
|
RefCntBuffer *prev_buf; // Previous decoding frame buffer.
|
|
|
|
VP9Worker *frame_worker_owner; // frame_worker that owns this pbi.
|
|
VP9Worker lf_worker;
|
|
VP9Worker *tile_workers;
|
|
int num_tile_workers;
|
|
|
|
TileData *tile_data;
|
|
int total_tiles;
|
|
|
|
VP9LfSync lf_row_sync;
|
|
|
|
vpx_decrypt_cb decrypt_cb;
|
|
void *decrypt_state;
|
|
|
|
int max_threads;
|
|
int inv_tile_order;
|
|
} VP9Decoder;
|
|
|
|
int vp9_receive_compressed_data(struct VP9Decoder *pbi,
|
|
size_t size, const uint8_t **dest);
|
|
|
|
int vp9_get_raw_frame(struct VP9Decoder *pbi, YV12_BUFFER_CONFIG *sd,
|
|
vp9_ppflags_t *flags);
|
|
|
|
vpx_codec_err_t vp9_copy_reference_dec(struct VP9Decoder *pbi,
|
|
VP9_REFFRAME ref_frame_flag,
|
|
YV12_BUFFER_CONFIG *sd);
|
|
|
|
vpx_codec_err_t vp9_set_reference_dec(VP9_COMMON *cm,
|
|
VP9_REFFRAME ref_frame_flag,
|
|
YV12_BUFFER_CONFIG *sd);
|
|
|
|
int vp9_get_reference_dec(struct VP9Decoder *pbi,
|
|
int index, YV12_BUFFER_CONFIG **fb);
|
|
|
|
struct VP9Decoder *vp9_decoder_create(BufferPool *const pool);
|
|
|
|
void vp9_decoder_remove(struct VP9Decoder *pbi);
|
|
|
|
#ifdef __cplusplus
|
|
} // extern "C"
|
|
#endif
|
|
|
|
#endif // VP9_DECODER_VP9_DECODER_H_
|