x86: vc1dsp_mmx: Move yasm initialization steps to vc1dsp_init
That's where all the other yasm initialization steps are. This also removes the overlap between the two files.
This commit is contained in:
parent
607f820ec7
commit
a079cbf458
@ -63,17 +63,23 @@ static void vc1_h_loop_filter16_sse4(uint8_t *src, int stride, int pq)
|
|||||||
ff_vc1_h_loop_filter8_sse4(src, stride, pq);
|
ff_vc1_h_loop_filter8_sse4(src, stride, pq);
|
||||||
ff_vc1_h_loop_filter8_sse4(src+8*stride, stride, pq);
|
ff_vc1_h_loop_filter8_sse4(src+8*stride, stride, pq);
|
||||||
}
|
}
|
||||||
static void avg_vc1_mspel_mc00_mmxext(uint8_t *dst, const uint8_t *src,
|
|
||||||
ptrdiff_t stride, int rnd)
|
#define DECLARE_FUNCTION(OP, DEPTH, INSN) \
|
||||||
{
|
static void OP##vc1_mspel_mc00_##DEPTH##INSN(uint8_t *dst, \
|
||||||
ff_avg_pixels8_mmxext(dst, src, stride, 8);
|
const uint8_t *src, ptrdiff_t stride, int rnd) \
|
||||||
}
|
{ \
|
||||||
static void avg_vc1_mspel_mc00_16_sse2(uint8_t *dst, const uint8_t *src,
|
ff_ ## OP ## pixels ## DEPTH ## INSN(dst, src, stride, DEPTH); \
|
||||||
ptrdiff_t stride, int rnd)
|
|
||||||
{
|
|
||||||
ff_avg_pixels16_sse2(dst, src, stride, 16);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
|
DECLARE_FUNCTION(put_, 8, _mmx)
|
||||||
|
DECLARE_FUNCTION(put_, 16, _mmx)
|
||||||
|
DECLARE_FUNCTION(avg_, 8, _mmx)
|
||||||
|
DECLARE_FUNCTION(avg_, 16, _mmx)
|
||||||
|
DECLARE_FUNCTION(avg_, 8, _mmxext)
|
||||||
|
DECLARE_FUNCTION(avg_, 16, _mmxext)
|
||||||
|
DECLARE_FUNCTION(put_, 16, _sse2)
|
||||||
|
DECLARE_FUNCTION(avg_, 16, _sse2)
|
||||||
|
|
||||||
#endif /* HAVE_YASM */
|
#endif /* HAVE_YASM */
|
||||||
|
|
||||||
void ff_put_vc1_chroma_mc8_nornd_mmx (uint8_t *dst, uint8_t *src,
|
void ff_put_vc1_chroma_mc8_nornd_mmx (uint8_t *dst, uint8_t *src,
|
||||||
@ -109,6 +115,11 @@ av_cold void ff_vc1dsp_init_x86(VC1DSPContext *dsp)
|
|||||||
#if HAVE_YASM
|
#if HAVE_YASM
|
||||||
if (EXTERNAL_MMX(cpu_flags)) {
|
if (EXTERNAL_MMX(cpu_flags)) {
|
||||||
dsp->put_no_rnd_vc1_chroma_pixels_tab[0] = ff_put_vc1_chroma_mc8_nornd_mmx;
|
dsp->put_no_rnd_vc1_chroma_pixels_tab[0] = ff_put_vc1_chroma_mc8_nornd_mmx;
|
||||||
|
|
||||||
|
dsp->put_vc1_mspel_pixels_tab[1][0] = put_vc1_mspel_mc00_8_mmx;
|
||||||
|
dsp->put_vc1_mspel_pixels_tab[0][0] = put_vc1_mspel_mc00_16_mmx;
|
||||||
|
dsp->avg_vc1_mspel_pixels_tab[1][0] = avg_vc1_mspel_mc00_8_mmx;
|
||||||
|
dsp->avg_vc1_mspel_pixels_tab[0][0] = avg_vc1_mspel_mc00_16_mmx;
|
||||||
}
|
}
|
||||||
if (EXTERNAL_AMD3DNOW(cpu_flags)) {
|
if (EXTERNAL_AMD3DNOW(cpu_flags)) {
|
||||||
dsp->avg_no_rnd_vc1_chroma_pixels_tab[0] = ff_avg_vc1_chroma_mc8_nornd_3dnow;
|
dsp->avg_no_rnd_vc1_chroma_pixels_tab[0] = ff_avg_vc1_chroma_mc8_nornd_3dnow;
|
||||||
@ -117,13 +128,16 @@ av_cold void ff_vc1dsp_init_x86(VC1DSPContext *dsp)
|
|||||||
ASSIGN_LF(mmxext);
|
ASSIGN_LF(mmxext);
|
||||||
dsp->avg_no_rnd_vc1_chroma_pixels_tab[0] = ff_avg_vc1_chroma_mc8_nornd_mmxext;
|
dsp->avg_no_rnd_vc1_chroma_pixels_tab[0] = ff_avg_vc1_chroma_mc8_nornd_mmxext;
|
||||||
|
|
||||||
dsp->avg_vc1_mspel_pixels_tab[1][0] = avg_vc1_mspel_mc00_mmxext;
|
dsp->avg_vc1_mspel_pixels_tab[1][0] = avg_vc1_mspel_mc00_8_mmxext;
|
||||||
|
dsp->avg_vc1_mspel_pixels_tab[0][0] = avg_vc1_mspel_mc00_16_mmxext;
|
||||||
}
|
}
|
||||||
if (EXTERNAL_SSE2(cpu_flags)) {
|
if (EXTERNAL_SSE2(cpu_flags)) {
|
||||||
dsp->vc1_v_loop_filter8 = ff_vc1_v_loop_filter8_sse2;
|
dsp->vc1_v_loop_filter8 = ff_vc1_v_loop_filter8_sse2;
|
||||||
dsp->vc1_h_loop_filter8 = ff_vc1_h_loop_filter8_sse2;
|
dsp->vc1_h_loop_filter8 = ff_vc1_h_loop_filter8_sse2;
|
||||||
dsp->vc1_v_loop_filter16 = vc1_v_loop_filter16_sse2;
|
dsp->vc1_v_loop_filter16 = vc1_v_loop_filter16_sse2;
|
||||||
dsp->vc1_h_loop_filter16 = vc1_h_loop_filter16_sse2;
|
dsp->vc1_h_loop_filter16 = vc1_h_loop_filter16_sse2;
|
||||||
|
|
||||||
|
dsp->put_vc1_mspel_pixels_tab[0][0] = put_vc1_mspel_mc00_16_sse2;
|
||||||
dsp->avg_vc1_mspel_pixels_tab[0][0] = avg_vc1_mspel_mc00_16_sse2;
|
dsp->avg_vc1_mspel_pixels_tab[0][0] = avg_vc1_mspel_mc00_16_sse2;
|
||||||
}
|
}
|
||||||
if (EXTERNAL_SSSE3(cpu_flags)) {
|
if (EXTERNAL_SSSE3(cpu_flags)) {
|
||||||
|
@ -728,39 +728,12 @@ static void vc1_inv_trans_8x8_dc_mmxext(uint8_t *dest, int linesize,
|
|||||||
);
|
);
|
||||||
}
|
}
|
||||||
|
|
||||||
#if HAVE_MMX_EXTERNAL
|
|
||||||
static void put_vc1_mspel_mc00_mmx(uint8_t *dst, const uint8_t *src,
|
|
||||||
ptrdiff_t stride, int rnd)
|
|
||||||
{
|
|
||||||
ff_put_pixels8_mmx(dst, src, stride, 8);
|
|
||||||
}
|
|
||||||
static void put_vc1_mspel_mc00_16_mmx(uint8_t *dst, const uint8_t *src,
|
|
||||||
ptrdiff_t stride, int rnd)
|
|
||||||
{
|
|
||||||
ff_put_pixels16_mmx(dst, src, stride, 16);
|
|
||||||
}
|
|
||||||
static void avg_vc1_mspel_mc00_mmx(uint8_t *dst, const uint8_t *src,
|
|
||||||
ptrdiff_t stride, int rnd)
|
|
||||||
{
|
|
||||||
ff_avg_pixels8_mmx(dst, src, stride, 8);
|
|
||||||
}
|
|
||||||
static void avg_vc1_mspel_mc00_16_mmx(uint8_t *dst, const uint8_t *src,
|
|
||||||
ptrdiff_t stride, int rnd)
|
|
||||||
{
|
|
||||||
ff_avg_pixels16_mmx(dst, src, stride, 16);
|
|
||||||
}
|
|
||||||
#endif
|
|
||||||
|
|
||||||
#define FN_ASSIGN(OP, X, Y, INSN) \
|
#define FN_ASSIGN(OP, X, Y, INSN) \
|
||||||
dsp->OP##vc1_mspel_pixels_tab[1][X+4*Y] = OP##vc1_mspel_mc##X##Y##INSN; \
|
dsp->OP##vc1_mspel_pixels_tab[1][X+4*Y] = OP##vc1_mspel_mc##X##Y##INSN; \
|
||||||
dsp->OP##vc1_mspel_pixels_tab[0][X+4*Y] = OP##vc1_mspel_mc##X##Y##_16##INSN
|
dsp->OP##vc1_mspel_pixels_tab[0][X+4*Y] = OP##vc1_mspel_mc##X##Y##_16##INSN
|
||||||
|
|
||||||
av_cold void ff_vc1dsp_init_mmx(VC1DSPContext *dsp)
|
av_cold void ff_vc1dsp_init_mmx(VC1DSPContext *dsp)
|
||||||
{
|
{
|
||||||
#if HAVE_MMX_EXTERNAL
|
|
||||||
FN_ASSIGN(put_, 0, 0, _mmx);
|
|
||||||
FN_ASSIGN(avg_, 0, 0, _mmx);
|
|
||||||
#endif
|
|
||||||
FN_ASSIGN(put_, 0, 1, _mmx);
|
FN_ASSIGN(put_, 0, 1, _mmx);
|
||||||
FN_ASSIGN(put_, 0, 2, _mmx);
|
FN_ASSIGN(put_, 0, 2, _mmx);
|
||||||
FN_ASSIGN(put_, 0, 3, _mmx);
|
FN_ASSIGN(put_, 0, 3, _mmx);
|
||||||
|
Loading…
x
Reference in New Issue
Block a user