Optimized the normal bitstream writer; it's faster than the alternative one on P3 now ... let's hope it's at least not slower on P4 & K7

Originally committed as revision 299 to svn://svn.ffmpeg.org/ffmpeg/trunk
This commit is contained in:
Michael Niedermayer 2002-02-15 00:14:01 +00:00
parent 332105e446
commit d8cf5aea49
3 changed files with 93 additions and 124 deletions

View File

@ -36,6 +36,7 @@
#include <ctype.h> #include <ctype.h>
#include <signal.h> #include <signal.h>
#include "bswap.h" // needed for the bitstream writer in common.h which is included in avformat.h
#include "avformat.h" #include "avformat.h"
/* maximum number of simultaneous HTTP connections */ /* maximum number of simultaneous HTTP connections */

View File

@ -29,82 +29,28 @@ void init_put_bits(PutBitContext *s,
s->buf = buffer; s->buf = buffer;
s->buf_end = s->buf + buffer_size; s->buf_end = s->buf + buffer_size;
s->data_out_size = 0; s->data_out_size = 0;
#ifdef ALT_BITSTREAM_WRITER
s->index=0;
((uint32_t*)(s->buf))[0]=0;
// memset(buffer, 0, buffer_size);
if(write_data!=NULL) if(write_data!=NULL)
{ {
fprintf(stderr, "write Data callback is not supported\n"); fprintf(stderr, "write Data callback is not supported\n");
} }
#ifdef ALT_BITSTREAM_WRITER
s->index=0;
((uint32_t*)(s->buf))[0]=0;
// memset(buffer, 0, buffer_size);
#else #else
s->write_data = write_data;
s->opaque = opaque;
s->buf_ptr = s->buf; s->buf_ptr = s->buf;
s->bit_cnt=0; s->bit_left=32;
s->bit_buf=0; s->bit_buf=0;
#endif #endif
} }
#ifndef ALT_BITSTREAM_WRITER
/*
 * Hand the bytes accumulated between s->buf and s->buf_ptr to the
 * write_data callback, rewind buf_ptr to the start of the buffer and
 * add the byte count to data_out_size.
 * Does nothing at all when no callback is installed.
 */
static void flush_buffer(PutBitContext *s)
{
    int pending;

    if (!s->write_data)
        return;

    pending = s->buf_ptr - s->buf;
    if (pending > 0)
        s->write_data(s->opaque, s->buf, pending);

    /* rewind and account for the bytes, even if none were pending */
    s->buf_ptr = s->buf;
    s->data_out_size += pending;
}
/*
 * Append the n bits of 'value' to the bitstream.
 *
 * s->bit_buf accumulates bits from its most significant end and
 * s->bit_cnt is the number of bits already held there. When the
 * accumulator fills up, it is stored as one 32-bit word at buf_ptr
 * (through be2me_32) and flush_buffer() is called once buf_ptr reaches
 * buf_end.
 */
void put_bits(PutBitContext *s, int n, unsigned int value)
{
    unsigned int acc;
    int used, room;

#ifdef STATS
    st_out_bit_counts[st_current_index] += n;
#endif
    assert(n == 32 || value < (1U << n));

    acc  = s->bit_buf;
    used = s->bit_cnt;
    room = 32 - used;          /* free bits left in the accumulator */

    if (n >= room) {
        /* top part of value completes the current word */
        acc |= value >> (n - room);
        *(UINT32 *)s->buf_ptr = be2me_32(acc);
        s->buf_ptr += 4;
        if (s->buf_ptr >= s->buf_end)
            flush_buffer(s);

        /* leftover low bits of value start the next word */
        used = n - room;
        if (used != 0)
            acc = value << (32 - used);
        else
            acc = 0;
    } else {
        acc |= value << (room - n);
        used += n;
    }

    s->bit_buf = acc;
    s->bit_cnt = used;
}
#endif
/* return the number of bits output */ /* return the number of bits output */
INT64 get_bit_count(PutBitContext *s) INT64 get_bit_count(PutBitContext *s)
{ {
#ifdef ALT_BITSTREAM_WRITER #ifdef ALT_BITSTREAM_WRITER
return s->data_out_size * 8 + s->index; return s->data_out_size * 8 + s->index;
#else #else
return (s->buf_ptr - s->buf + s->data_out_size) * 8 + (INT64)s->bit_cnt; return (s->buf_ptr - s->buf + s->data_out_size) * 8 + 32 - (INT64)s->bit_left;
#endif #endif
} }
@ -113,7 +59,7 @@ void align_put_bits(PutBitContext *s)
#ifdef ALT_BITSTREAM_WRITER #ifdef ALT_BITSTREAM_WRITER
put_bits(s,( - s->index) & 7,0); put_bits(s,( - s->index) & 7,0);
#else #else
put_bits(s,(8 - s->bit_cnt) & 7,0); put_bits(s,s->bit_left & 7,0);
#endif #endif
} }
@ -123,79 +69,35 @@ void flush_put_bits(PutBitContext *s)
#ifdef ALT_BITSTREAM_WRITER #ifdef ALT_BITSTREAM_WRITER
align_put_bits(s); align_put_bits(s);
#else #else
while (s->bit_cnt > 0) { s->bit_buf<<= s->bit_left;
while (s->bit_left < 32) {
/* XXX: should test end of buffer */ /* XXX: should test end of buffer */
*s->buf_ptr++=s->bit_buf >> 24; *s->buf_ptr++=s->bit_buf >> 24;
s->bit_buf<<=8; s->bit_buf<<=8;
s->bit_cnt-=8; s->bit_left+=8;
} }
flush_buffer(s); s->bit_left=32;
s->bit_cnt=0;
s->bit_buf=0; s->bit_buf=0;
#endif #endif
} }
#ifndef ALT_BITSTREAM_WRITER
/*
 * JPEG variant of put_bits: every 0xff byte written to the output is
 * followed by an extra 0x00 byte.
 *
 * Bits are accumulated in s->bit_buf from the most significant end,
 * s->bit_cnt being the number of bits already held. A full accumulator
 * is emitted byte by byte so that the escape can be inserted.
 */
void jput_bits(PutBitContext *s, int n, unsigned int value)
{
    unsigned int acc, byte;
    int used, room, k;

    assert(n == 32 || value < (1U << n));

    acc  = s->bit_buf;
    used = s->bit_cnt;
    room = 32 - used;          /* free bits left in the accumulator */

    if (n >= room) {
        acc |= value >> (n - room);

        /* emit the four bytes, most significant first, escaping 0xff */
        for (k = 4; k > 0; k--) {
            byte = (acc >> 24);
            *(s->buf_ptr++) = byte;
            if (byte == 0xff)
                *(s->buf_ptr++) = 0;
            acc <<= 8;
        }

        /* flush early: a word may expand to 8 bytes in the worst case */
        if (s->buf_ptr >= (s->buf_end - 8))
            flush_buffer(s);

        /* leftover low bits of value start the next word */
        used = n - room;
        if (used != 0)
            acc = value << (32 - used);
        else
            acc = 0;
    } else {
        acc |= value << (room - n);
        used += n;
    }

    s->bit_buf = acc;
    s->bit_cnt = used;
}
#endif
/* pad the end of the output stream with zeros */ /* pad the end of the output stream with zeros */
#ifndef ALT_BITSTREAM_WRITER #ifndef ALT_BITSTREAM_WRITER
void jflush_put_bits(PutBitContext *s) void jflush_put_bits(PutBitContext *s)
{ {
unsigned int b; unsigned int b;
s->bit_buf |= ~1U >> s->bit_cnt; /* set all the unused bits to one */ s->bit_buf<<= s->bit_left;
s->bit_buf |= ~1U >> (32 - s->bit_left); /* set all the unused bits to one */
while (s->bit_cnt > 0) { while (s->bit_left < 32) {
b = s->bit_buf >> 24; b = s->bit_buf >> 24;
*s->buf_ptr++ = b; *s->buf_ptr++ = b;
if (b == 0xff) if (b == 0xff)
*s->buf_ptr++ = 0; *s->buf_ptr++ = 0;
s->bit_buf<<=8; s->bit_buf<<=8;
s->bit_cnt-=8; s->bit_left+=8;
} }
flush_buffer(s); s->bit_left=32;
s->bit_cnt=0;
s->bit_buf=0; s->bit_buf=0;
} }
#else #else

View File

@ -168,10 +168,8 @@ typedef struct PutBitContext {
int index; int index;
#else #else
UINT32 bit_buf; UINT32 bit_buf;
int bit_cnt; int bit_left;
UINT8 *buf, *buf_ptr, *buf_end; UINT8 *buf, *buf_ptr, *buf_end;
void *opaque;
WriteDataFunc write_data;
#endif #endif
INT64 data_out_size; /* in bytes */ INT64 data_out_size; /* in bytes */
} PutBitContext; } PutBitContext;
@ -181,18 +179,11 @@ void init_put_bits(PutBitContext *s,
void *opaque, void *opaque,
void (*write_data)(void *, UINT8 *, int)); void (*write_data)(void *, UINT8 *, int));
#ifndef ALT_BITSTREAM_WRITER
void put_bits(PutBitContext *s, int n, unsigned int value);
#endif
INT64 get_bit_count(PutBitContext *s); /* XXX: change function name */ INT64 get_bit_count(PutBitContext *s); /* XXX: change function name */
void align_put_bits(PutBitContext *s); void align_put_bits(PutBitContext *s);
void flush_put_bits(PutBitContext *s); void flush_put_bits(PutBitContext *s);
/* jpeg specific put_bits */ /* jpeg specific put_bits */
#ifndef ALT_BITSTREAM_WRITER
void jput_bits(PutBitContext *s, int n, unsigned int value);
#endif
void jflush_put_bits(PutBitContext *s); void jflush_put_bits(PutBitContext *s);
/* bit input */ /* bit input */
@ -238,6 +229,42 @@ static inline uint32_t unaligned32(const void *v) {
#endif #endif
#endif //!ARCH_X86 #endif //!ARCH_X86
#ifndef ALT_BITSTREAM_WRITER
/*
 * Append the n bits of 'value' to the bitstream (normal writer).
 *
 * New bits are shifted into the low end of s->bit_buf; s->bit_left is
 * the number of bits still free in that 32-bit accumulator (32 means
 * empty). Once n no longer fits, the completed word is stored at
 * buf_ptr through be2me_32 and the remaining low bits of 'value' start
 * the next word.
 *
 * s     : bit writer state
 * n     : number of bits to write; the assert requires value < 2^n
 *         unless n == 32
 * value : the bits to write, right-aligned
 *
 * NOTE(review): no check against s->buf_end is made here; the caller
 * must supply a large enough buffer.
 */
static inline void put_bits(PutBitContext *s, int n, unsigned int value)
{
    unsigned int bit_buf;
    int bit_left;

#ifdef STATS
    st_out_bit_counts[st_current_index] += n;
#endif
    assert(n == 32 || value < (1U << n));

    bit_buf = s->bit_buf;
    bit_left = s->bit_left;

    if (n < bit_left) {
        bit_buf = (bit_buf<<n) | value;
        bit_left-=n;
    } else {
        if (bit_left < 32) {
            bit_buf<<=bit_left;
            bit_buf |= value >> (n - bit_left);
        } else {
            /* Accumulator is empty, so n == 32 here. Shifting a 32-bit
               value by 32 is undefined and would leave stale bits in
               bit_buf; the whole word simply comes from value. */
            bit_buf = value;
        }
        *(UINT32 *)s->buf_ptr = be2me_32(bit_buf);
        s->buf_ptr+=4;
        bit_left+=32 - n;
        /* bits of value that were already stored get shifted out
           before the next word is written */
        bit_buf = value;
    }

    s->bit_buf = bit_buf;
    s->bit_left = bit_left;
}
#endif
#ifdef ALT_BITSTREAM_WRITER #ifdef ALT_BITSTREAM_WRITER
static inline void put_bits(PutBitContext *s, int n, unsigned int value) static inline void put_bits(PutBitContext *s, int n, unsigned int value)
{ {
@ -304,6 +331,45 @@ static inline void put_bits(PutBitContext *s, int n, unsigned int value)
} }
#endif #endif
#ifndef ALT_BITSTREAM_WRITER
/*
 * JPEG variant of put_bits: every 0xff byte written to the output is
 * followed by an extra 0x00 byte.
 *
 * New bits are shifted into the low end of s->bit_buf; s->bit_left is
 * the number of bits still free in that 32-bit accumulator (32 means
 * empty). A completed word is emitted byte by byte, most significant
 * byte first, so that the escape can be inserted.
 *
 * s     : bit writer state
 * n     : number of bits to write; the assert requires value < 2^n
 *         unless n == 32
 * value : the bits to write, right-aligned
 *
 * NOTE(review): no check against s->buf_end is made here; a word can
 * expand to 8 output bytes, so the caller must size the buffer
 * accordingly.
 */
static inline void jput_bits(PutBitContext *s, int n, unsigned int value)
{
    unsigned int bit_buf, b;
    int bit_left, i;

    assert(n == 32 || value < (1U << n));

    bit_buf = s->bit_buf;
    bit_left = s->bit_left;

    if (n < bit_left) {
        bit_buf = (bit_buf<<n) | value;
        bit_left-=n;
    } else {
        if (bit_left < 32) {
            bit_buf<<=bit_left;
            bit_buf |= value >> (n - bit_left);
        } else {
            /* Accumulator is empty, so n == 32 here. Shifting a 32-bit
               value by 32 is undefined and would leave stale bits in
               bit_buf; the whole word simply comes from value. */
            bit_buf = value;
        }
        /* handle escape */
        for(i=0;i<4;i++) {
            b = (bit_buf >> 24);
            *(s->buf_ptr++) = b;
            if (b == 0xff)
                *(s->buf_ptr++) = 0;
            bit_buf <<= 8;
        }

        bit_left+= 32 - n;
        /* bits of value that were already emitted get shifted out
           before the next word is written */
        bit_buf = value;
    }

    s->bit_buf = bit_buf;
    s->bit_left = bit_left;
}
#endif
#ifdef ALT_BITSTREAM_WRITER #ifdef ALT_BITSTREAM_WRITER
static inline void jput_bits(PutBitContext *s, int n, int value) static inline void jput_bits(PutBitContext *s, int n, int value)
{ {