ruby: use malloc/realloc for stream buffer

This commit is contained in:
frsyuki 2010-05-26 07:01:28 +09:00
parent 26bc835c7e
commit 5fa589691c

@ -27,16 +27,17 @@ static ID s_readpartial;
int s_ascii_8bit; int s_ascii_8bit;
#endif #endif
static ID s_slice_bang; struct unpack_buffer {
#ifdef RUBY_VM size_t size;
static ID s_clear; size_t free;
#endif char* ptr;
};
typedef struct { typedef struct {
int finished; int finished;
VALUE source; VALUE source;
size_t offset; size_t offset;
VALUE buffer; struct unpack_buffer buffer;
VALUE stream; VALUE stream;
VALUE streambuf; VALUE streambuf;
ID stream_append_method; ID stream_append_method;
@ -129,8 +130,16 @@ static inline int template_callback_map_item(unpack_user* u, VALUE* c, VALUE k,
#endif #endif
static inline int template_callback_raw(unpack_user* u, const char* b, const char* p, unsigned int l, VALUE* o) static inline int template_callback_raw(unpack_user* u, const char* b, const char* p, unsigned int l, VALUE* o)
{ *o = (l <= COW_MIN_SIZE) ? rb_str_new(p, l) : rb_str_substr(u->source, p - b, l); return 0; } //{ *o = (l <= COW_MIN_SIZE) ? rb_str_new(p, l) : rb_str_substr(u->source, p - b, l); return 0; }
//{ *o = rb_str_new(p, l); return 0; } //{ *o = rb_str_new(p, l); return 0; }
{
if(u->source == Qnil || l <= COW_MIN_SIZE) {
*o = rb_str_new(p, l);
} else {
*o = rb_str_substr(u->source, p - b, l);
}
return 0;
}
#include "msgpack/unpack_template.h" #include "msgpack/unpack_template.h"
@ -209,6 +218,27 @@ static int template_execute_wrap(msgpack_unpack_t* mp,
return ret; return ret;
} }
static int template_execute_wrap_each(msgpack_unpack_t* mp,
const char* ptr, size_t dlen, size_t* from)
{
VALUE args[4] = {
(VALUE)mp,
(VALUE)ptr,
(VALUE)dlen,
(VALUE)from,
};
// FIXME execute実行中はmp->topが更新されないのでGC markが機能しない
rb_gc_disable();
int ret = (int)rb_rescue(template_execute_do, (VALUE)args,
template_execute_rescue, Qnil);
rb_gc_enable();
return ret;
}
static VALUE cUnpacker; static VALUE cUnpacker;
@ -220,15 +250,26 @@ static VALUE cUnpacker;
static VALUE eUnpackError; static VALUE eUnpackError;
#ifndef MSGPACK_UNPACKER_BUFFER_INIT_SIZE
#define MSGPACK_UNPACKER_BUFFER_INIT_SIZE (32*1024)
#endif
#ifndef MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE
#define MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE (8*1024)
#endif
static void MessagePack_Unpacker_free(void* data) static void MessagePack_Unpacker_free(void* data)
{ {
if(data) { free(data); } if(data) {
msgpack_unpack_t* mp = (msgpack_unpack_t*)data;
free(mp->user.buffer.ptr);
free(mp);
}
} }
static void MessagePack_Unpacker_mark(msgpack_unpack_t *mp) static void MessagePack_Unpacker_mark(msgpack_unpack_t *mp)
{ {
unsigned int i; unsigned int i;
rb_gc_mark(mp->user.buffer);
rb_gc_mark(mp->user.stream); rb_gc_mark(mp->user.stream);
rb_gc_mark(mp->user.streambuf); rb_gc_mark(mp->user.streambuf);
for(i=0; i < mp->top; ++i) { for(i=0; i < mp->top; ++i) {
@ -255,14 +296,6 @@ static ID append_method_of(VALUE stream)
} }
} }
#ifndef MSGPACK_UNPACKER_BUFFER_INIT_SIZE
#define MSGPACK_UNPACKER_BUFFER_INIT_SIZE (32*1024)
#endif
#ifndef MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE
#define MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE (8*1024)
#endif
/** /**
* Document-method: MessagePack::Unpacker#initialize * Document-method: MessagePack::Unpacker#initialize
* *
@ -297,7 +330,9 @@ static VALUE MessagePack_Unpacker_initialize(int argc, VALUE *argv, VALUE self)
template_init(mp); template_init(mp);
mp->user.finished = 0; mp->user.finished = 0;
mp->user.offset = 0; mp->user.offset = 0;
mp->user.buffer = rb_str_buf_new(MSGPACK_UNPACKER_BUFFER_INIT_SIZE); mp->user.buffer.size = 0;
mp->user.buffer.free = 0;
mp->user.buffer.ptr = NULL;
mp->user.stream = stream; mp->user.stream = stream;
mp->user.streambuf = rb_str_buf_new(MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE); mp->user.streambuf = rb_str_buf_new(MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE);
mp->user.stream_append_method = append_method_of(stream); mp->user.stream_append_method = append_method_of(stream);
@ -363,34 +398,66 @@ static VALUE MessagePack_Unpacker_stream_set(VALUE self, VALUE val)
# define NEED_MORE_CAPA(s,size) (!FL_TEST(s,STR_NOCAPA) && RSTRING(s)->aux.capa < size) # define NEED_MORE_CAPA(s,size) (!FL_TEST(s,STR_NOCAPA) && RSTRING(s)->aux.capa < size)
#endif #endif
static void try_rewind_buffer(msgpack_unpack_t* mp, size_t required) static void feed_buffer(msgpack_unpack_t* mp, const char* ptr, size_t len)
{ {
VALUE buffer = mp->user.buffer; struct unpack_buffer* buffer = &mp->user.buffer;
size_t need_capa = RSTRING_LEN(buffer) + required; if(buffer->size == 0) {
char* tmp = (char*)malloc(MSGPACK_UNPACKER_BUFFER_INIT_SIZE);
// FIXME check tmp == NULL
buffer->ptr = tmp;
buffer->free = MSGPACK_UNPACKER_BUFFER_INIT_SIZE;
buffer->size = 0;
if(NEED_MORE_CAPA(buffer, need_capa)) { } else if(buffer->size <= mp->user.offset) {
/* FIXME /* clear buffer and rewind offset */
#ifdef RUBY_VM buffer->free += buffer->size;
if(RSTRING_LEN(buffer) <= mp->user.offset) { buffer->size = 0;
rb_funcall(buffer, s_clear, 0);
mp->user.offset = 0;
return;
}
#endif
rb_funcall(buffer, s_slice_bang, 2, LONG2FIX(0), LONG2FIX(mp->user.offset));
mp->user.offset = 0;
*/
size_t not_parsed = RSTRING_LEN(buffer) - mp->user.offset;
size_t nsize = MSGPACK_UNPACKER_BUFFER_INIT_SIZE * 2;
while(nsize < not_parsed + required) {
nsize *= 2;
}
VALUE nbuffer = rb_str_buf_new(nsize);
rb_str_buf_cat(nbuffer, RSTRING_PTR(buffer)+mp->user.offset, not_parsed);
mp->user.buffer = nbuffer;
mp->user.offset = 0; mp->user.offset = 0;
} }
if(len <= buffer->free) {
/* enough free space: just copy */
memcpy(buffer->ptr+buffer->size, ptr, len);
buffer->size += len;
buffer->free -= len;
return;
}
size_t csize = buffer->size + buffer->free;
if(mp->user.offset <= buffer->size / 2) {
/* parsed less than half: realloc and copy */
csize *= 2;
while(csize < buffer->size + len) {
csize *= 2;
}
char* tmp = (char*)realloc(buffer->ptr, csize);
// FIXME check tmp == NULL
memcpy(tmp + buffer->size, ptr, len);
buffer->ptr = tmp;
buffer->free = csize - buffer->size;
return;
}
size_t not_parsed = buffer->size - mp->user.offset;
if(csize < not_parsed + len) {
/* more buffer size */
csize *= 2;
while(csize < not_parsed + len) {
csize *= 2;
}
char* tmp = (char*)realloc(buffer->ptr, csize);
// FIXME check tmp == NULL
buffer->ptr = tmp;
}
memcpy(buffer->ptr+not_parsed, ptr, not_parsed);
buffer->size = not_parsed;
buffer->free = csize - buffer->size;
buffer->ptr = buffer->ptr;
mp->user.offset = 0;
} }
/** /**
@ -405,8 +472,7 @@ static VALUE MessagePack_Unpacker_feed(VALUE self, VALUE data)
{ {
UNPACKER(self, mp); UNPACKER(self, mp);
StringValue(data); StringValue(data);
try_rewind_buffer(mp, RSTRING_LEN(data)); feed_buffer(mp, RSTRING_PTR(data), RSTRING_LEN(data));
rb_str_cat(mp->user.buffer, RSTRING_PTR(data), RSTRING_LEN(data));
return Qnil; return Qnil;
} }
@ -432,18 +498,12 @@ static VALUE MessagePack_Unpacker_fill(VALUE self)
return Qnil; return Qnil;
} }
long len; rb_funcall(mp->user.stream, mp->user.stream_append_method, 2,
if(RSTRING_LEN(mp->user.buffer) == 0) { LONG2FIX(MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE),
rb_funcall(mp->user.stream, mp->user.stream_append_method, 2, mp->user.streambuf);
LONG2FIX(MSGPACK_UNPACKER_BUFFER_INIT_SIZE), mp->user.buffer);
len = RSTRING_LEN(mp->user.buffer); size_t len = RSTRING_LEN(mp->user.streambuf);
} else { feed_buffer(mp, RSTRING_PTR(mp->user.streambuf), len);
rb_funcall(mp->user.stream, mp->user.stream_append_method, 2,
LONG2FIX(MSGPACK_UNPACKER_BUFFER_RESERVE_SIZE), mp->user.streambuf);
len = RSTRING_LEN(mp->user.streambuf);
try_rewind_buffer(mp, len);
rb_str_cat(mp->user.buffer, RSTRING_PTR(mp->user.streambuf), RSTRING_LEN(mp->user.streambuf));
}
return LONG2FIX(len); return LONG2FIX(len);
} }
@ -470,7 +530,7 @@ static VALUE MessagePack_Unpacker_each(VALUE self)
#endif #endif
while(1) { while(1) {
if(RSTRING_LEN(mp->user.buffer) <= mp->user.offset) { if(mp->user.buffer.size <= mp->user.offset) {
do_fill: do_fill:
{ {
VALUE len = MessagePack_Unpacker_fill(self); VALUE len = MessagePack_Unpacker_fill(self);
@ -480,8 +540,9 @@ static VALUE MessagePack_Unpacker_each(VALUE self)
} }
} }
ret = template_execute_wrap(mp, mp->user.buffer, ret = template_execute_wrap_each(mp,
RSTRING_LEN(mp->user.buffer), &mp->user.offset); mp->user.buffer.ptr, mp->user.buffer.size,
&mp->user.offset);
if(ret < 0) { if(ret < 0) {
rb_raise(eUnpackError, "parse error."); rb_raise(eUnpackError, "parse error.");
@ -689,11 +750,6 @@ void Init_msgpack_unpack(VALUE mMessagePack)
s_ascii_8bit = rb_enc_find_index("ASCII-8BIT"); s_ascii_8bit = rb_enc_find_index("ASCII-8BIT");
#endif #endif
s_slice_bang = rb_intern("slice!");
#ifdef RUBY_VM
s_clear = rb_intern("clear");
#endif
eUnpackError = rb_define_class_under(mMessagePack, "UnpackError", rb_eStandardError); eUnpackError = rb_define_class_under(mMessagePack, "UnpackError", rb_eStandardError);
cUnpacker = rb_define_class_under(mMessagePack, "Unpacker", rb_cObject); cUnpacker = rb_define_class_under(mMessagePack, "Unpacker", rb_cObject);
rb_define_alloc_func(cUnpacker, MessagePack_Unpacker_alloc); rb_define_alloc_func(cUnpacker, MessagePack_Unpacker_alloc);