Skip to content

Commit

Permalink
* ext/psych/parser.c: prevent a memory leak by protecting calls to
Browse files Browse the repository at this point in the history
  handler callbacks.
* test/psych/test_parser.rb: test to demonstrate leak.
  • Loading branch information
tenderlove committed Feb 28, 2012
1 parent 9eb1264 commit 3ef54d1
Show file tree
Hide file tree
Showing 3 changed files with 155 additions and 24 deletions.
6 changes: 6 additions & 0 deletions CHANGELOG.rdoc
@@ -1,3 +1,9 @@
Fri Feb 24 13:54:33 2012 Aaron Patterson <aaron@tenderlovemaking.com>

* ext/psych/parser.c: prevent a memory leak by protecting calls to
handler callbacks.
* test/psych/test_parser.rb: test to demonstrate leak.

Fri Feb 24 08:08:38 2012 Aaron Patterson <aaron@tenderlovemaking.com>

* ext/psych/parser.c: set parser encoding based on the YAML input
Expand Down
143 changes: 119 additions & 24 deletions ext/psych/parser.c
Expand Up @@ -154,6 +154,68 @@ static VALUE transcode_io(VALUE src, int * parser_encoding)

#endif

static VALUE protected_start_stream(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall(args[0], id_start_stream, 1, args[1]);
}

static VALUE protected_start_document(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall3(args[0], id_start_document, 3, args + 1);
}

static VALUE protected_end_document(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall(args[0], id_end_document, 1, args[1]);
}

static VALUE protected_alias(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall(args[0], id_alias, 1, args[1]);
}

static VALUE protected_scalar(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall3(args[0], id_scalar, 6, args + 1);
}

static VALUE protected_start_sequence(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall3(args[0], id_start_sequence, 4, args + 1);
}

static VALUE protected_end_sequence(VALUE handler)
{
return rb_funcall(handler, id_end_sequence, 0);
}

static VALUE protected_start_mapping(VALUE pointer)
{
VALUE *args = (VALUE *)pointer;
return rb_funcall3(args[0], id_start_mapping, 4, args + 1);
}

static VALUE protected_end_mapping(VALUE handler)
{
return rb_funcall(handler, id_end_mapping, 0);
}

static VALUE protected_empty(VALUE handler)
{
return rb_funcall(handler, id_empty, 0);
}

static VALUE protected_end_stream(VALUE handler)
{
return rb_funcall(handler, id_end_stream, 0);
}

/*
* call-seq:
* parser.parse(yaml)
Expand All @@ -170,6 +232,7 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)
yaml_event_t event;
int done = 0;
int tainted = 0;
int state = 0;
int parser_encoding = YAML_ANY_ENCODING;
#ifdef HAVE_RUBY_ENCODING_H
int encoding = rb_utf8_encindex();
Expand Down Expand Up @@ -223,14 +286,18 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)
}

switch(event.type) {
case YAML_STREAM_START_EVENT:

rb_funcall(handler, id_start_stream, 1,
INT2NUM((long)event.data.stream_start.encoding)
);
break;
case YAML_STREAM_START_EVENT:
{
VALUE args[2];

args[0] = handler;
args[1] = INT2NUM((long)event.data.stream_start.encoding);
rb_protect(protected_start_stream, (VALUE)args, &state);
}
break;
case YAML_DOCUMENT_START_EVENT:
{
VALUE args[4];
/* Get a list of tag directives (if any) */
VALUE tag_directives = rb_ary_new();
/* Grab the document version */
Expand Down Expand Up @@ -268,19 +335,25 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)
rb_ary_push(tag_directives, rb_ary_new3((long)2, handle, prefix));
}
}
rb_funcall(handler, id_start_document, 3,
version, tag_directives,
event.data.document_start.implicit == 1 ? Qtrue : Qfalse
);
args[0] = handler;
args[1] = version;
args[2] = tag_directives;
args[3] = event.data.document_start.implicit == 1 ? Qtrue : Qfalse;
rb_protect(protected_start_document, (VALUE)args, &state);
}
break;
case YAML_DOCUMENT_END_EVENT:
rb_funcall(handler, id_end_document, 1,
event.data.document_end.implicit == 1 ? Qtrue : Qfalse
);
{
VALUE args[2];

args[0] = handler;
args[1] = event.data.document_end.implicit == 1 ? Qtrue : Qfalse;
rb_protect(protected_end_document, (VALUE)args, &state);
}
break;
case YAML_ALIAS_EVENT:
{
VALUE args[2];
VALUE alias = Qnil;
if(event.data.alias.anchor) {
alias = rb_str_new2((const char *)event.data.alias.anchor);
Expand All @@ -290,11 +363,14 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)
#endif
}

rb_funcall(handler, id_alias, 1, alias);
args[0] = handler;
args[1] = alias;
rb_protect(protected_alias, (VALUE)args, &state);
}
break;
case YAML_SCALAR_EVENT:
{
VALUE args[7];
VALUE anchor = Qnil;
VALUE tag = Qnil;
VALUE plain_implicit, quoted_implicit, style;
Expand Down Expand Up @@ -332,12 +408,19 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)

style = INT2NUM((long)event.data.scalar.style);

rb_funcall(handler, id_scalar, 6,
val, anchor, tag, plain_implicit, quoted_implicit, style);
args[0] = handler;
args[1] = val;
args[2] = anchor;
args[3] = tag;
args[4] = plain_implicit;
args[5] = quoted_implicit;
args[6] = style;
rb_protect(protected_scalar, (VALUE)args, &state);
}
break;
case YAML_SEQUENCE_START_EVENT:
{
VALUE args[5];
VALUE anchor = Qnil;
VALUE tag = Qnil;
VALUE implicit, style;
Expand All @@ -363,15 +446,21 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)

style = INT2NUM((long)event.data.sequence_start.style);

rb_funcall(handler, id_start_sequence, 4,
anchor, tag, implicit, style);
args[0] = handler;
args[1] = anchor;
args[2] = tag;
args[3] = implicit;
args[4] = style;

rb_protect(protected_start_sequence, (VALUE)args, &state);
}
break;
case YAML_SEQUENCE_END_EVENT:
rb_funcall(handler, id_end_sequence, 0);
rb_protect(protected_end_sequence, handler, &state);
break;
case YAML_MAPPING_START_EVENT:
{
VALUE args[5];
VALUE anchor = Qnil;
VALUE tag = Qnil;
VALUE implicit, style;
Expand All @@ -396,22 +485,28 @@ static VALUE parse(int argc, VALUE *argv, VALUE self)

style = INT2NUM((long)event.data.mapping_start.style);

rb_funcall(handler, id_start_mapping, 4,
anchor, tag, implicit, style);
args[0] = handler;
args[1] = anchor;
args[2] = tag;
args[3] = implicit;
args[4] = style;

rb_protect(protected_start_mapping, (VALUE)args, &state);
}
break;
case YAML_MAPPING_END_EVENT:
rb_funcall(handler, id_end_mapping, 0);
rb_protect(protected_end_mapping, handler, &state);
break;
case YAML_NO_EVENT:
rb_funcall(handler, id_empty, 0);
rb_protect(protected_empty, handler, &state);
break;
case YAML_STREAM_END_EVENT:
rb_funcall(handler, id_end_stream, 0);
rb_protect(protected_end_stream, handler, &state);
done = 1;
break;
}
yaml_event_delete(&event);
if (state) rb_jump_tag(state);
}

return self;
Expand Down
30 changes: 30 additions & 0 deletions test/psych/test_parser.rb
Expand Up @@ -32,6 +32,36 @@ def setup
@handler.parser = @parser
end

def test_exception_memory_leak
yaml = <<-eoyaml
%YAML 1.1
%TAG ! tag:tenderlovemaking.com,2009:
--- &ponies
- first element
- *ponies
- foo: bar
...
eoyaml

[:start_stream, :start_document, :end_document, :alias, :scalar,
:start_sequence, :end_sequence, :start_mapping, :end_mapping,
:end_stream].each do |method|

klass = Class.new(Psych::Handler) do
define_method(method) do |*args|
raise
end
end

parser = Psych::Parser.new klass.new
2.times {
assert_raises(RuntimeError, method.to_s) do
parser.parse yaml
end
}
end
end

def test_multiparse
3.times do
@parser.parse '--- foo'
Expand Down

0 comments on commit 3ef54d1

Please sign in to comment.