ruby-changes:27770
From: nobu <ko1@a...>
Date: Tue, 19 Mar 2013 17:09:43 +0900 (JST)
Subject: [ruby-changes:27770] nobu:r39822 (trunk): convert with one converter
nobu 2013-03-19 17:09:33 +0900 (Tue, 19 Mar 2013) New Revision: 39822 http://svn.ruby-lang.org/cgi-bin/viewvc.cgi?view=rev&revision=39822 Log: convert with one converter * string.c (rb_str_conv_enc_opts): convert with one converter, instead of re-creating converters for each buffer expansion. Modified files: trunk/ChangeLog trunk/string.c Index: ChangeLog =================================================================== --- ChangeLog (revision 39821) +++ ChangeLog (revision 39822) @@ -1,3 +1,8 @@ https://github.com/ruby/ruby/blob/trunk/ChangeLog#L1 +Tue Mar 19 17:09:30 2013 Nobuyoshi Nakada <nobu@r...> + + * string.c (rb_str_conv_enc_opts): convert with one converter, instead + of re-creating converters for each buffer expansion. + Tue Mar 19 17:06:50 2013 Nobuyoshi Nakada <nobu@r...> * dir.c (glob_helper): compose HFS file names from UTF8-MAC. Index: string.c =================================================================== --- string.c (revision 39821) +++ string.c (revision 39822) @@ -492,12 +492,15 @@ RUBY_ALIAS_FUNCTION(rb_tainted_str_new2( https://github.com/ruby/ruby/blob/trunk/string.c#L492 VALUE rb_str_conv_enc_opts(VALUE str, rb_encoding *from, rb_encoding *to, int ecflags, VALUE ecopts) { + extern VALUE rb_cEncodingConverter; rb_econv_t *ec; rb_econv_result_t ret; - long len; + long len, olen; + VALUE econv_wrapper; VALUE newstr; - const unsigned char *sp; - unsigned char *dp; + const unsigned char *start, *sp; + unsigned char *dest, *dp; + size_t converted_output = 0; if (!to) return str; if (!from) from = rb_enc_get(str); @@ -513,23 +516,38 @@ rb_str_conv_enc_opts(VALUE str, rb_encod https://github.com/ruby/ruby/blob/trunk/string.c#L516 len = RSTRING_LEN(str); newstr = rb_str_new(0, len); + olen = len; - retry: ec = rb_econv_open_opts(from->name, to->name, ecflags, ecopts); if (!ec) return str; + econv_wrapper = rb_obj_alloc(rb_cEncodingConverter); + DATA_PTR(econv_wrapper) = ec; sp = (unsigned char*)RSTRING_PTR(str); - dp = (unsigned char*)RSTRING_PTR(newstr); - ret = rb_econv_convert(ec, &sp, (unsigned char*)RSTRING_END(str), - &dp, (unsigned char*)RSTRING_END(newstr), 0); + start = sp; + while ((dest = (unsigned char*)RSTRING_PTR(newstr)), + (dp = dest + converted_output), + (ret = rb_econv_convert(ec, &sp, start + len, &dp, dest + olen, 0)), + ret == econv_destination_buffer_full) { + /* destination buffer short */ + size_t converted_input = sp - start; + size_t rest = len - converted_input; + converted_output = dp - dest; + rb_str_set_len(newstr, converted_output); + if (converted_input && converted_output && + rest < (LONG_MAX / converted_output)) { + rest = (rest * converted_output) / converted_input; + } + else { + rest = olen; + } + olen += rest < 2 ? 2 : rest; + rb_str_resize(newstr, olen); + } + DATA_PTR(econv_wrapper) = 0; rb_econv_close(ec); + rb_gc_force_recycle(econv_wrapper); switch (ret) { - case econv_destination_buffer_full: - /* destination buffer short */ - len = len < 2 ? 2 : len * 2; - rb_str_resize(newstr, len); - goto retry; - case econv_finished: len = dp - (unsigned char*)RSTRING_PTR(newstr); rb_str_set_len(newstr, len); -- ML: ruby-changes@q... Info: http://www.atdot.net/~ko1/quickml/