ruby-changes:2663
From: ko1@a...
Date: 9 Dec 2007 12:50:55 +0900
Subject: [ruby-changes:2663] akr - Ruby:r14154 (trunk): * re.c (append_utf8): check unicode range.
akr 2007-12-09 12:50:11 +0900 (Sun, 09 Dec 2007)

  New Revision: 14154

  Modified files:
    trunk/ChangeLog
    trunk/re.c
    trunk/test/ruby/test_m17n.rb

  Log:
    * re.c (append_utf8): check unicode range.

  http://svn.ruby-lang.org/cgi-bin/viewvc.cgi/trunk/ChangeLog?r1=14154&r2=14153
  http://svn.ruby-lang.org/cgi-bin/viewvc.cgi/trunk/re.c?r1=14154&r2=14153
  http://svn.ruby-lang.org/cgi-bin/viewvc.cgi/trunk/test/ruby/test_m17n.rb?r1=14154&r2=14153

Index: re.c
===================================================================
--- re.c (revision 14153)
+++ re.c (revision 14154)
@@ -1425,9 +1425,22 @@
 }
 
 static int
+check_unicode_range(unsigned long code, onig_errmsg_buffer err)
+{
+    if ((0xd800 <= code && code <= 0xdfff) || /* Surrogates */
+        0x10ffff < code) {
+        strcpy(err, "invalid Unicode range");
+        return -1;
+    }
+    return 0;
+}
+
+static int
 append_utf8(unsigned long uv,
         VALUE buf, rb_encoding **encp, onig_errmsg_buffer err)
 {
+    if (check_unicode_range(uv, err) != 0)
+        return -1;
     if (uv < 0x80) {
         char escbuf[5];
         snprintf(escbuf, sizeof(escbuf), "\\x%02x", (int)uv);
@@ -1468,10 +1481,6 @@
             strcpy(err, "invalid Unicode range");
             return -1;
         }
-        if (0x10ffff < code) {
-            strcpy(err, "invalid Unicode range");
-            return -1;
-        }
         p += len;
         if (append_utf8(code, buf, encp, err) != 0)
             return -1;
Index: ChangeLog
===================================================================
--- ChangeLog (revision 14153)
+++ ChangeLog (revision 14154)
@@ -1,3 +1,7 @@
+Sun Dec 9 12:49:34 2007 Tanaka Akira <akr@f...>
+
+	* re.c (append_utf8): check unicode range.
+
 Sun Dec 9 12:39:01 2007 Nobuyoshi Nakada <nobu@r...>
 
 	* lib/cgi.rb (read_multipart): exclude blanks from header values.
Index: test/ruby/test_m17n.rb
===================================================================
--- test/ruby/test_m17n.rb (revision 14153)
+++ test/ruby/test_m17n.rb (revision 14154)
@@ -446,6 +446,16 @@
     #assert_raise(SyntaxError) { s1, s2 = u('\xc2'), u('\xa1'); /#{s1}#{s2}/ }
   end
 
+  def test_regexp_unicode
+    assert_nothing_raised { eval '/\u{0}/' }
+    assert_nothing_raised { eval '/\u{D7FF}/' }
+    assert_raise(SyntaxError) { eval '/\u{D800}/' }
+    assert_raise(SyntaxError) { eval '/\u{DFFF}/' }
+    assert_nothing_raised { eval '/\u{E000}/' }
+    assert_nothing_raised { eval '/\u{10FFFF}/' }
+    assert_raise(SyntaxError) { eval '/\u{110000}/' }
+  end
+
   def test_regexp_mixed_unicode
     assert_raise(SyntaxError) { eval(a(%{/\xc2\xa0\\u{6666}/})) }
     assert_raise(SyntaxError) { eval(e(%{/\xc2\xa0\\u{6666}/})) }

--
ML: ruby-changes@q...
Info: http://www.atdot.net/~ko1/quickml