ruby-changes:3408
From: ko1@a...
Date: 6 Jan 2008 04:15:17 +0900
Subject: [ruby-changes:3408] akr - Ruby:r14901 (trunk): split combinational tests.
akr 2008-01-06 04:14:24 +0900 (Sun, 06 Jan 2008) New Revision: 14901 Added files: trunk/test/ruby/test_m17n_comb.rb Modified files: trunk/test/ruby/test_m17n.rb Log: split combinational tests. http://svn.ruby-lang.org/cgi-bin/viewvc.cgi/trunk/test/ruby/test_m17n_comb.rb http://svn.ruby-lang.org/cgi-bin/viewvc.cgi/trunk/test/ruby/test_m17n.rb?r1=14901&r2=14900&diff_format=u Index: test/ruby/test_m17n.rb =================================================================== --- test/ruby/test_m17n.rb (revision 14900) +++ test/ruby/test_m17n.rb (revision 14901) @@ -78,50 +78,6 @@ assert_regexp_fixed_encoding(r) end - STRINGS = [ - a(""), e(""), s(""), u(""), - a("a"), e("a"), s("a"), u("a"), - a("."), e("."), s("."), u("."), - - # single character - a("\x80"), a("\xff"), - e("\xa1\xa1"), e("\xfe\xfe"), - e("\x8e\xa1"), e("\x8e\xfe"), - e("\x8f\xa1\xa1"), e("\x8f\xfe\xfe"), - s("\x81\x40"), s("\xfc\xfc"), - s("\xa1"), s("\xdf"), - u("\xc2\x80"), u("\xf4\x8f\xbf\xbf"), - - # same byte sequence - a("\xc2\xa1"), e("\xc2\xa1"), s("\xc2\xa1"), u("\xc2\xa1"), - - s("\x81A"), # mutibyte character which contains "A" - s("\x81a"), # mutibyte character which contains "a" - - # invalid - e("\xa1"), e("\x80"), - s("\x81"), s("\x80"), - u("\xc2"), u("\x80"), - - # for transitivity test - u("\xe0\xa0\xa1"), - e("\xe0\xa0\xa1"), - s("\xe0\xa0\xa1"), - ] - - def combination(*args) - if args.empty? - yield [] - else - arg = args.shift - arg.each {|v| - combination(*args) {|vs| - yield [v, *vs] - } - } - end - end - def encdump(str) "#{str.dump}.force_encoding(#{str.encoding.name.dump})" end @@ -164,34 +120,6 @@ end end - def each_slice_call - combination(STRINGS, -2..2) {|s, nth| - yield s, nth - } - combination(STRINGS, -2..2, 0..2) {|s, nth, len| - yield s, nth, len - } - combination(STRINGS, STRINGS) {|s, substr| - yield s, substr - } - combination(STRINGS, -2..2, 0..2) {|s, first, last| - yield s, first..last - yield s, first...last - } - combination(STRINGS, STRINGS) {|s1, s2| - if !s2.valid_encoding? - next - end - yield s1, Regexp.new(Regexp.escape(s2)) - } - combination(STRINGS, STRINGS, 0..2) {|s1, s2, nth| - if !s2.valid_encoding? - next - end - yield s1, Regexp.new(Regexp.escape(s2)), nth - } - end - def str_enc_compatible?(*strs) encs = [] strs.each {|s| @@ -669,36 +597,6 @@ assert_equal(Encoding::ASCII_8BIT, s.encoding) end - def test_str_new - STRINGS.each {|s| - t = String.new(s) - assert_strenc(a(s), s.encoding, t) - } - end - - def test_str_plus - combination(STRINGS, STRINGS) {|s1, s2| - if s1.encoding != s2.encoding && !s1.ascii_only? && !s2.ascii_only? - assert_raise(ArgumentError) { s1 + s2 } - else - t = s1 + s2 - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert_equal(a(s1) + a(s2), a(t)) - assert_str_enc_propagation(t, s1, s2) - end - } - end - - def test_str_times - STRINGS.each {|s| - [0,1,2].each {|n| - t = s * n - assert(t.valid_encoding?) if s.valid_encoding? - assert_strenc(a(s) * n, s.encoding, t) - } - } - end - def test_sprintf_c assert_strenc("\x80", 'ASCII-8BIT', a("%c") % 128) #assert_raise(ArgumentError) { a("%c") % 0xc2a1 } @@ -710,15 +608,6 @@ assert_strenc("\u{c2}", 'UTF-8', u("%c") % 0xc2) end - def test_sprintf_s - STRINGS.each {|s| - assert_strenc(a(s), s.encoding, "%s".force_encoding(s.encoding) % s) - if !s.empty? # xxx - assert_strenc(a(s), s.encoding, a("%s") % s) - end - } - end - def test_sprintf_p assert_strenc('""', 'ASCII-8BIT', a("%p") % a("")) assert_strenc('""', 'EUC-JP', e("%p") % e("")) @@ -741,67 +630,12 @@ assert_strenc('"\x00"', 'UTF-8', u("%p") % u("\x00")) end - def test_str_eq_reflexive - STRINGS.each {|s| - assert(s == s, "#{encdump s} == #{encdump s}") - } - end - - def test_str_eq_symmetric - combination(STRINGS, STRINGS) {|s1, s2| - if s1 == s2 - assert(s2 == s1, "#{encdump s2} == #{encdump s1}") - else - assert(!(s2 == s1), "!(#{encdump s2} == #{encdump s1})") - end - } - end - - def test_str_eq_transitive - combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| - if s1 == s2 && s2 == s3 - assert(s1 == s3, "transitive: #{encdump s1} == #{encdump s2} == #{encdump s3}") - end - } - end - - def test_str_eq - combination(STRINGS, STRINGS) {|s1, s2| - desc_eq = "#{encdump s1} == #{encdump s2}" - if s1.ascii_only? && s2.ascii_only? && a(s1) == a(s2) - assert(s1 == s2, desc_eq) - elsif s1.encoding == s2.encoding && a(s1) == a(s2) - assert(s1 == s2, desc_eq) - assert(!(s1 != s2)) - assert_equal(0, s1 <=> s2) - else - assert(!(s1 == s2), "!(#{desc_eq})") - assert(s1 != s2) - assert_not_equal(0, s1 <=> s2) - end - } - end - def test_str_lt assert(a("a") < a("\xa1")) assert(a("a") < s("\xa1")) assert(s("a") < a("\xa1")) end - def test_str_concat - combination(STRINGS, STRINGS) {|s1, s2| - s = s1.dup - if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding - s << s2 - assert(s.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert_equal(a(s), a(s1) + a(s2)) - assert_str_enc_propagation(s, s1, s2) - else - assert_raise(ArgumentError) { s << s2 } - end - } - end - def test_str_aref assert_equal(a("\xc2"), a("\xc2\xa1")[0]) assert_equal(a("\xa1"), a("\xc2\xa1")[1]) @@ -813,17 +647,6 @@ assert_equal(nil, s("\xc2\xa1")[2]) assert_equal(u("\xc2\xa1"), u("\xc2\xa1")[0]) assert_equal(nil, u("\xc2\xa1")[1]) - - STRINGS.each {|s| - t = '' - 0.upto(s.length-1) {|i| - u = s[i] - assert(u.valid_encoding?) if s.valid_encoding? - t << u - } - assert_equal(t, s) - } - end def test_str_aref_len @@ -838,26 +661,6 @@ assert_equal(u("\xc2\xa2"), u("\xc2\xa1\xc2\xa2\xc2\xa3")[1, 1]) assert_equal(u("\xc2\xa2\xc2\xa3"), u("\xc2\xa1\xc2\xa2\xc2\xa3")[1, 2]) - - STRINGS.each {|s| - t = '' - 0.upto(s.length-1) {|i| - u = s[i,1] - assert(u.valid_encoding?) if s.valid_encoding? - t << u - } - assert_equal(t, s) - } - - STRINGS.each {|s| - t = '' - 0.step(s.length-1, 2) {|i| - u = s[i,2] - assert(u.valid_encoding?) if s.valid_encoding? - t << u - } - assert_equal(t, s) - } end def test_str_aref_substr @@ -872,888 +675,17 @@ assert_equal(nil, u("\xc2\xa1\xc2\xa2\xc2\xa3")[u("\xa1\xc2")]) assert_raise(ArgumentError) { u("\xc2\xa1\xc2\xa2\xc2\xa3")[a("\xa1\xc2")] } - - combination(STRINGS, STRINGS) {|s1, s2| - if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding - t = s1[s2] - if t != nil - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert_equal(s2, t) - assert_match(/#{Regexp.escape(a(s2))}/, a(s1)) - if s1.valid_encoding? - assert_match(/#{Regexp.escape(s2)}/, s1) - end - end - else - assert_raise(ArgumentError) { s1[s2] } - end - } end - def test_str_aref_range2 - combination(STRINGS, -2..2, -2..2) {|s, first, last| - t = s[first..last] - if first < 0 - first += s.length - if first < 0 - assert_nil(t, "#{s.inspect}[#{first}..#{last}]") - next - end - end - if s.length < first - assert_nil(t, "#{s.inspect}[#{first}..#{last}]") - next - end - assert(t.valid_encoding?) if s.valid_encoding? - if last < 0 - last += s.length - end - t2 = '' - first.upto(last) {|i| - c = s[i] - t2 << c if c - } - assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]") - } - end - - def test_str_aref_range3 - combination(STRINGS, -2..2, -2..2) {|s, first, last| - t = s[first...last] - if first < 0 - first += s.length - if first < 0 - assert_nil(t, "#{s.inspect}[#{first}..#{last}]") - next - end - end - if s.length < first - assert_nil(t, "#{s.inspect}[#{first}..#{last}]") - next - end - if last < 0 - last += s.length - end - assert(t.valid_encoding?) if s.valid_encoding? - t2 = '' - first.upto(last-1) {|i| - c = s[i] - t2 << c if c - } - assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]") - } - end - - def test_str_assign - combination(STRINGS, STRINGS) {|s1, s2| - (-2).upto(2) {|i| - t = s1.dup - if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding - if i < -s1.length || s1.length < i - assert_raise(IndexError) { t[i] = s2 } - else - t[i] = s2 - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert(a(t).index(a(s2))) - if s1.valid_encoding? && s2.valid_encoding? - if i == s1.length && s2.empty? - assert_nil(t[i]) - elsif i < 0 - assert_equal(s2, t[i-s2.length+1,s2.length], - "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i-s2.length+1},#{s2.length}]") - else - assert_equal(s2, t[i,s2.length], - "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i},#{s2.length}]") - end - end - end - else - assert_raise(ArgumentError) { t[i] = s2 } - end - } - } - end - - def test_str_assign_len - combination(STRINGS, -2..2, 0..2, STRINGS) {|s1, i, len, s2| - t = s1.dup - if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding - if i < -s1.length || s1.length < i - assert_raise(IndexError) { t[i,len] = s2 } - else - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - t[i,len] = s2 - assert(a(t).index(a(s2))) - if s1.valid_encoding? && s2.valid_encoding? - if i == s1.length && s2.empty? - assert_nil(t[i]) - elsif i < 0 - if -i < len - len = -i - end - assert_equal(s2, t[i-s2.length+len,s2.length], - "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i-s2.length+len},#{s2.length}]") - else - assert_equal(s2, t[i,s2.length], - "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i},#{s2.length}]") - end - end - end - else - assert_raise(ArgumentError) { t[i,len] = s2 } - end - } - end - - def test_str_assign_substr - combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| - t = s1.dup - encs = [ - !s1.ascii_only? ? s1.encoding : nil, - !s2.ascii_only? ? s2.encoding : nil, - !s3.ascii_only? ? s3.encoding : nil].uniq.compact - if 1 < encs.length - assert_raise(ArgumentError, IndexError) { t[s2] = s3 } - else - if encs.empty? - encs = [ - s1.encoding, - s2.encoding, - s3.encoding].uniq.reject {|e| e == Encoding.find("ASCII-8BIT") } - if encs.empty? - encs = [Encoding.find("ASCII-8BIT")] - end - end - if !t[s2] - else - t[s2] = s3 - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? && s3.valid_encoding? - end - end - } - end - - def test_str_assign_range2 - combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2| - t = s1.dup - if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding - if first < -s1.length || s1.length < first - assert_raise(RangeError) { t[first..last] = s2 } - else - t[first..last] = s2 - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert(a(t).index(a(s2))) - if s1.valid_encoding? && s2.valid_encoding? - if first < 0 - assert_equal(s2, t[s1.length+first, s2.length]) - else - assert_equal(s2, t[first, s2.length]) - end - end - end - else - assert_raise(ArgumentError, RangeError, - "t=#{encdump(s1)};t[#{first}..#{last}]=#{encdump(s2)}") { - t[first..last] = s2 - } - end - } - end - - def test_str_assign_range3 - combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2| - t = s1.dup - if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding - if first < -s1.length || s1.length < first - assert_raise(RangeError) { t[first...last] = s2 } - else - t[first...last] = s2 - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert(a(t).index(a(s2))) - if s1.valid_encoding? && s2.valid_encoding? - if first < 0 - assert_equal(s2, t[s1.length+first, s2.length]) - else - assert_equal(s2, t[first, s2.length]) - end - end - end - else - assert_raise(ArgumentError, RangeError, - "t=#{encdump(s1)};t[#{first}...#{last}]=#{encdump(s2)}") { - t[first...last] = s2 - } - end - } - end - - def test_str_cmp - combination(STRINGS, STRINGS) {|s1, s2| - desc = "#{encdump s1} <=> #{encdump s2}" - r = s1 <=> s2 - if s1 == s2 - assert_equal(0, r, desc) - else - assert_not_equal(0, r, desc) - end - } - end - - def test_str_capitalize - STRINGS.each {|s| - begin - t1 = s.capitalize - rescue ArgumentError - assert(!s.valid_encoding?) - next - end - assert(t1.valid_encoding?) if s.valid_encoding? - assert(t1.casecmp(s)) - t2 = s.dup - t2.capitalize! - assert_equal(t1, t2) - assert_equal(s.downcase.sub(/\A[a-z]/) {|ch| a(ch).upcase }, t1) - } - end - - def test_str_casecmp - combination(STRINGS, STRINGS) {|s1, s2| - #puts "#{encdump(s1)}.casecmp(#{encdump(s2)})" - begin - r = s1.casecmp(s2) - rescue ArgumentError - assert(!s1.valid_encoding? || !s2.valid_encoding?) - next - end - #assert_equal(s1.upcase <=> s2.upcase, r) - } - end - def test_str_center assert_encoding("EUC-JP", "a".center(5, "\xa1\xa2".force_encoding("euc-jp")).encoding) - - combination(STRINGS, [0,1,2,3,10]) {|s1, width| - t = s1.center(width) - assert(a(t).index(a(s1))) - } - combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2| - if s2.empty? - assert_raise(ArgumentError) { s1.center(width, s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.center(width, s2) } - next - end - t = s1.center(width, s2) - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert(a(t).index(a(s1))) - assert_str_enc_propagation(t, s1, s2) if (t != s1) - } end - def test_str_ljust - combination(STRINGS, [0,1,2,3,10]) {|s1, width| - t = s1.ljust(width) - assert(a(t).index(a(s1))) - } - combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2| - if s2.empty? - assert_raise(ArgumentError) { s1.ljust(width, s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.ljust(width, s2) } - next - end - t = s1.ljust(width, s2) - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert(a(t).index(a(s1))) - assert_str_enc_propagation(t, s1, s2) if (t != s1) - } - end - - def test_str_rjust - combination(STRINGS, [0,1,2,3,10]) {|s1, width| - t = s1.rjust(width) - assert(a(t).index(a(s1))) - } - combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2| - if s2.empty? - assert_raise(ArgumentError) { s1.rjust(width, s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.rjust(width, s2) } - next - end - t = s1.rjust(width, s2) - assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? - assert(a(t).index(a(s1))) - assert_str_enc_propagation(t, s1, s2) if (t != s1) - } - end - - def test_str_chomp - combination(STRINGS, STRINGS) {|s1, s2| - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.chomp(s2) } - next - end - t = s1.chomp(s2) - assert(t.valid_encoding?, "#{encdump(s1)}.chomp(#{encdump(s2)})") if s1.valid_encoding? && s2.valid_encoding? - assert_equal(s1.encoding, t.encoding) - t2 = s1.dup - t2.chomp!(s2) - assert_equal(t, t2) - } - end - - def test_str_chop - STRINGS.each {|s| - s = s.dup - desc = "#{encdump s}.chop" - if !s.valid_encoding? - #assert_raise(ArgumentError, desc) { s.chop } - begin - s.chop - rescue ArgumentError - e = $! - end - next if e - end - t = nil - assert_nothing_raised(desc) { t = s.chop } - assert(t.valid_encoding?) if s.valid_encoding? - assert(a(s).index(a(t))) - t2 = s.dup - t2.chop! - assert_equal(t, t2) - } - end - - def test_str_clear - STRINGS.each {|s| - t = s.dup - t.clear - assert(t.valid_encoding?) - assert(t.empty?) - } - end - - def test_str_clone - STRINGS.each {|s| - t = s.clone - assert_equal(s, t) - assert_equal(s.encoding, t.encoding) - assert_equal(a(s), a(t)) - } - end - - def test_str_dup - STRINGS.each {|s| - t = s.dup - assert_equal(s, t) - assert_equal(s.encoding, t.encoding) - assert_equal(a(s), a(t)) - } - end - - def test_str_count - combination(STRINGS, STRINGS) {|s1, s2| - if !s1.valid_encoding? || !s2.valid_encoding? - assert_raise(ArgumentError) { s1.count(s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.count(s2) } - next - end - n = s1.count(s2) - n0 = a(s1).count(a(s2)) - assert_operator(n, :<=, n0) - } - end - - def test_str_crypt - combination(STRINGS, STRINGS) {|str, salt| - if a(salt).length < 2 - assert_raise(ArgumentError) { str.crypt(salt) } - next - end - t = str.crypt(salt) - assert_equal(a(str).crypt(a(salt)), t) - assert_encoding('ASCII-8BIT', t.encoding) - } - end - - def test_str_delete - combination(STRINGS, STRINGS) {|s1, s2| - if !s1.valid_encoding? || !s2.valid_encoding? - assert_raise(ArgumentError) { s1.delete(s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.delete(s2) } - next - end - t = s1.delete(s2) - assert(t.valid_encoding?) - assert_equal(t.encoding, s1.encoding) - assert_operator(t.length, :<=, s1.length) - t2 = s1.dup - t2.delete!(s2) - assert_equal(t, t2) - } - end - - def test_str_downcase - STRINGS.each {|s| - if !s.valid_encoding? - assert_raise(ArgumentError) { s.downcase } - next - end - t = s.downcase - assert(t.valid_encoding?) - assert_equal(t.encoding, s.encoding) - assert(t.casecmp(s)) - t2 = s.dup - t2.downcase! - assert_equal(t, t2) - } - end - - def test_str_dump - STRINGS.each {|s| - t = s.dump - assert(t.valid_encoding?) - assert(t.ascii_only?) - u = eval(t) - assert_equal(a(s), a(u)) - } - end - - def test_str_each_line - combination(STRINGS, STRINGS) {|s1, s2| - if !s1.valid_encoding? || !s2.valid_encoding? - assert_raise(ArgumentError) { s1.each_line(s2) {} } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.each_line(s2) {} } - next - end - lines = [] - s1.each_line(s2) {|line| - assert(line.valid_encoding?) - assert_equal(s1.encoding, line.encoding) - lines << line - } - next if lines.size == 0 - s2 = lines.join('') - assert_equal(s1.encoding, s2.encoding) - assert_equal(s1, s2) - } - end - - def test_str_each_byte - STRINGS.each {|s| - bytes = [] - s.each_byte {|b| - bytes << b - } - a(s).split(//).each_with_index {|ch, i| - assert_equal(ch.ord, bytes[i]) - } - } - end - - def test_str_empty? - STRINGS.each {|s| - if s.length == 0 - assert(s.empty?) - else - assert(!s.empty?) - end - } - end - - def test_str_hex - STRINGS.each {|s| - t = s.hex - t2 = a(s)[/\A[0-9a-fA-Fx]*/].hex - assert_equal(t2, t) - } - end - - def test_str_include? - combination(STRINGS, STRINGS) {|s1, s2| - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.include?(s2) } - assert_raise(ArgumentError) { s1.index(s2) } - assert_raise(ArgumentError) { s1.rindex(s2) } - next - end - t = s1.include?(s2) - if t - assert(a(s1).include?(a(s2))) - assert(s1.index(s2)) - assert(s1.rindex(s2)) - else - assert(!s1.index(s2)) - assert(!s1.rindex(s2), "!#{encdump(s1)}.rindex(#{encdump(s2)})") - end - if s2.empty? - assert_equal(true, t) - next - end - if !s1.valid_encoding? || !s2.valid_encoding? - assert_equal(false, t, "#{encdump s1}.include?(#{encdump s2})") - next - end - if t && s1.valid_encoding? && s2.valid_encoding? - assert_match(/#{Regexp.escape(s2)}/, s1) - else - assert_no_match(/#{Regexp.escape(s2)}/, s1) - end - } - end - - def test_str_index - combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos| - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.index(s2) } - next - end - t = s1.index(s2, pos) - if s2.empty? - if pos < 0 && pos+s1.length < 0 - assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); - elsif pos < 0 - assert_equal(s1.length+pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); - elsif s1.length < pos - assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); - else - assert_equal(pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); - end - next - end - if !s1.valid_encoding? || !s2.valid_encoding? - assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); - next - end - if t - re = /#{Regexp.escape(s2)}/ - assert(re.match(s1, pos)) - assert_equal($`.length, t, "#{encdump s1}.index(#{encdump s2}, #{pos})") - else - assert_no_match(/#{Regexp.escape(s2)}/, s1[pos..-1]) - end - } - end - - def test_str_rindex - combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos| - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.rindex(s2) } - next - end - t = s1.rindex(s2, pos) - if s2.empty? - if pos < 0 && pos+s1.length < 0 - assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") - elsif pos < 0 - assert_equal(s1.length+pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") - elsif s1.length < pos - assert_equal(s1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") - else - assert_equal(pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") - end - next - end - if !s1.valid_encoding? || !s2.valid_encoding? - assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") - next - end - if t - #puts "#{encdump s1}.rindex(#{encdump s2}, #{pos}) => #{t}" - assert(a(s1).index(a(s2))) - pos2 = pos - pos2 += s1.length if pos < 0 - re = /\A(.{0,#{pos2}})#{Regexp.escape(s2)}/m - assert(re.match(s1), "#{re.inspect}.match(#{encdump(s1)})") - assert_equal($1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") - else - re = /#{Regexp.escape(s2)}/ - n = re =~ s1 - if n - if pos < 0 - assert_operator(n, :>, s1.length+pos) - else - assert_operator(n, :>, pos) - end - end - end - } - end - - def test_str_insert - combination(STRINGS, 0..2, STRINGS) {|s1, nth, s2| - t1 = s1.dup - t2 = s1.dup - begin - t1[nth, 0] = s2 - rescue ArgumentError, IndexError => e1 - end - begin - t2.insert(nth, s2) - rescue ArgumentError, IndexError => e2 - end - assert_equal(t1, t2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t") - assert_equal(e1.class, e2.class, "begin #{encdump s1}.insert(#{nth},#{encdump s2}); rescue ArgumentError, IndexError => e; e end") - } - combination(STRINGS, -2..-1, STRINGS) {|s1, nth, s2| - next if s1.length + nth < 0 - next unless s1.valid_encoding? - next unless s2.valid_encoding? - t1 = s1.dup - begin - t1.insert(nth, s2) - slen = s2.length - assert_equal(t1[nth-slen+1,slen], s2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t") - rescue ArgumentError, IndexError => e - end - } - end - - def test_str_intern - STRINGS.each {|s| - if /\0/ =~ a(s) - assert_raise(ArgumentError) { s.intern } - else - sym = s.intern - assert_equal(s, sym.to_s) - end - } - end - - def test_str_length - STRINGS.each {|s| - assert_operator(s.length, :<=, s.bytesize) - } - end - - def test_str_oct - STRINGS.each {|s| - t = s.oct - t2 = a(s)[/\A[0-9a-fA-FxXbB]*/].oct - assert_equal(t2, t) - } - end - - def test_str_replace - combination(STRINGS, STRINGS) {|s1, s2| - t = s1.dup - t.replace s2 - assert_equal(s2, t) - assert_equal(s2.encoding, t.encoding) - } - end - - def test_str_reverse - STRINGS.each {|s| - t = s.reverse - assert_equal(s.bytesize, t.bytesize) - if !s.valid_encoding? - assert_operator(t.length, :<=, s.length) - next - end - assert_equal(s, t.reverse) - } - end - - def test_str_scan - combination(STRINGS, STRINGS) {|s1, s2| - if !s2.valid_encoding? - assert_raise(RegexpError) { s1.scan(s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.scan(s2) } - next - end - if !s1.valid_encoding? - assert_raise(ArgumentError) { s1.scan(s2) } - next - end - r = s1.scan(s2) - r.each {|t| - assert_equal(s2, t) - } - } - end - - def test_str_slice - each_slice_call {|obj, *args| - assert_same_result(lambda { obj[*args] }, lambda { obj.slice(*args) }) - } - end - - def test_str_slice! - each_slice_call {|s, *args| - t = s.dup - begin - r = t.slice!(*args) - rescue - e = $! - end - if e - assert_raise(e.class) { s.slice(*args) } - next - end - if !r - assert_nil(s.slice(*args)) - next - end - assert_equal(s.slice(*args), r) - assert_equal(s.bytesize, r.bytesize + t.bytesize) - if args.length == 1 && String === args[0] - assert_equal(args[0].encoding, r.encoding, - "#{encdump s}.slice!#{encdumpargs args}.encoding") - else - assert_equal(s.encoding, r.encoding, - "#{encdump s}.slice!#{encdumpargs args}.encoding") - end - if [s, *args].all? {|o| !(String === o) || o.valid_encoding? } - assert(r.valid_encoding?) - assert(t.valid_encoding?) - assert_equal(s.length, r.length + t.length) - end - } - end - - def test_str_split - combination(STRINGS, STRINGS) {|s1, s2| - if !s2.valid_encoding? - assert_raise(RegexpError) { s1.split(s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.split(s2) } - next - end - if !s1.valid_encoding? - assert_raise(ArgumentError) { s1.split(s2) } - next - end - t = s1.split(s2) - t.each {|r| - assert(a(s1).include?(a(r))) - assert_equal(s1.encoding, r.encoding) - } - assert(a(s1).include?(t.map {|u| a(u) }.join(a(s2)))) - if s1.valid_encoding? && s2.valid_encoding? - t.each {|r| - assert(r.valid_encoding?) - } - end - } - end - - def test_str_squeeze - combination(STRINGS, STRINGS) {|s1, s2| - if !s1.valid_encoding? || !s2.valid_encoding? - assert_raise(ArgumentError, "#{encdump s1}.squeeze(#{encdump s2})") { s1.squeeze(s2) } - next - end - if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding - assert_raise(ArgumentError) { s1.squeeze(s2) } - next - end - t = s1.squeeze(s2) - assert_operator(t.length, :<=, s1.length) - t2 = s1.dup - t2.squeeze!(s2) - assert_equal(t, t2) - } - end - def test_squeeze s = "\xa3\xb0\xa3\xb1\xa3\xb1\xa3\xb3\xa3\xb4".force_encoding("euc-jp") assert_equal("\xa3\xb0\xa3\xb1\xa3\xb3\xa3\xb4".force_encoding("euc-jp"), s.squeeze) end - def test_str_strip - STRINGS.each {|s| - if !s.valid_encoding? - assert_raise(ArgumentError, "#{encdump s}.strip") { s.strip } - next - end - t = s.strip - l = s.lstrip - r = s.rstrip - assert_operator(l.length, :<=, s.length) - assert_operator(r.length, :<=, s.length) - assert_operator(t.length, :<=, l.length) - assert_operator(t.length, :<=, r.length) - t2 = s.dup - t2.strip! - assert_equal(t, t2) - l2 = s.dup - l2.lstrip! - assert_equal(l, l2) - r2 = s.dup - r2.rstrip! - assert_equal(r, r2) - } - end - - def test_str_sum - STRINGS.each {|s| - assert_equal(a(s).sum, s.sum) - } - end - - def test_str_swapcase - STRINGS.each {|s| - if !s.valid_encoding? - assert_raise(ArgumentError, "#{encdump s}.swapcase") { s.swapcase } - next - end - t1 = s.swapcase - assert(t1.valid_encoding?) if s.valid_encoding? - assert(t1.casecmp(s)) - t2 = s.dup - t2.swapcase! - assert_equal(t1, t2) - t3 = t1.swapcase - assert_equal(s, t3); - } - end - - - def test_str_to_f - STRINGS.each {|s| - assert_nothing_raised { s.to_f } - } - end - - def test_str_to_i - STRINGS.each {|s| - assert_nothing_raised { s.to_i } - 2.upto(36) {|radix| - assert_nothing_raised { s.to_i(radix) } - } - } - end - - def test_str_to_s - STRINGS.each {|s| - assert_same(s, s.to_s) - assert_same(s, s.to_str) - } - end - def test_tr s = "\x81\x41".force_encoding("shift_jis") assert_equal(s.tr("A", "B"), s) @@ -1766,111 +698,13 @@ assert_equal("\xA1\xA1".force_encoding("EUC-JP"), "a".force_encoding("ASCII-8BIT").tr("a".force_encoding("ASCII-8BIT"), "\xA1\xA1".force_encoding("EUC-JP"))) - combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| - desc = "#{encdump s1}.tr(#{encdump s2}, #{encdump s3})" - if s1.empty? - assert_equal(s1, s1.tr(s2, s3), desc) - next - end - if !str_enc_compatible?(s1, s2, s3) - assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } - next - end - if !s1.valid_encoding? - assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } - next - end - if s2.empty? - assert_equal(s1, s1.tr(s2, s3), desc) - next - end - if !s2.valid_encoding? || !s3.valid_encoding? - assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } - next - end - t = s1.tr(s2, s3) - assert_operator(s1.length, :>=, t.length, desc) - } end def test_tr_s assert_equal("\xA1\xA1".force_encoding("EUC-JP"), "a".force_encoding("ASCII-8BIT").tr("a".force_encoding("ASCII-8BIT"), "\xA1\xA1".force_encoding("EUC-JP"))) - - combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| - desc = "#{encdump s1}.tr_s(#{encdump s2}, #{encdump s3})" - if s1.empty? - assert_equal(s1, s1.tr_s(s2, s3), desc) - next - end - if !s1.valid_encoding? - assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) } - next - end - if !str_enc_compatible?(s1, s2, s3) - assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } - next - end - if s2.empty? - assert_equal(s1, s1.tr_s(s2, s3), desc) - next - end - if !s2.valid_encoding? || !s3.valid_encoding? - assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) } - next - end - - t = nil - assert_nothing_raised(desc) { t = s1.tr_s(s1, s3) } - assert_operator(s1.length, :>=, t.length, desc) - } end - def test_str_upcase - STRINGS.each {|s| - desc = "#{encdump s}.upcase" - if !s.valid_encoding? - assert_raise(ArgumentError, desc) { s.upcase } - next - end - t1 = s.upcase - assert(t1.valid_encoding?) - assert(t1.casecmp(s)) - t2 = s.dup - t2.upcase! - assert_equal(t1, t2) - } - end - - def test_str_succ - starts = [ - e("\xA1\xA1"), - e("\xFE\xFE") - ] - STRINGS.each {|s0| - next if s0.empty? - s = s0.dup - n = 1000 - h = {} - n.times {|i| - if h[s] - assert(false, "#{encdump s} cycle with succ! #{i-h[s]} times") - end - h[s] = i - assert_operator(s.length, :<=, s0.length + Math.log2(i+1) + 1, "#{encdump s0} succ! #{i} times => #{encdump s}") - s.succ! - } - } - end - - def test_str_hash - combination(STRINGS, STRINGS) {|s1, s2| - if s1.eql?(s2) - assert_equal(s1.hash, s2.hash, "#{encdump s1}.hash == #{encdump s2}.dump") - end - } - end - def test_sub s = "abc".sub(/b/, "\xa1\xa1".force_encoding("euc-jp")) assert_encoding("EUC-JP", s.encoding) @@ -1921,11 +755,6 @@ end def test_marshal - STRINGS.each {|s| - m = Marshal.dump(s) - t = Marshal.load(m) - assert_equal(s, t) - } end def test_env @@ -1934,114 +763,4 @@ assert_equal(Encoding::ASCII_8BIT, v.encoding) } end - - def test_str_sub - combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| - if !s2.valid_encoding? - assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) } - next - end - r2 = Regexp.new(Regexp.escape(s2)) - [ - [ - "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { s1.sub(r2, s3) } - ], - [ - "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { s1.sub(r2) { s3 } } - ], - [ - "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { s1.gsub(r2, s3) } - ], - [ - "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { s1.gsub(r2) { s3 } } - ] - ].each {|desc, doit| - if !s1.valid_encoding? - assert_raise(ArgumentError, desc) { doit.call } - next - end - if !str_enc_compatible?(s1, s2) - assert_raise(ArgumentError, desc) { doit.call } - next - end - if !s1.include?(s2) - assert_equal(s1, doit.call) - next - end - if !str_enc_compatible?(s1, s3) - assert_raise(ArgumentError, desc) { doit.call } - next - end - t = nil - assert_nothing_raised(desc) { - t = doit.call - } - if s2 == s3 - assert_equal(s1, t, desc) - else - assert_not_equal(s1, t, desc) - end - } - } - end - - def test_str_sub! - combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| - if !s2.valid_encoding? - assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) } - next - end - r2 = Regexp.new(Regexp.escape(s2)) - [ - [ - "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { t=s1.dup; [t, t.sub!(r2, s3)] } - ], - [ - "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { t=s1.dup; [t, t.sub!(r2) { s3 }] } - ], - [ - "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { t=s1.dup; [t, t.gsub!(r2, s3)] } - ], - [ - "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})", - lambda { t=s1.dup; [t, t.gsub!(r2) { s3 }] } - ] - ].each {|desc, doit| - if !s1.valid_encoding? - assert_raise(ArgumentError, desc) { doit.call } - next - end - if !str_enc_compatible?(s1, s2) - assert_raise(ArgumentError, desc) { doit.call } - next - end - if !s1.include?(s2) - assert_equal([s1, nil], doit.call) - next - end - if !str_enc_compatible?(s1, s3) - assert_raise(ArgumentError, desc) { doit.call } - next - end - t = ret = nil - assert_nothing_raised(desc) { - t, ret = doit.call - } - assert(ret) - if s2 == s3 - assert_equal(s1, t, desc) - else - assert_not_equal(s1, t, desc) - end - } - } - end - end Index: test/ruby/test_m17n_comb.rb =================================================================== --- test/ruby/test_m17n_comb.rb (revision 0) +++ test/ruby/test_m17n_comb.rb (revision 14901) @@ -0,0 +1,1434 @@ +require 'test/unit' +require 'stringio' + +class TestM17NComb < Test::Unit::TestCase + def assert_encoding(encname, actual, message=nil) + assert_equal(Encoding.find(encname), actual, message) + end + + module AESU + def a(str) str.dup.force_encoding("ASCII-8BIT") end + def e(str) str.dup.force_encoding("EUC-JP") end + def s(str) str.dup.force_encoding("Shift_JIS") end + def u(str) str.dup.force_encoding("UTF-8") end + end + include AESU + extend AESU + + def assert_strenc(bytes, enc, actual, message=nil) + assert_instance_of(String, actual, message) + enc = Encoding.find(enc) if String === enc + assert_equal(enc, actual.encoding, message) + assert_equal(a(bytes), a(actual), message) + end + + def assert_warning(pat, mesg=nil) + begin + org_stderr = $stderr + $stderr = StringIO.new(warn = '') + yield + ensure + $stderr = org_stderr + end + assert_match(pat, warn, mesg) + end + + def assert_regexp_generic_encoding(r) + assert(!r.fixed_encoding?) + %w[ASCII-8BIT EUC-JP Shift_JIS UTF-8].each {|ename| + # "\xc2\xa1" is a valid sequence for ASCII-8BIT, EUC-JP, Shift_JIS and UTF-8. + assert_nothing_raised { r =~ "\xc2\xa1".force_encoding(ename) } + } + end + + def assert_regexp_fixed_encoding(r) + assert(r.fixed_encoding?) + %w[ASCII-8BIT EUC-JP Shift_JIS UTF-8].each {|ename| + enc = Encoding.find(ename) + if enc == r.encoding + assert_nothing_raised { r =~ "\xc2\xa1".force_encoding(enc) } + else + assert_raise(ArgumentError) { r =~ "\xc2\xa1".force_encoding(enc) } + end + } + end + + def assert_regexp_generic_ascii(r) + assert_encoding("ASCII-8BIT", r.encoding) + assert_regexp_generic_encoding(r) + end + + def assert_regexp_fixed_ascii8bit(r) + assert_encoding("ASCII-8BIT", r.encoding) + assert_regexp_fixed_encoding(r) + end + + def assert_regexp_fixed_eucjp(r) + assert_encoding("EUC-JP", r.encoding) + assert_regexp_fixed_encoding(r) + end + + def assert_regexp_fixed_sjis(r) + assert_encoding("Shift_JIS", r.encoding) + assert_regexp_fixed_encoding(r) + end + + def assert_regexp_fixed_utf8(r) + assert_encoding("UTF-8", r.encoding) + assert_regexp_fixed_encoding(r) + end + + STRINGS = [ + a(""), e(""), s(""), u(""), + a("a"), e("a"), s("a"), u("a"), + a("."), e("."), s("."), u("."), + + # single character + a("\x80"), a("\xff"), + e("\xa1\xa1"), e("\xfe\xfe"), + e("\x8e\xa1"), e("\x8e\xfe"), + e("\x8f\xa1\xa1"), e("\x8f\xfe\xfe"), + s("\x81\x40"), s("\xfc\xfc"), + s("\xa1"), s("\xdf"), + u("\xc2\x80"), u("\xf4\x8f\xbf\xbf"), + + # same byte sequence + a("\xc2\xa1"), e("\xc2\xa1"), s("\xc2\xa1"), u("\xc2\xa1"), + + s("\x81A"), # mutibyte character which contains "A" + s("\x81a"), # mutibyte character which contains "a" + + # invalid + e("\xa1"), e("\x80"), + s("\x81"), s("\x80"), + u("\xc2"), u("\x80"), + + # for transitivity test + u("\xe0\xa0\xa1"), + e("\xe0\xa0\xa1"), + s("\xe0\xa0\xa1"), + ] + + def combination(*args) + if args.empty? + yield [] + else + arg = args.shift + arg.each {|v| + combination(*args) {|vs| + yield [v, *vs] + } + } + end + end + + def encdump(str) + "#{str.dump}.force_encoding(#{str.encoding.name.dump})" + end + + def encdumpargs(args) + r = '(' + args.each_with_index {|a, i| + r << ',' if 0 < i + if String === a + r << encdump(a) + else + r << a.inspect + end + } + r << ')' + r + end + + def assert_str_enc_propagation(t, s1, s2) + if !s1.ascii_only? + assert_equal(s1.encoding, t.encoding) + elsif !s2.ascii_only? + assert_equal(s2.encoding, t.encoding) + else + assert([s1.encoding, s2.encoding].include?(t.encoding)) + end + end + + def assert_same_result(expected_proc, actual_proc) + e = nil + begin + t = expected_proc.call + rescue + e = $! + end + if e + assert_raise(e.class) { actual_proc.call } + else + assert_equal(t, actual_proc.call) + end + end + + def each_slice_call + combination(STRINGS, -2..2) {|s, nth| + yield s, nth + } + combination(STRINGS, -2..2, 0..2) {|s, nth, len| + yield s, nth, len + } + combination(STRINGS, STRINGS) {|s, substr| + yield s, substr + } + combination(STRINGS, -2..2, 0..2) {|s, first, last| + yield s, first..last + yield s, first...last + } + combination(STRINGS, STRINGS) {|s1, s2| + if !s2.valid_encoding? + next + end + yield s1, Regexp.new(Regexp.escape(s2)) + } + combination(STRINGS, STRINGS, 0..2) {|s1, s2, nth| + if !s2.valid_encoding? + next + end + yield s1, Regexp.new(Regexp.escape(s2)), nth + } + end + + def str_enc_compatible?(*strs) + encs = [] + strs.each {|s| + encs << s.encoding if !s.ascii_only? + } + encs.uniq! + encs.length <= 1 + end + + # tests start + + def test_str_new + STRINGS.each {|s| + t = String.new(s) + assert_strenc(a(s), s.encoding, t) + } + end + + def test_str_plus + combination(STRINGS, STRINGS) {|s1, s2| + if s1.encoding != s2.encoding && !s1.ascii_only? && !s2.ascii_only? + assert_raise(ArgumentError) { s1 + s2 } + else + t = s1 + s2 + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert_equal(a(s1) + a(s2), a(t)) + assert_str_enc_propagation(t, s1, s2) + end + } + end + + def test_str_times + STRINGS.each {|s| + [0,1,2].each {|n| + t = s * n + assert(t.valid_encoding?) if s.valid_encoding? + assert_strenc(a(s) * n, s.encoding, t) + } + } + end + + def test_sprintf_s + STRINGS.each {|s| + assert_strenc(a(s), s.encoding, "%s".force_encoding(s.encoding) % s) + if !s.empty? # xxx + assert_strenc(a(s), s.encoding, a("%s") % s) + end + } + end + + def test_str_eq_reflexive + STRINGS.each {|s| + assert(s == s, "#{encdump s} == #{encdump s}") + } + end + + def test_str_eq_symmetric + combination(STRINGS, STRINGS) {|s1, s2| + if s1 == s2 + assert(s2 == s1, "#{encdump s2} == #{encdump s1}") + else + assert(!(s2 == s1), "!(#{encdump s2} == #{encdump s1})") + end + } + end + + def test_str_eq_transitive + combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| + if s1 == s2 && s2 == s3 + assert(s1 == s3, "transitive: #{encdump s1} == #{encdump s2} == #{encdump s3}") + end + } + end + + def test_str_eq + combination(STRINGS, STRINGS) {|s1, s2| + desc_eq = "#{encdump s1} == #{encdump s2}" + if s1.ascii_only? && s2.ascii_only? && a(s1) == a(s2) + assert(s1 == s2, desc_eq) + elsif s1.encoding == s2.encoding && a(s1) == a(s2) + assert(s1 == s2, desc_eq) + assert(!(s1 != s2)) + assert_equal(0, s1 <=> s2) + else + assert(!(s1 == s2), "!(#{desc_eq})") + assert(s1 != s2) + assert_not_equal(0, s1 <=> s2) + end + } + end + + def test_str_concat + combination(STRINGS, STRINGS) {|s1, s2| + s = s1.dup + if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding + s << s2 + assert(s.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert_equal(a(s), a(s1) + a(s2)) + assert_str_enc_propagation(s, s1, s2) + else + assert_raise(ArgumentError) { s << s2 } + end + } + end + + def test_str_aref + + STRINGS.each {|s| + t = '' + 0.upto(s.length-1) {|i| + u = s[i] + assert(u.valid_encoding?) if s.valid_encoding? + t << u + } + assert_equal(t, s) + } + + end + + def test_str_aref_len + + STRINGS.each {|s| + t = '' + 0.upto(s.length-1) {|i| + u = s[i,1] + assert(u.valid_encoding?) if s.valid_encoding? + t << u + } + assert_equal(t, s) + } + + STRINGS.each {|s| + t = '' + 0.step(s.length-1, 2) {|i| + u = s[i,2] + assert(u.valid_encoding?) if s.valid_encoding? + t << u + } + assert_equal(t, s) + } + end + + def test_str_aref_substr + + combination(STRINGS, STRINGS) {|s1, s2| + if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding + t = s1[s2] + if t != nil + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert_equal(s2, t) + assert_match(/#{Regexp.escape(a(s2))}/, a(s1)) + if s1.valid_encoding? + assert_match(/#{Regexp.escape(s2)}/, s1) + end + end + else + assert_raise(ArgumentError) { s1[s2] } + end + } + end + + def test_str_aref_range2 + combination(STRINGS, -2..2, -2..2) {|s, first, last| + t = s[first..last] + if first < 0 + first += s.length + if first < 0 + assert_nil(t, "#{s.inspect}[#{first}..#{last}]") + next + end + end + if s.length < first + assert_nil(t, "#{s.inspect}[#{first}..#{last}]") + next + end + assert(t.valid_encoding?) if s.valid_encoding? + if last < 0 + last += s.length + end + t2 = '' + first.upto(last) {|i| + c = s[i] + t2 << c if c + } + assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]") + } + end + + def test_str_aref_range3 + combination(STRINGS, -2..2, -2..2) {|s, first, last| + t = s[first...last] + if first < 0 + first += s.length + if first < 0 + assert_nil(t, "#{s.inspect}[#{first}..#{last}]") + next + end + end + if s.length < first + assert_nil(t, "#{s.inspect}[#{first}..#{last}]") + next + end + if last < 0 + last += s.length + end + assert(t.valid_encoding?) if s.valid_encoding? + t2 = '' + first.upto(last-1) {|i| + c = s[i] + t2 << c if c + } + assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]") + } + end + + def test_str_assign + combination(STRINGS, STRINGS) {|s1, s2| + (-2).upto(2) {|i| + t = s1.dup + if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding + if i < -s1.length || s1.length < i + assert_raise(IndexError) { t[i] = s2 } + else + t[i] = s2 + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert(a(t).index(a(s2))) + if s1.valid_encoding? && s2.valid_encoding? + if i == s1.length && s2.empty? + assert_nil(t[i]) + elsif i < 0 + assert_equal(s2, t[i-s2.length+1,s2.length], + "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i-s2.length+1},#{s2.length}]") + else + assert_equal(s2, t[i,s2.length], + "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i},#{s2.length}]") + end + end + end + else + assert_raise(ArgumentError) { t[i] = s2 } + end + } + } + end + + def test_str_assign_len + combination(STRINGS, -2..2, 0..2, STRINGS) {|s1, i, len, s2| + t = s1.dup + if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding + if i < -s1.length || s1.length < i + assert_raise(IndexError) { t[i,len] = s2 } + else + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + t[i,len] = s2 + assert(a(t).index(a(s2))) + if s1.valid_encoding? && s2.valid_encoding? + if i == s1.length && s2.empty? + assert_nil(t[i]) + elsif i < 0 + if -i < len + len = -i + end + assert_equal(s2, t[i-s2.length+len,s2.length], + "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i-s2.length+len},#{s2.length}]") + else + assert_equal(s2, t[i,s2.length], + "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i},#{s2.length}]") + end + end + end + else + assert_raise(ArgumentError) { t[i,len] = s2 } + end + } + end + + def test_str_assign_substr + combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| + t = s1.dup + encs = [ + !s1.ascii_only? ? s1.encoding : nil, + !s2.ascii_only? ? s2.encoding : nil, + !s3.ascii_only? ? s3.encoding : nil].uniq.compact + if 1 < encs.length + assert_raise(ArgumentError, IndexError) { t[s2] = s3 } + else + if encs.empty? + encs = [ + s1.encoding, + s2.encoding, + s3.encoding].uniq.reject {|e| e == Encoding.find("ASCII-8BIT") } + if encs.empty? + encs = [Encoding.find("ASCII-8BIT")] + end + end + if !t[s2] + else + t[s2] = s3 + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? && s3.valid_encoding? + end + end + } + end + + def test_str_assign_range2 + combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2| + t = s1.dup + if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding + if first < -s1.length || s1.length < first + assert_raise(RangeError) { t[first..last] = s2 } + else + t[first..last] = s2 + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert(a(t).index(a(s2))) + if s1.valid_encoding? && s2.valid_encoding? + if first < 0 + assert_equal(s2, t[s1.length+first, s2.length]) + else + assert_equal(s2, t[first, s2.length]) + end + end + end + else + assert_raise(ArgumentError, RangeError, + "t=#{encdump(s1)};t[#{first}..#{last}]=#{encdump(s2)}") { + t[first..last] = s2 + } + end + } + end + + def test_str_assign_range3 + combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2| + t = s1.dup + if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding + if first < -s1.length || s1.length < first + assert_raise(RangeError) { t[first...last] = s2 } + else + t[first...last] = s2 + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert(a(t).index(a(s2))) + if s1.valid_encoding? && s2.valid_encoding? + if first < 0 + assert_equal(s2, t[s1.length+first, s2.length]) + else + assert_equal(s2, t[first, s2.length]) + end + end + end + else + assert_raise(ArgumentError, RangeError, + "t=#{encdump(s1)};t[#{first}...#{last}]=#{encdump(s2)}") { + t[first...last] = s2 + } + end + } + end + + def test_str_cmp + combination(STRINGS, STRINGS) {|s1, s2| + desc = "#{encdump s1} <=> #{encdump s2}" + r = s1 <=> s2 + if s1 == s2 + assert_equal(0, r, desc) + else + assert_not_equal(0, r, desc) + end + } + end + + def test_str_capitalize + STRINGS.each {|s| + begin + t1 = s.capitalize + rescue ArgumentError + assert(!s.valid_encoding?) + next + end + assert(t1.valid_encoding?) if s.valid_encoding? + assert(t1.casecmp(s)) + t2 = s.dup + t2.capitalize! + assert_equal(t1, t2) + assert_equal(s.downcase.sub(/\A[a-z]/) {|ch| a(ch).upcase }, t1) + } + end + + def test_str_casecmp + combination(STRINGS, STRINGS) {|s1, s2| + #puts "#{encdump(s1)}.casecmp(#{encdump(s2)})" + begin + r = s1.casecmp(s2) + rescue ArgumentError + assert(!s1.valid_encoding? || !s2.valid_encoding?) + next + end + #assert_equal(s1.upcase <=> s2.upcase, r) + } + end + + def test_str_center + + combination(STRINGS, [0,1,2,3,10]) {|s1, width| + t = s1.center(width) + assert(a(t).index(a(s1))) + } + combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2| + if s2.empty? + assert_raise(ArgumentError) { s1.center(width, s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.center(width, s2) } + next + end + t = s1.center(width, s2) + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert(a(t).index(a(s1))) + assert_str_enc_propagation(t, s1, s2) if (t != s1) + } + end + + def test_str_ljust + combination(STRINGS, [0,1,2,3,10]) {|s1, width| + t = s1.ljust(width) + assert(a(t).index(a(s1))) + } + combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2| + if s2.empty? + assert_raise(ArgumentError) { s1.ljust(width, s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.ljust(width, s2) } + next + end + t = s1.ljust(width, s2) + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert(a(t).index(a(s1))) + assert_str_enc_propagation(t, s1, s2) if (t != s1) + } + end + + def test_str_rjust + combination(STRINGS, [0,1,2,3,10]) {|s1, width| + t = s1.rjust(width) + assert(a(t).index(a(s1))) + } + combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2| + if s2.empty? + assert_raise(ArgumentError) { s1.rjust(width, s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.rjust(width, s2) } + next + end + t = s1.rjust(width, s2) + assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? + assert(a(t).index(a(s1))) + assert_str_enc_propagation(t, s1, s2) if (t != s1) + } + end + + def test_str_chomp + combination(STRINGS, STRINGS) {|s1, s2| + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.chomp(s2) } + next + end + t = s1.chomp(s2) + assert(t.valid_encoding?, "#{encdump(s1)}.chomp(#{encdump(s2)})") if s1.valid_encoding? && s2.valid_encoding? + assert_equal(s1.encoding, t.encoding) + t2 = s1.dup + t2.chomp!(s2) + assert_equal(t, t2) + } + end + + def test_str_chop + STRINGS.each {|s| + s = s.dup + desc = "#{encdump s}.chop" + if !s.valid_encoding? + #assert_raise(ArgumentError, desc) { s.chop } + begin + s.chop + rescue ArgumentError + e = $! + end + next if e + end + t = nil + assert_nothing_raised(desc) { t = s.chop } + assert(t.valid_encoding?) if s.valid_encoding? + assert(a(s).index(a(t))) + t2 = s.dup + t2.chop! + assert_equal(t, t2) + } + end + + def test_str_clear + STRINGS.each {|s| + t = s.dup + t.clear + assert(t.valid_encoding?) + assert(t.empty?) + } + end + + def test_str_clone + STRINGS.each {|s| + t = s.clone + assert_equal(s, t) + assert_equal(s.encoding, t.encoding) + assert_equal(a(s), a(t)) + } + end + + def test_str_dup + STRINGS.each {|s| + t = s.dup + assert_equal(s, t) + assert_equal(s.encoding, t.encoding) + assert_equal(a(s), a(t)) + } + end + + def test_str_count + combination(STRINGS, STRINGS) {|s1, s2| + if !s1.valid_encoding? || !s2.valid_encoding? + assert_raise(ArgumentError) { s1.count(s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.count(s2) } + next + end + n = s1.count(s2) + n0 = a(s1).count(a(s2)) + assert_operator(n, :<=, n0) + } + end + + def test_str_crypt + combination(STRINGS, STRINGS) {|str, salt| + if a(salt).length < 2 + assert_raise(ArgumentError) { str.crypt(salt) } + next + end + t = str.crypt(salt) + assert_equal(a(str).crypt(a(salt)), t) + assert_encoding('ASCII-8BIT', t.encoding) + } + end + + def test_str_delete + combination(STRINGS, STRINGS) {|s1, s2| + if !s1.valid_encoding? || !s2.valid_encoding? + assert_raise(ArgumentError) { s1.delete(s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.delete(s2) } + next + end + t = s1.delete(s2) + assert(t.valid_encoding?) + assert_equal(t.encoding, s1.encoding) + assert_operator(t.length, :<=, s1.length) + t2 = s1.dup + t2.delete!(s2) + assert_equal(t, t2) + } + end + + def test_str_downcase + STRINGS.each {|s| + if !s.valid_encoding? + assert_raise(ArgumentError) { s.downcase } + next + end + t = s.downcase + assert(t.valid_encoding?) + assert_equal(t.encoding, s.encoding) + assert(t.casecmp(s)) + t2 = s.dup + t2.downcase! + assert_equal(t, t2) + } + end + + def test_str_dump + STRINGS.each {|s| + t = s.dump + assert(t.valid_encoding?) + assert(t.ascii_only?) + u = eval(t) + assert_equal(a(s), a(u)) + } + end + + def test_str_each_line + combination(STRINGS, STRINGS) {|s1, s2| + if !s1.valid_encoding? || !s2.valid_encoding? + assert_raise(ArgumentError) { s1.each_line(s2) {} } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.each_line(s2) {} } + next + end + lines = [] + s1.each_line(s2) {|line| + assert(line.valid_encoding?) + assert_equal(s1.encoding, line.encoding) + lines << line + } + next if lines.size == 0 + s2 = lines.join('') + assert_equal(s1.encoding, s2.encoding) + assert_equal(s1, s2) + } + end + + def test_str_each_byte + STRINGS.each {|s| + bytes = [] + s.each_byte {|b| + bytes << b + } + a(s).split(//).each_with_index {|ch, i| + assert_equal(ch.ord, bytes[i]) + } + } + end + + def test_str_empty? + STRINGS.each {|s| + if s.length == 0 + assert(s.empty?) + else + assert(!s.empty?) + end + } + end + + def test_str_hex + STRINGS.each {|s| + t = s.hex + t2 = a(s)[/\A[0-9a-fA-Fx]*/].hex + assert_equal(t2, t) + } + end + + def test_str_include? + combination(STRINGS, STRINGS) {|s1, s2| + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.include?(s2) } + assert_raise(ArgumentError) { s1.index(s2) } + assert_raise(ArgumentError) { s1.rindex(s2) } + next + end + t = s1.include?(s2) + if t + assert(a(s1).include?(a(s2))) + assert(s1.index(s2)) + assert(s1.rindex(s2)) + else + assert(!s1.index(s2)) + assert(!s1.rindex(s2), "!#{encdump(s1)}.rindex(#{encdump(s2)})") + end + if s2.empty? + assert_equal(true, t) + next + end + if !s1.valid_encoding? || !s2.valid_encoding? + assert_equal(false, t, "#{encdump s1}.include?(#{encdump s2})") + next + end + if t && s1.valid_encoding? && s2.valid_encoding? + assert_match(/#{Regexp.escape(s2)}/, s1) + else + assert_no_match(/#{Regexp.escape(s2)}/, s1) + end + } + end + + def test_str_index + combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos| + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.index(s2) } + next + end + t = s1.index(s2, pos) + if s2.empty? + if pos < 0 && pos+s1.length < 0 + assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); + elsif pos < 0 + assert_equal(s1.length+pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); + elsif s1.length < pos + assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); + else + assert_equal(pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); + end + next + end + if !s1.valid_encoding? || !s2.valid_encoding? + assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})"); + next + end + if t + re = /#{Regexp.escape(s2)}/ + assert(re.match(s1, pos)) + assert_equal($`.length, t, "#{encdump s1}.index(#{encdump s2}, #{pos})") + else + assert_no_match(/#{Regexp.escape(s2)}/, s1[pos..-1]) + end + } + end + + def test_str_rindex + combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos| + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.rindex(s2) } + next + end + t = s1.rindex(s2, pos) + if s2.empty? + if pos < 0 && pos+s1.length < 0 + assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") + elsif pos < 0 + assert_equal(s1.length+pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") + elsif s1.length < pos + assert_equal(s1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") + else + assert_equal(pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") + end + next + end + if !s1.valid_encoding? || !s2.valid_encoding? + assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") + next + end + if t + #puts "#{encdump s1}.rindex(#{encdump s2}, #{pos}) => #{t}" + assert(a(s1).index(a(s2))) + pos2 = pos + pos2 += s1.length if pos < 0 + re = /\A(.{0,#{pos2}})#{Regexp.escape(s2)}/m + assert(re.match(s1), "#{re.inspect}.match(#{encdump(s1)})") + assert_equal($1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})") + else + re = /#{Regexp.escape(s2)}/ + n = re =~ s1 + if n + if pos < 0 + assert_operator(n, :>, s1.length+pos) + else + assert_operator(n, :>, pos) + end + end + end + } + end + + def test_str_insert + combination(STRINGS, 0..2, STRINGS) {|s1, nth, s2| + t1 = s1.dup + t2 = s1.dup + begin + t1[nth, 0] = s2 + rescue ArgumentError, IndexError => e1 + end + begin + t2.insert(nth, s2) + rescue ArgumentError, IndexError => e2 + end + assert_equal(t1, t2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t") + assert_equal(e1.class, e2.class, "begin #{encdump s1}.insert(#{nth},#{encdump s2}); rescue ArgumentError, IndexError => e; e end") + } + combination(STRINGS, -2..-1, STRINGS) {|s1, nth, s2| + next if s1.length + nth < 0 + next unless s1.valid_encoding? + next unless s2.valid_encoding? + t1 = s1.dup + begin + t1.insert(nth, s2) + slen = s2.length + assert_equal(t1[nth-slen+1,slen], s2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t") + rescue ArgumentError, IndexError => e + end + } + end + + def test_str_intern + STRINGS.each {|s| + if /\0/ =~ a(s) + assert_raise(ArgumentError) { s.intern } + else + sym = s.intern + assert_equal(s, sym.to_s) + end + } + end + + def test_str_length + STRINGS.each {|s| + assert_operator(s.length, :<=, s.bytesize) + } + end + + def test_str_oct + STRINGS.each {|s| + t = s.oct + t2 = a(s)[/\A[0-9a-fA-FxXbB]*/].oct + assert_equal(t2, t) + } + end + + def test_str_replace + combination(STRINGS, STRINGS) {|s1, s2| + t = s1.dup + t.replace s2 + assert_equal(s2, t) + assert_equal(s2.encoding, t.encoding) + } + end + + def test_str_reverse + STRINGS.each {|s| + t = s.reverse + assert_equal(s.bytesize, t.bytesize) + if !s.valid_encoding? + assert_operator(t.length, :<=, s.length) + next + end + assert_equal(s, t.reverse) + } + end + + def test_str_scan + combination(STRINGS, STRINGS) {|s1, s2| + if !s2.valid_encoding? + assert_raise(RegexpError) { s1.scan(s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.scan(s2) } + next + end + if !s1.valid_encoding? + assert_raise(ArgumentError) { s1.scan(s2) } + next + end + r = s1.scan(s2) + r.each {|t| + assert_equal(s2, t) + } + } + end + + def test_str_slice + each_slice_call {|obj, *args| + assert_same_result(lambda { obj[*args] }, lambda { obj.slice(*args) }) + } + end + + def test_str_slice! + each_slice_call {|s, *args| + t = s.dup + begin + r = t.slice!(*args) + rescue + e = $! + end + if e + assert_raise(e.class) { s.slice(*args) } + next + end + if !r + assert_nil(s.slice(*args)) + next + end + assert_equal(s.slice(*args), r) + assert_equal(s.bytesize, r.bytesize + t.bytesize) + if args.length == 1 && String === args[0] + assert_equal(args[0].encoding, r.encoding, + "#{encdump s}.slice!#{encdumpargs args}.encoding") + else + assert_equal(s.encoding, r.encoding, + "#{encdump s}.slice!#{encdumpargs args}.encoding") + end + if [s, *args].all? {|o| !(String === o) || o.valid_encoding? } + assert(r.valid_encoding?) + assert(t.valid_encoding?) + assert_equal(s.length, r.length + t.length) + end + } + end + + def test_str_split + combination(STRINGS, STRINGS) {|s1, s2| + if !s2.valid_encoding? + assert_raise(RegexpError) { s1.split(s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.split(s2) } + next + end + if !s1.valid_encoding? + assert_raise(ArgumentError) { s1.split(s2) } + next + end + t = s1.split(s2) + t.each {|r| + assert(a(s1).include?(a(r))) + assert_equal(s1.encoding, r.encoding) + } + assert(a(s1).include?(t.map {|u| a(u) }.join(a(s2)))) + if s1.valid_encoding? && s2.valid_encoding? + t.each {|r| + assert(r.valid_encoding?) + } + end + } + end + + def test_str_squeeze + combination(STRINGS, STRINGS) {|s1, s2| + if !s1.valid_encoding? || !s2.valid_encoding? + assert_raise(ArgumentError, "#{encdump s1}.squeeze(#{encdump s2})") { s1.squeeze(s2) } + next + end + if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding + assert_raise(ArgumentError) { s1.squeeze(s2) } + next + end + t = s1.squeeze(s2) + assert_operator(t.length, :<=, s1.length) + t2 = s1.dup + t2.squeeze!(s2) + assert_equal(t, t2) + } + end + + def test_str_strip + STRINGS.each {|s| + if !s.valid_encoding? + assert_raise(ArgumentError, "#{encdump s}.strip") { s.strip } + next + end + t = s.strip + l = s.lstrip + r = s.rstrip + assert_operator(l.length, :<=, s.length) + assert_operator(r.length, :<=, s.length) + assert_operator(t.length, :<=, l.length) + assert_operator(t.length, :<=, r.length) + t2 = s.dup + t2.strip! + assert_equal(t, t2) + l2 = s.dup + l2.lstrip! + assert_equal(l, l2) + r2 = s.dup + r2.rstrip! + assert_equal(r, r2) + } + end + + def test_str_sum + STRINGS.each {|s| + assert_equal(a(s).sum, s.sum) + } + end + + def test_str_swapcase + STRINGS.each {|s| + if !s.valid_encoding? + assert_raise(ArgumentError, "#{encdump s}.swapcase") { s.swapcase } + next + end + t1 = s.swapcase + assert(t1.valid_encoding?) if s.valid_encoding? + assert(t1.casecmp(s)) + t2 = s.dup + t2.swapcase! + assert_equal(t1, t2) + t3 = t1.swapcase + assert_equal(s, t3); + } + end + + + def test_str_to_f + STRINGS.each {|s| + assert_nothing_raised { s.to_f } + } + end + + def test_str_to_i + STRINGS.each {|s| + assert_nothing_raised { s.to_i } + 2.upto(36) {|radix| + assert_nothing_raised { s.to_i(radix) } + } + } + end + + def test_str_to_s + STRINGS.each {|s| + assert_same(s, s.to_s) + assert_same(s, s.to_str) + } + end + + def test_tr + combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| + desc = "#{encdump s1}.tr(#{encdump s2}, #{encdump s3})" + if s1.empty? + assert_equal(s1, s1.tr(s2, s3), desc) + next + end + if !str_enc_compatible?(s1, s2, s3) + assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } + next + end + if !s1.valid_encoding? + assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } + next + end + if s2.empty? + assert_equal(s1, s1.tr(s2, s3), desc) + next + end + if !s2.valid_encoding? || !s3.valid_encoding? + assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } + next + end + t = s1.tr(s2, s3) + assert_operator(s1.length, :>=, t.length, desc) + } + end + + def test_tr_s + combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| + desc = "#{encdump s1}.tr_s(#{encdump s2}, #{encdump s3})" + if s1.empty? + assert_equal(s1, s1.tr_s(s2, s3), desc) + next + end + if !s1.valid_encoding? + assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) } + next + end + if !str_enc_compatible?(s1, s2, s3) + assert_raise(ArgumentError, desc) { s1.tr(s2, s3) } + next + end + if s2.empty? + assert_equal(s1, s1.tr_s(s2, s3), desc) + next + end + if !s2.valid_encoding? || !s3.valid_encoding? + assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) } + next + end + + t = nil + assert_nothing_raised(desc) { t = s1.tr_s(s1, s3) } + assert_operator(s1.length, :>=, t.length, desc) + } + end + + def test_str_upcase + STRINGS.each {|s| + desc = "#{encdump s}.upcase" + if !s.valid_encoding? + assert_raise(ArgumentError, desc) { s.upcase } + next + end + t1 = s.upcase + assert(t1.valid_encoding?) + assert(t1.casecmp(s)) + t2 = s.dup + t2.upcase! + assert_equal(t1, t2) + } + end + + def test_str_succ + starts = [ + e("\xA1\xA1"), + e("\xFE\xFE") + ] + STRINGS.each {|s0| + next if s0.empty? + s = s0.dup + n = 1000 + h = {} + n.times {|i| + if h[s] + assert(false, "#{encdump s} cycle with succ! #{i-h[s]} times") + end + h[s] = i + assert_operator(s.length, :<=, s0.length + Math.log2(i+1) + 1, "#{encdump s0} succ! #{i} times => #{encdump s}") + s.succ! + } + } + end + + def test_str_hash + combination(STRINGS, STRINGS) {|s1, s2| + if s1.eql?(s2) + assert_equal(s1.hash, s2.hash, "#{encdump s1}.hash == #{encdump s2}.dump") + end + } + end + + def test_marshal + STRINGS.each {|s| + m = Marshal.dump(s) + t = Marshal.load(m) + assert_equal(s, t) + } + end + + def test_str_sub + combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| + if !s2.valid_encoding? + assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) } + next + end + r2 = Regexp.new(Regexp.escape(s2)) + [ + [ + "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { s1.sub(r2, s3) } + ], + [ + "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { s1.sub(r2) { s3 } } + ], + [ + "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { s1.gsub(r2, s3) } + ], + [ + "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { s1.gsub(r2) { s3 } } + ] + ].each {|desc, doit| + if !s1.valid_encoding? + assert_raise(ArgumentError, desc) { doit.call } + next + end + if !str_enc_compatible?(s1, s2) + assert_raise(ArgumentError, desc) { doit.call } + next + end + if !s1.include?(s2) + assert_equal(s1, doit.call) + next + end + if !str_enc_compatible?(s1, s3) + assert_raise(ArgumentError, desc) { doit.call } + next + end + t = nil + assert_nothing_raised(desc) { + t = doit.call + } + if s2 == s3 + assert_equal(s1, t, desc) + else + assert_not_equal(s1, t, desc) + end + } + } + end + + def test_str_sub! + combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3| + if !s2.valid_encoding? + assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) } + next + end + r2 = Regexp.new(Regexp.escape(s2)) + [ + [ + "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { t=s1.dup; [t, t.sub!(r2, s3)] } + ], + [ + "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { t=s1.dup; [t, t.sub!(r2) { s3 }] } + ], + [ + "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { t=s1.dup; [t, t.gsub!(r2, s3)] } + ], + [ + "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})", + lambda { t=s1.dup; [t, t.gsub!(r2) { s3 }] } + ] + ].each {|desc, doit| + if !s1.valid_encoding? + assert_raise(ArgumentError, desc) { doit.call } + next + end + if !str_enc_compatible?(s1, s2) + assert_raise(ArgumentError, desc) { doit.call } + next + end + if !s1.include?(s2) + assert_equal([s1, nil], doit.call) + next + end + if !str_enc_compatible?(s1, s3) + assert_raise(ArgumentError, desc) { doit.call } + next + end + t = ret = nil + assert_nothing_raised(desc) { + t, ret = doit.call + } + assert(ret) + if s2 == s3 + assert_equal(s1, t, desc) + else + assert_not_equal(s1, t, desc) + end + } + } + end + +end Property changes on: test/ruby/test_m17n_comb.rb ___________________________________________________________________ Name: svn:keywords + Author Date Id Revision Name: svn:eol-style + LF -- ML: ruby-changes@q... Info: http://www.atdot.net/~ko1/quickml