aboutsummaryrefslogtreecommitdiffstats
path: root/test
diff options
context:
space:
mode:
authorakr <akr@b2dd03c8-39d4-4d8f-98ff-823fe69b080e>2008-01-05 19:14:24 +0000
committerakr <akr@b2dd03c8-39d4-4d8f-98ff-823fe69b080e>2008-01-05 19:14:24 +0000
commitb3b0fa3e85afd845ea85f420398b41c739300486 (patch)
tree93eaa91d020a88b43825dd0f6e1b1de539641ec4 /test
parent1347a9a7e03fded7881a4c4fa40fe843edfaf5f1 (diff)
downloadruby-b3b0fa3e85afd845ea85f420398b41c739300486.tar.gz
split combinational tests.
git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@14901 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
Diffstat (limited to 'test')
-rw-r--r--test/ruby/test_m17n.rb1281
-rw-r--r--test/ruby/test_m17n_comb.rb1434
2 files changed, 1434 insertions, 1281 deletions
diff --git a/test/ruby/test_m17n.rb b/test/ruby/test_m17n.rb
index b86b14658d..5d5b183c67 100644
--- a/test/ruby/test_m17n.rb
+++ b/test/ruby/test_m17n.rb
@@ -78,50 +78,6 @@ class TestM17N < Test::Unit::TestCase
assert_regexp_fixed_encoding(r)
end
- STRINGS = [
- a(""), e(""), s(""), u(""),
- a("a"), e("a"), s("a"), u("a"),
- a("."), e("."), s("."), u("."),
-
- # single character
- a("\x80"), a("\xff"),
- e("\xa1\xa1"), e("\xfe\xfe"),
- e("\x8e\xa1"), e("\x8e\xfe"),
- e("\x8f\xa1\xa1"), e("\x8f\xfe\xfe"),
- s("\x81\x40"), s("\xfc\xfc"),
- s("\xa1"), s("\xdf"),
- u("\xc2\x80"), u("\xf4\x8f\xbf\xbf"),
-
- # same byte sequence
- a("\xc2\xa1"), e("\xc2\xa1"), s("\xc2\xa1"), u("\xc2\xa1"),
-
- s("\x81A"), # mutibyte character which contains "A"
- s("\x81a"), # mutibyte character which contains "a"
-
- # invalid
- e("\xa1"), e("\x80"),
- s("\x81"), s("\x80"),
- u("\xc2"), u("\x80"),
-
- # for transitivity test
- u("\xe0\xa0\xa1"),
- e("\xe0\xa0\xa1"),
- s("\xe0\xa0\xa1"),
- ]
-
- def combination(*args)
- if args.empty?
- yield []
- else
- arg = args.shift
- arg.each {|v|
- combination(*args) {|vs|
- yield [v, *vs]
- }
- }
- end
- end
-
def encdump(str)
"#{str.dump}.force_encoding(#{str.encoding.name.dump})"
end
@@ -164,34 +120,6 @@ class TestM17N < Test::Unit::TestCase
end
end
- def each_slice_call
- combination(STRINGS, -2..2) {|s, nth|
- yield s, nth
- }
- combination(STRINGS, -2..2, 0..2) {|s, nth, len|
- yield s, nth, len
- }
- combination(STRINGS, STRINGS) {|s, substr|
- yield s, substr
- }
- combination(STRINGS, -2..2, 0..2) {|s, first, last|
- yield s, first..last
- yield s, first...last
- }
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s2.valid_encoding?
- next
- end
- yield s1, Regexp.new(Regexp.escape(s2))
- }
- combination(STRINGS, STRINGS, 0..2) {|s1, s2, nth|
- if !s2.valid_encoding?
- next
- end
- yield s1, Regexp.new(Regexp.escape(s2)), nth
- }
- end
-
def str_enc_compatible?(*strs)
encs = []
strs.each {|s|
@@ -669,36 +597,6 @@ class TestM17N < Test::Unit::TestCase
assert_equal(Encoding::ASCII_8BIT, s.encoding)
end
- def test_str_new
- STRINGS.each {|s|
- t = String.new(s)
- assert_strenc(a(s), s.encoding, t)
- }
- end
-
- def test_str_plus
- combination(STRINGS, STRINGS) {|s1, s2|
- if s1.encoding != s2.encoding && !s1.ascii_only? && !s2.ascii_only?
- assert_raise(ArgumentError) { s1 + s2 }
- else
- t = s1 + s2
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert_equal(a(s1) + a(s2), a(t))
- assert_str_enc_propagation(t, s1, s2)
- end
- }
- end
-
- def test_str_times
- STRINGS.each {|s|
- [0,1,2].each {|n|
- t = s * n
- assert(t.valid_encoding?) if s.valid_encoding?
- assert_strenc(a(s) * n, s.encoding, t)
- }
- }
- end
-
def test_sprintf_c
assert_strenc("\x80", 'ASCII-8BIT', a("%c") % 128)
#assert_raise(ArgumentError) { a("%c") % 0xc2a1 }
@@ -710,15 +608,6 @@ class TestM17N < Test::Unit::TestCase
assert_strenc("\u{c2}", 'UTF-8', u("%c") % 0xc2)
end
- def test_sprintf_s
- STRINGS.each {|s|
- assert_strenc(a(s), s.encoding, "%s".force_encoding(s.encoding) % s)
- if !s.empty? # xxx
- assert_strenc(a(s), s.encoding, a("%s") % s)
- end
- }
- end
-
def test_sprintf_p
assert_strenc('""', 'ASCII-8BIT', a("%p") % a(""))
assert_strenc('""', 'EUC-JP', e("%p") % e(""))
@@ -741,67 +630,12 @@ class TestM17N < Test::Unit::TestCase
assert_strenc('"\x00"', 'UTF-8', u("%p") % u("\x00"))
end
- def test_str_eq_reflexive
- STRINGS.each {|s|
- assert(s == s, "#{encdump s} == #{encdump s}")
- }
- end
-
- def test_str_eq_symmetric
- combination(STRINGS, STRINGS) {|s1, s2|
- if s1 == s2
- assert(s2 == s1, "#{encdump s2} == #{encdump s1}")
- else
- assert(!(s2 == s1), "!(#{encdump s2} == #{encdump s1})")
- end
- }
- end
-
- def test_str_eq_transitive
- combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
- if s1 == s2 && s2 == s3
- assert(s1 == s3, "transitive: #{encdump s1} == #{encdump s2} == #{encdump s3}")
- end
- }
- end
-
- def test_str_eq
- combination(STRINGS, STRINGS) {|s1, s2|
- desc_eq = "#{encdump s1} == #{encdump s2}"
- if s1.ascii_only? && s2.ascii_only? && a(s1) == a(s2)
- assert(s1 == s2, desc_eq)
- elsif s1.encoding == s2.encoding && a(s1) == a(s2)
- assert(s1 == s2, desc_eq)
- assert(!(s1 != s2))
- assert_equal(0, s1 <=> s2)
- else
- assert(!(s1 == s2), "!(#{desc_eq})")
- assert(s1 != s2)
- assert_not_equal(0, s1 <=> s2)
- end
- }
- end
-
def test_str_lt
assert(a("a") < a("\xa1"))
assert(a("a") < s("\xa1"))
assert(s("a") < a("\xa1"))
end
- def test_str_concat
- combination(STRINGS, STRINGS) {|s1, s2|
- s = s1.dup
- if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
- s << s2
- assert(s.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert_equal(a(s), a(s1) + a(s2))
- assert_str_enc_propagation(s, s1, s2)
- else
- assert_raise(ArgumentError) { s << s2 }
- end
- }
- end
-
def test_str_aref
assert_equal(a("\xc2"), a("\xc2\xa1")[0])
assert_equal(a("\xa1"), a("\xc2\xa1")[1])
@@ -813,17 +647,6 @@ class TestM17N < Test::Unit::TestCase
assert_equal(nil, s("\xc2\xa1")[2])
assert_equal(u("\xc2\xa1"), u("\xc2\xa1")[0])
assert_equal(nil, u("\xc2\xa1")[1])
-
- STRINGS.each {|s|
- t = ''
- 0.upto(s.length-1) {|i|
- u = s[i]
- assert(u.valid_encoding?) if s.valid_encoding?
- t << u
- }
- assert_equal(t, s)
- }
-
end
def test_str_aref_len
@@ -838,26 +661,6 @@ class TestM17N < Test::Unit::TestCase
assert_equal(u("\xc2\xa2"), u("\xc2\xa1\xc2\xa2\xc2\xa3")[1, 1])
assert_equal(u("\xc2\xa2\xc2\xa3"), u("\xc2\xa1\xc2\xa2\xc2\xa3")[1, 2])
-
- STRINGS.each {|s|
- t = ''
- 0.upto(s.length-1) {|i|
- u = s[i,1]
- assert(u.valid_encoding?) if s.valid_encoding?
- t << u
- }
- assert_equal(t, s)
- }
-
- STRINGS.each {|s|
- t = ''
- 0.step(s.length-1, 2) {|i|
- u = s[i,2]
- assert(u.valid_encoding?) if s.valid_encoding?
- t << u
- }
- assert_equal(t, s)
- }
end
def test_str_aref_substr
@@ -872,810 +675,10 @@ class TestM17N < Test::Unit::TestCase
assert_equal(nil, u("\xc2\xa1\xc2\xa2\xc2\xa3")[u("\xa1\xc2")])
assert_raise(ArgumentError) { u("\xc2\xa1\xc2\xa2\xc2\xa3")[a("\xa1\xc2")] }
-
- combination(STRINGS, STRINGS) {|s1, s2|
- if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
- t = s1[s2]
- if t != nil
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert_equal(s2, t)
- assert_match(/#{Regexp.escape(a(s2))}/, a(s1))
- if s1.valid_encoding?
- assert_match(/#{Regexp.escape(s2)}/, s1)
- end
- end
- else
- assert_raise(ArgumentError) { s1[s2] }
- end
- }
- end
-
- def test_str_aref_range2
- combination(STRINGS, -2..2, -2..2) {|s, first, last|
- t = s[first..last]
- if first < 0
- first += s.length
- if first < 0
- assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
- next
- end
- end
- if s.length < first
- assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
- next
- end
- assert(t.valid_encoding?) if s.valid_encoding?
- if last < 0
- last += s.length
- end
- t2 = ''
- first.upto(last) {|i|
- c = s[i]
- t2 << c if c
- }
- assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]")
- }
- end
-
- def test_str_aref_range3
- combination(STRINGS, -2..2, -2..2) {|s, first, last|
- t = s[first...last]
- if first < 0
- first += s.length
- if first < 0
- assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
- next
- end
- end
- if s.length < first
- assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
- next
- end
- if last < 0
- last += s.length
- end
- assert(t.valid_encoding?) if s.valid_encoding?
- t2 = ''
- first.upto(last-1) {|i|
- c = s[i]
- t2 << c if c
- }
- assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]")
- }
- end
-
- def test_str_assign
- combination(STRINGS, STRINGS) {|s1, s2|
- (-2).upto(2) {|i|
- t = s1.dup
- if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
- if i < -s1.length || s1.length < i
- assert_raise(IndexError) { t[i] = s2 }
- else
- t[i] = s2
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert(a(t).index(a(s2)))
- if s1.valid_encoding? && s2.valid_encoding?
- if i == s1.length && s2.empty?
- assert_nil(t[i])
- elsif i < 0
- assert_equal(s2, t[i-s2.length+1,s2.length],
- "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i-s2.length+1},#{s2.length}]")
- else
- assert_equal(s2, t[i,s2.length],
- "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i},#{s2.length}]")
- end
- end
- end
- else
- assert_raise(ArgumentError) { t[i] = s2 }
- end
- }
- }
- end
-
- def test_str_assign_len
- combination(STRINGS, -2..2, 0..2, STRINGS) {|s1, i, len, s2|
- t = s1.dup
- if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
- if i < -s1.length || s1.length < i
- assert_raise(IndexError) { t[i,len] = s2 }
- else
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- t[i,len] = s2
- assert(a(t).index(a(s2)))
- if s1.valid_encoding? && s2.valid_encoding?
- if i == s1.length && s2.empty?
- assert_nil(t[i])
- elsif i < 0
- if -i < len
- len = -i
- end
- assert_equal(s2, t[i-s2.length+len,s2.length],
- "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i-s2.length+len},#{s2.length}]")
- else
- assert_equal(s2, t[i,s2.length],
- "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i},#{s2.length}]")
- end
- end
- end
- else
- assert_raise(ArgumentError) { t[i,len] = s2 }
- end
- }
- end
-
- def test_str_assign_substr
- combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
- t = s1.dup
- encs = [
- !s1.ascii_only? ? s1.encoding : nil,
- !s2.ascii_only? ? s2.encoding : nil,
- !s3.ascii_only? ? s3.encoding : nil].uniq.compact
- if 1 < encs.length
- assert_raise(ArgumentError, IndexError) { t[s2] = s3 }
- else
- if encs.empty?
- encs = [
- s1.encoding,
- s2.encoding,
- s3.encoding].uniq.reject {|e| e == Encoding.find("ASCII-8BIT") }
- if encs.empty?
- encs = [Encoding.find("ASCII-8BIT")]
- end
- end
- if !t[s2]
- else
- t[s2] = s3
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? && s3.valid_encoding?
- end
- end
- }
- end
-
- def test_str_assign_range2
- combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2|
- t = s1.dup
- if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
- if first < -s1.length || s1.length < first
- assert_raise(RangeError) { t[first..last] = s2 }
- else
- t[first..last] = s2
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert(a(t).index(a(s2)))
- if s1.valid_encoding? && s2.valid_encoding?
- if first < 0
- assert_equal(s2, t[s1.length+first, s2.length])
- else
- assert_equal(s2, t[first, s2.length])
- end
- end
- end
- else
- assert_raise(ArgumentError, RangeError,
- "t=#{encdump(s1)};t[#{first}..#{last}]=#{encdump(s2)}") {
- t[first..last] = s2
- }
- end
- }
- end
-
- def test_str_assign_range3
- combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2|
- t = s1.dup
- if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
- if first < -s1.length || s1.length < first
- assert_raise(RangeError) { t[first...last] = s2 }
- else
- t[first...last] = s2
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert(a(t).index(a(s2)))
- if s1.valid_encoding? && s2.valid_encoding?
- if first < 0
- assert_equal(s2, t[s1.length+first, s2.length])
- else
- assert_equal(s2, t[first, s2.length])
- end
- end
- end
- else
- assert_raise(ArgumentError, RangeError,
- "t=#{encdump(s1)};t[#{first}...#{last}]=#{encdump(s2)}") {
- t[first...last] = s2
- }
- end
- }
- end
-
- def test_str_cmp
- combination(STRINGS, STRINGS) {|s1, s2|
- desc = "#{encdump s1} <=> #{encdump s2}"
- r = s1 <=> s2
- if s1 == s2
- assert_equal(0, r, desc)
- else
- assert_not_equal(0, r, desc)
- end
- }
- end
-
- def test_str_capitalize
- STRINGS.each {|s|
- begin
- t1 = s.capitalize
- rescue ArgumentError
- assert(!s.valid_encoding?)
- next
- end
- assert(t1.valid_encoding?) if s.valid_encoding?
- assert(t1.casecmp(s))
- t2 = s.dup
- t2.capitalize!
- assert_equal(t1, t2)
- assert_equal(s.downcase.sub(/\A[a-z]/) {|ch| a(ch).upcase }, t1)
- }
- end
-
- def test_str_casecmp
- combination(STRINGS, STRINGS) {|s1, s2|
- #puts "#{encdump(s1)}.casecmp(#{encdump(s2)})"
- begin
- r = s1.casecmp(s2)
- rescue ArgumentError
- assert(!s1.valid_encoding? || !s2.valid_encoding?)
- next
- end
- #assert_equal(s1.upcase <=> s2.upcase, r)
- }
end
def test_str_center
assert_encoding("EUC-JP", "a".center(5, "\xa1\xa2".force_encoding("euc-jp")).encoding)
-
- combination(STRINGS, [0,1,2,3,10]) {|s1, width|
- t = s1.center(width)
- assert(a(t).index(a(s1)))
- }
- combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2|
- if s2.empty?
- assert_raise(ArgumentError) { s1.center(width, s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.center(width, s2) }
- next
- end
- t = s1.center(width, s2)
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert(a(t).index(a(s1)))
- assert_str_enc_propagation(t, s1, s2) if (t != s1)
- }
- end
-
- def test_str_ljust
- combination(STRINGS, [0,1,2,3,10]) {|s1, width|
- t = s1.ljust(width)
- assert(a(t).index(a(s1)))
- }
- combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2|
- if s2.empty?
- assert_raise(ArgumentError) { s1.ljust(width, s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.ljust(width, s2) }
- next
- end
- t = s1.ljust(width, s2)
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert(a(t).index(a(s1)))
- assert_str_enc_propagation(t, s1, s2) if (t != s1)
- }
- end
-
- def test_str_rjust
- combination(STRINGS, [0,1,2,3,10]) {|s1, width|
- t = s1.rjust(width)
- assert(a(t).index(a(s1)))
- }
- combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2|
- if s2.empty?
- assert_raise(ArgumentError) { s1.rjust(width, s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.rjust(width, s2) }
- next
- end
- t = s1.rjust(width, s2)
- assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
- assert(a(t).index(a(s1)))
- assert_str_enc_propagation(t, s1, s2) if (t != s1)
- }
- end
-
- def test_str_chomp
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.chomp(s2) }
- next
- end
- t = s1.chomp(s2)
- assert(t.valid_encoding?, "#{encdump(s1)}.chomp(#{encdump(s2)})") if s1.valid_encoding? && s2.valid_encoding?
- assert_equal(s1.encoding, t.encoding)
- t2 = s1.dup
- t2.chomp!(s2)
- assert_equal(t, t2)
- }
- end
-
- def test_str_chop
- STRINGS.each {|s|
- s = s.dup
- desc = "#{encdump s}.chop"
- if !s.valid_encoding?
- #assert_raise(ArgumentError, desc) { s.chop }
- begin
- s.chop
- rescue ArgumentError
- e = $!
- end
- next if e
- end
- t = nil
- assert_nothing_raised(desc) { t = s.chop }
- assert(t.valid_encoding?) if s.valid_encoding?
- assert(a(s).index(a(t)))
- t2 = s.dup
- t2.chop!
- assert_equal(t, t2)
- }
- end
-
- def test_str_clear
- STRINGS.each {|s|
- t = s.dup
- t.clear
- assert(t.valid_encoding?)
- assert(t.empty?)
- }
- end
-
- def test_str_clone
- STRINGS.each {|s|
- t = s.clone
- assert_equal(s, t)
- assert_equal(s.encoding, t.encoding)
- assert_equal(a(s), a(t))
- }
- end
-
- def test_str_dup
- STRINGS.each {|s|
- t = s.dup
- assert_equal(s, t)
- assert_equal(s.encoding, t.encoding)
- assert_equal(a(s), a(t))
- }
- end
-
- def test_str_count
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_raise(ArgumentError) { s1.count(s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.count(s2) }
- next
- end
- n = s1.count(s2)
- n0 = a(s1).count(a(s2))
- assert_operator(n, :<=, n0)
- }
- end
-
- def test_str_crypt
- combination(STRINGS, STRINGS) {|str, salt|
- if a(salt).length < 2
- assert_raise(ArgumentError) { str.crypt(salt) }
- next
- end
- t = str.crypt(salt)
- assert_equal(a(str).crypt(a(salt)), t)
- assert_encoding('ASCII-8BIT', t.encoding)
- }
- end
-
- def test_str_delete
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_raise(ArgumentError) { s1.delete(s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.delete(s2) }
- next
- end
- t = s1.delete(s2)
- assert(t.valid_encoding?)
- assert_equal(t.encoding, s1.encoding)
- assert_operator(t.length, :<=, s1.length)
- t2 = s1.dup
- t2.delete!(s2)
- assert_equal(t, t2)
- }
- end
-
- def test_str_downcase
- STRINGS.each {|s|
- if !s.valid_encoding?
- assert_raise(ArgumentError) { s.downcase }
- next
- end
- t = s.downcase
- assert(t.valid_encoding?)
- assert_equal(t.encoding, s.encoding)
- assert(t.casecmp(s))
- t2 = s.dup
- t2.downcase!
- assert_equal(t, t2)
- }
- end
-
- def test_str_dump
- STRINGS.each {|s|
- t = s.dump
- assert(t.valid_encoding?)
- assert(t.ascii_only?)
- u = eval(t)
- assert_equal(a(s), a(u))
- }
- end
-
- def test_str_each_line
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_raise(ArgumentError) { s1.each_line(s2) {} }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.each_line(s2) {} }
- next
- end
- lines = []
- s1.each_line(s2) {|line|
- assert(line.valid_encoding?)
- assert_equal(s1.encoding, line.encoding)
- lines << line
- }
- next if lines.size == 0
- s2 = lines.join('')
- assert_equal(s1.encoding, s2.encoding)
- assert_equal(s1, s2)
- }
- end
-
- def test_str_each_byte
- STRINGS.each {|s|
- bytes = []
- s.each_byte {|b|
- bytes << b
- }
- a(s).split(//).each_with_index {|ch, i|
- assert_equal(ch.ord, bytes[i])
- }
- }
- end
-
- def test_str_empty?
- STRINGS.each {|s|
- if s.length == 0
- assert(s.empty?)
- else
- assert(!s.empty?)
- end
- }
- end
-
- def test_str_hex
- STRINGS.each {|s|
- t = s.hex
- t2 = a(s)[/\A[0-9a-fA-Fx]*/].hex
- assert_equal(t2, t)
- }
- end
-
- def test_str_include?
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.include?(s2) }
- assert_raise(ArgumentError) { s1.index(s2) }
- assert_raise(ArgumentError) { s1.rindex(s2) }
- next
- end
- t = s1.include?(s2)
- if t
- assert(a(s1).include?(a(s2)))
- assert(s1.index(s2))
- assert(s1.rindex(s2))
- else
- assert(!s1.index(s2))
- assert(!s1.rindex(s2), "!#{encdump(s1)}.rindex(#{encdump(s2)})")
- end
- if s2.empty?
- assert_equal(true, t)
- next
- end
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_equal(false, t, "#{encdump s1}.include?(#{encdump s2})")
- next
- end
- if t && s1.valid_encoding? && s2.valid_encoding?
- assert_match(/#{Regexp.escape(s2)}/, s1)
- else
- assert_no_match(/#{Regexp.escape(s2)}/, s1)
- end
- }
- end
-
- def test_str_index
- combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos|
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.index(s2) }
- next
- end
- t = s1.index(s2, pos)
- if s2.empty?
- if pos < 0 && pos+s1.length < 0
- assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
- elsif pos < 0
- assert_equal(s1.length+pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
- elsif s1.length < pos
- assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
- else
- assert_equal(pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
- end
- next
- end
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
- next
- end
- if t
- re = /#{Regexp.escape(s2)}/
- assert(re.match(s1, pos))
- assert_equal($`.length, t, "#{encdump s1}.index(#{encdump s2}, #{pos})")
- else
- assert_no_match(/#{Regexp.escape(s2)}/, s1[pos..-1])
- end
- }
- end
-
- def test_str_rindex
- combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos|
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.rindex(s2) }
- next
- end
- t = s1.rindex(s2, pos)
- if s2.empty?
- if pos < 0 && pos+s1.length < 0
- assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
- elsif pos < 0
- assert_equal(s1.length+pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
- elsif s1.length < pos
- assert_equal(s1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
- else
- assert_equal(pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
- end
- next
- end
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
- next
- end
- if t
- #puts "#{encdump s1}.rindex(#{encdump s2}, #{pos}) => #{t}"
- assert(a(s1).index(a(s2)))
- pos2 = pos
- pos2 += s1.length if pos < 0
- re = /\A(.{0,#{pos2}})#{Regexp.escape(s2)}/m
- assert(re.match(s1), "#{re.inspect}.match(#{encdump(s1)})")
- assert_equal($1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
- else
- re = /#{Regexp.escape(s2)}/
- n = re =~ s1
- if n
- if pos < 0
- assert_operator(n, :>, s1.length+pos)
- else
- assert_operator(n, :>, pos)
- end
- end
- end
- }
- end
-
- def test_str_insert
- combination(STRINGS, 0..2, STRINGS) {|s1, nth, s2|
- t1 = s1.dup
- t2 = s1.dup
- begin
- t1[nth, 0] = s2
- rescue ArgumentError, IndexError => e1
- end
- begin
- t2.insert(nth, s2)
- rescue ArgumentError, IndexError => e2
- end
- assert_equal(t1, t2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t")
- assert_equal(e1.class, e2.class, "begin #{encdump s1}.insert(#{nth},#{encdump s2}); rescue ArgumentError, IndexError => e; e end")
- }
- combination(STRINGS, -2..-1, STRINGS) {|s1, nth, s2|
- next if s1.length + nth < 0
- next unless s1.valid_encoding?
- next unless s2.valid_encoding?
- t1 = s1.dup
- begin
- t1.insert(nth, s2)
- slen = s2.length
- assert_equal(t1[nth-slen+1,slen], s2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t")
- rescue ArgumentError, IndexError => e
- end
- }
- end
-
- def test_str_intern
- STRINGS.each {|s|
- if /\0/ =~ a(s)
- assert_raise(ArgumentError) { s.intern }
- else
- sym = s.intern
- assert_equal(s, sym.to_s)
- end
- }
- end
-
- def test_str_length
- STRINGS.each {|s|
- assert_operator(s.length, :<=, s.bytesize)
- }
- end
-
- def test_str_oct
- STRINGS.each {|s|
- t = s.oct
- t2 = a(s)[/\A[0-9a-fA-FxXbB]*/].oct
- assert_equal(t2, t)
- }
- end
-
- def test_str_replace
- combination(STRINGS, STRINGS) {|s1, s2|
- t = s1.dup
- t.replace s2
- assert_equal(s2, t)
- assert_equal(s2.encoding, t.encoding)
- }
- end
-
- def test_str_reverse
- STRINGS.each {|s|
- t = s.reverse
- assert_equal(s.bytesize, t.bytesize)
- if !s.valid_encoding?
- assert_operator(t.length, :<=, s.length)
- next
- end
- assert_equal(s, t.reverse)
- }
- end
-
- def test_str_scan
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s2.valid_encoding?
- assert_raise(RegexpError) { s1.scan(s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.scan(s2) }
- next
- end
- if !s1.valid_encoding?
- assert_raise(ArgumentError) { s1.scan(s2) }
- next
- end
- r = s1.scan(s2)
- r.each {|t|
- assert_equal(s2, t)
- }
- }
- end
-
- def test_str_slice
- each_slice_call {|obj, *args|
- assert_same_result(lambda { obj[*args] }, lambda { obj.slice(*args) })
- }
- end
-
- def test_str_slice!
- each_slice_call {|s, *args|
- t = s.dup
- begin
- r = t.slice!(*args)
- rescue
- e = $!
- end
- if e
- assert_raise(e.class) { s.slice(*args) }
- next
- end
- if !r
- assert_nil(s.slice(*args))
- next
- end
- assert_equal(s.slice(*args), r)
- assert_equal(s.bytesize, r.bytesize + t.bytesize)
- if args.length == 1 && String === args[0]
- assert_equal(args[0].encoding, r.encoding,
- "#{encdump s}.slice!#{encdumpargs args}.encoding")
- else
- assert_equal(s.encoding, r.encoding,
- "#{encdump s}.slice!#{encdumpargs args}.encoding")
- end
- if [s, *args].all? {|o| !(String === o) || o.valid_encoding? }
- assert(r.valid_encoding?)
- assert(t.valid_encoding?)
- assert_equal(s.length, r.length + t.length)
- end
- }
- end
-
- def test_str_split
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s2.valid_encoding?
- assert_raise(RegexpError) { s1.split(s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.split(s2) }
- next
- end
- if !s1.valid_encoding?
- assert_raise(ArgumentError) { s1.split(s2) }
- next
- end
- t = s1.split(s2)
- t.each {|r|
- assert(a(s1).include?(a(r)))
- assert_equal(s1.encoding, r.encoding)
- }
- assert(a(s1).include?(t.map {|u| a(u) }.join(a(s2))))
- if s1.valid_encoding? && s2.valid_encoding?
- t.each {|r|
- assert(r.valid_encoding?)
- }
- end
- }
- end
-
- def test_str_squeeze
- combination(STRINGS, STRINGS) {|s1, s2|
- if !s1.valid_encoding? || !s2.valid_encoding?
- assert_raise(ArgumentError, "#{encdump s1}.squeeze(#{encdump s2})") { s1.squeeze(s2) }
- next
- end
- if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
- assert_raise(ArgumentError) { s1.squeeze(s2) }
- next
- end
- t = s1.squeeze(s2)
- assert_operator(t.length, :<=, s1.length)
- t2 = s1.dup
- t2.squeeze!(s2)
- assert_equal(t, t2)
- }
end
def test_squeeze
@@ -1683,77 +686,6 @@ class TestM17N < Test::Unit::TestCase
assert_equal("\xa3\xb0\xa3\xb1\xa3\xb3\xa3\xb4".force_encoding("euc-jp"), s.squeeze)
end
- def test_str_strip
- STRINGS.each {|s|
- if !s.valid_encoding?
- assert_raise(ArgumentError, "#{encdump s}.strip") { s.strip }
- next
- end
- t = s.strip
- l = s.lstrip
- r = s.rstrip
- assert_operator(l.length, :<=, s.length)
- assert_operator(r.length, :<=, s.length)
- assert_operator(t.length, :<=, l.length)
- assert_operator(t.length, :<=, r.length)
- t2 = s.dup
- t2.strip!
- assert_equal(t, t2)
- l2 = s.dup
- l2.lstrip!
- assert_equal(l, l2)
- r2 = s.dup
- r2.rstrip!
- assert_equal(r, r2)
- }
- end
-
- def test_str_sum
- STRINGS.each {|s|
- assert_equal(a(s).sum, s.sum)
- }
- end
-
- def test_str_swapcase
- STRINGS.each {|s|
- if !s.valid_encoding?
- assert_raise(ArgumentError, "#{encdump s}.swapcase") { s.swapcase }
- next
- end
- t1 = s.swapcase
- assert(t1.valid_encoding?) if s.valid_encoding?
- assert(t1.casecmp(s))
- t2 = s.dup
- t2.swapcase!
- assert_equal(t1, t2)
- t3 = t1.swapcase
- assert_equal(s, t3);
- }
- end
-
-
- def test_str_to_f
- STRINGS.each {|s|
- assert_nothing_raised { s.to_f }
- }
- end
-
- def test_str_to_i
- STRINGS.each {|s|
- assert_nothing_raised { s.to_i }
- 2.upto(36) {|radix|
- assert_nothing_raised { s.to_i(radix) }
- }
- }
- end
-
- def test_str_to_s
- STRINGS.each {|s|
- assert_same(s, s.to_s)
- assert_same(s, s.to_str)
- }
- end
-
def test_tr
s = "\x81\x41".force_encoding("shift_jis")
assert_equal(s.tr("A", "B"), s)
@@ -1766,109 +698,11 @@ class TestM17N < Test::Unit::TestCase
assert_equal("\xA1\xA1".force_encoding("EUC-JP"),
"a".force_encoding("ASCII-8BIT").tr("a".force_encoding("ASCII-8BIT"), "\xA1\xA1".force_encoding("EUC-JP")))
- combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
- desc = "#{encdump s1}.tr(#{encdump s2}, #{encdump s3})"
- if s1.empty?
- assert_equal(s1, s1.tr(s2, s3), desc)
- next
- end
- if !str_enc_compatible?(s1, s2, s3)
- assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
- next
- end
- if !s1.valid_encoding?
- assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
- next
- end
- if s2.empty?
- assert_equal(s1, s1.tr(s2, s3), desc)
- next
- end
- if !s2.valid_encoding? || !s3.valid_encoding?
- assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
- next
- end
- t = s1.tr(s2, s3)
- assert_operator(s1.length, :>=, t.length, desc)
- }
end
def test_tr_s
assert_equal("\xA1\xA1".force_encoding("EUC-JP"),
"a".force_encoding("ASCII-8BIT").tr("a".force_encoding("ASCII-8BIT"), "\xA1\xA1".force_encoding("EUC-JP")))
-
- combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
- desc = "#{encdump s1}.tr_s(#{encdump s2}, #{encdump s3})"
- if s1.empty?
- assert_equal(s1, s1.tr_s(s2, s3), desc)
- next
- end
- if !s1.valid_encoding?
- assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) }
- next
- end
- if !str_enc_compatible?(s1, s2, s3)
- assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
- next
- end
- if s2.empty?
- assert_equal(s1, s1.tr_s(s2, s3), desc)
- next
- end
- if !s2.valid_encoding? || !s3.valid_encoding?
- assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) }
- next
- end
-
- t = nil
- assert_nothing_raised(desc) { t = s1.tr_s(s1, s3) }
- assert_operator(s1.length, :>=, t.length, desc)
- }
- end
-
- def test_str_upcase
- STRINGS.each {|s|
- desc = "#{encdump s}.upcase"
- if !s.valid_encoding?
- assert_raise(ArgumentError, desc) { s.upcase }
- next
- end
- t1 = s.upcase
- assert(t1.valid_encoding?)
- assert(t1.casecmp(s))
- t2 = s.dup
- t2.upcase!
- assert_equal(t1, t2)
- }
- end
-
- def test_str_succ
- starts = [
- e("\xA1\xA1"),
- e("\xFE\xFE")
- ]
- STRINGS.each {|s0|
- next if s0.empty?
- s = s0.dup
- n = 1000
- h = {}
- n.times {|i|
- if h[s]
- assert(false, "#{encdump s} cycle with succ! #{i-h[s]} times")
- end
- h[s] = i
- assert_operator(s.length, :<=, s0.length + Math.log2(i+1) + 1, "#{encdump s0} succ! #{i} times => #{encdump s}")
- s.succ!
- }
- }
- end
-
- def test_str_hash
- combination(STRINGS, STRINGS) {|s1, s2|
- if s1.eql?(s2)
- assert_equal(s1.hash, s2.hash, "#{encdump s1}.hash == #{encdump s2}.dump")
- end
- }
end
def test_sub
@@ -1921,11 +755,6 @@ class TestM17N < Test::Unit::TestCase
end
def test_marshal
- STRINGS.each {|s|
- m = Marshal.dump(s)
- t = Marshal.load(m)
- assert_equal(s, t)
- }
end
def test_env
@@ -1934,114 +763,4 @@ class TestM17N < Test::Unit::TestCase
assert_equal(Encoding::ASCII_8BIT, v.encoding)
}
end
-
- def test_str_sub
- combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
- if !s2.valid_encoding?
- assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) }
- next
- end
- r2 = Regexp.new(Regexp.escape(s2))
- [
- [
- "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { s1.sub(r2, s3) }
- ],
- [
- "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { s1.sub(r2) { s3 } }
- ],
- [
- "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { s1.gsub(r2, s3) }
- ],
- [
- "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { s1.gsub(r2) { s3 } }
- ]
- ].each {|desc, doit|
- if !s1.valid_encoding?
- assert_raise(ArgumentError, desc) { doit.call }
- next
- end
- if !str_enc_compatible?(s1, s2)
- assert_raise(ArgumentError, desc) { doit.call }
- next
- end
- if !s1.include?(s2)
- assert_equal(s1, doit.call)
- next
- end
- if !str_enc_compatible?(s1, s3)
- assert_raise(ArgumentError, desc) { doit.call }
- next
- end
- t = nil
- assert_nothing_raised(desc) {
- t = doit.call
- }
- if s2 == s3
- assert_equal(s1, t, desc)
- else
- assert_not_equal(s1, t, desc)
- end
- }
- }
- end
-
- def test_str_sub!
- combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
- if !s2.valid_encoding?
- assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) }
- next
- end
- r2 = Regexp.new(Regexp.escape(s2))
- [
- [
- "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { t=s1.dup; [t, t.sub!(r2, s3)] }
- ],
- [
- "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { t=s1.dup; [t, t.sub!(r2) { s3 }] }
- ],
- [
- "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { t=s1.dup; [t, t.gsub!(r2, s3)] }
- ],
- [
- "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})",
- lambda { t=s1.dup; [t, t.gsub!(r2) { s3 }] }
- ]
- ].each {|desc, doit|
- if !s1.valid_encoding?
- assert_raise(ArgumentError, desc) { doit.call }
- next
- end
- if !str_enc_compatible?(s1, s2)
- assert_raise(ArgumentError, desc) { doit.call }
- next
- end
- if !s1.include?(s2)
- assert_equal([s1, nil], doit.call)
- next
- end
- if !str_enc_compatible?(s1, s3)
- assert_raise(ArgumentError, desc) { doit.call }
- next
- end
- t = ret = nil
- assert_nothing_raised(desc) {
- t, ret = doit.call
- }
- assert(ret)
- if s2 == s3
- assert_equal(s1, t, desc)
- else
- assert_not_equal(s1, t, desc)
- end
- }
- }
- end
-
end
diff --git a/test/ruby/test_m17n_comb.rb b/test/ruby/test_m17n_comb.rb
new file mode 100644
index 0000000000..b1928f3cd5
--- /dev/null
+++ b/test/ruby/test_m17n_comb.rb
@@ -0,0 +1,1434 @@
+require 'test/unit'
+require 'stringio'
+
+class TestM17NComb < Test::Unit::TestCase
+ def assert_encoding(encname, actual, message=nil)
+ assert_equal(Encoding.find(encname), actual, message)
+ end
+
+ module AESU
+ def a(str) str.dup.force_encoding("ASCII-8BIT") end
+ def e(str) str.dup.force_encoding("EUC-JP") end
+ def s(str) str.dup.force_encoding("Shift_JIS") end
+ def u(str) str.dup.force_encoding("UTF-8") end
+ end
+ include AESU
+ extend AESU
+
+ def assert_strenc(bytes, enc, actual, message=nil)
+ assert_instance_of(String, actual, message)
+ enc = Encoding.find(enc) if String === enc
+ assert_equal(enc, actual.encoding, message)
+ assert_equal(a(bytes), a(actual), message)
+ end
+
+ def assert_warning(pat, mesg=nil)
+ begin
+ org_stderr = $stderr
+ $stderr = StringIO.new(warn = '')
+ yield
+ ensure
+ $stderr = org_stderr
+ end
+ assert_match(pat, warn, mesg)
+ end
+
+ def assert_regexp_generic_encoding(r)
+ assert(!r.fixed_encoding?)
+ %w[ASCII-8BIT EUC-JP Shift_JIS UTF-8].each {|ename|
+ # "\xc2\xa1" is a valid sequence for ASCII-8BIT, EUC-JP, Shift_JIS and UTF-8.
+ assert_nothing_raised { r =~ "\xc2\xa1".force_encoding(ename) }
+ }
+ end
+
+ def assert_regexp_fixed_encoding(r)
+ assert(r.fixed_encoding?)
+ %w[ASCII-8BIT EUC-JP Shift_JIS UTF-8].each {|ename|
+ enc = Encoding.find(ename)
+ if enc == r.encoding
+ assert_nothing_raised { r =~ "\xc2\xa1".force_encoding(enc) }
+ else
+ assert_raise(ArgumentError) { r =~ "\xc2\xa1".force_encoding(enc) }
+ end
+ }
+ end
+
+ def assert_regexp_generic_ascii(r)
+ assert_encoding("ASCII-8BIT", r.encoding)
+ assert_regexp_generic_encoding(r)
+ end
+
+ def assert_regexp_fixed_ascii8bit(r)
+ assert_encoding("ASCII-8BIT", r.encoding)
+ assert_regexp_fixed_encoding(r)
+ end
+
+ def assert_regexp_fixed_eucjp(r)
+ assert_encoding("EUC-JP", r.encoding)
+ assert_regexp_fixed_encoding(r)
+ end
+
+ def assert_regexp_fixed_sjis(r)
+ assert_encoding("Shift_JIS", r.encoding)
+ assert_regexp_fixed_encoding(r)
+ end
+
+ def assert_regexp_fixed_utf8(r)
+ assert_encoding("UTF-8", r.encoding)
+ assert_regexp_fixed_encoding(r)
+ end
+
+ STRINGS = [
+ a(""), e(""), s(""), u(""),
+ a("a"), e("a"), s("a"), u("a"),
+ a("."), e("."), s("."), u("."),
+
+ # single character
+ a("\x80"), a("\xff"),
+ e("\xa1\xa1"), e("\xfe\xfe"),
+ e("\x8e\xa1"), e("\x8e\xfe"),
+ e("\x8f\xa1\xa1"), e("\x8f\xfe\xfe"),
+ s("\x81\x40"), s("\xfc\xfc"),
+ s("\xa1"), s("\xdf"),
+ u("\xc2\x80"), u("\xf4\x8f\xbf\xbf"),
+
+ # same byte sequence
+ a("\xc2\xa1"), e("\xc2\xa1"), s("\xc2\xa1"), u("\xc2\xa1"),
+
+ s("\x81A"), # mutibyte character which contains "A"
+ s("\x81a"), # mutibyte character which contains "a"
+
+ # invalid
+ e("\xa1"), e("\x80"),
+ s("\x81"), s("\x80"),
+ u("\xc2"), u("\x80"),
+
+ # for transitivity test
+ u("\xe0\xa0\xa1"),
+ e("\xe0\xa0\xa1"),
+ s("\xe0\xa0\xa1"),
+ ]
+
+ def combination(*args)
+ if args.empty?
+ yield []
+ else
+ arg = args.shift
+ arg.each {|v|
+ combination(*args) {|vs|
+ yield [v, *vs]
+ }
+ }
+ end
+ end
+
+ def encdump(str)
+ "#{str.dump}.force_encoding(#{str.encoding.name.dump})"
+ end
+
+ def encdumpargs(args)
+ r = '('
+ args.each_with_index {|a, i|
+ r << ',' if 0 < i
+ if String === a
+ r << encdump(a)
+ else
+ r << a.inspect
+ end
+ }
+ r << ')'
+ r
+ end
+
+ def assert_str_enc_propagation(t, s1, s2)
+ if !s1.ascii_only?
+ assert_equal(s1.encoding, t.encoding)
+ elsif !s2.ascii_only?
+ assert_equal(s2.encoding, t.encoding)
+ else
+ assert([s1.encoding, s2.encoding].include?(t.encoding))
+ end
+ end
+
+ def assert_same_result(expected_proc, actual_proc)
+ e = nil
+ begin
+ t = expected_proc.call
+ rescue
+ e = $!
+ end
+ if e
+ assert_raise(e.class) { actual_proc.call }
+ else
+ assert_equal(t, actual_proc.call)
+ end
+ end
+
+ def each_slice_call
+ combination(STRINGS, -2..2) {|s, nth|
+ yield s, nth
+ }
+ combination(STRINGS, -2..2, 0..2) {|s, nth, len|
+ yield s, nth, len
+ }
+ combination(STRINGS, STRINGS) {|s, substr|
+ yield s, substr
+ }
+ combination(STRINGS, -2..2, 0..2) {|s, first, last|
+ yield s, first..last
+ yield s, first...last
+ }
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s2.valid_encoding?
+ next
+ end
+ yield s1, Regexp.new(Regexp.escape(s2))
+ }
+ combination(STRINGS, STRINGS, 0..2) {|s1, s2, nth|
+ if !s2.valid_encoding?
+ next
+ end
+ yield s1, Regexp.new(Regexp.escape(s2)), nth
+ }
+ end
+
+ def str_enc_compatible?(*strs)
+ encs = []
+ strs.each {|s|
+ encs << s.encoding if !s.ascii_only?
+ }
+ encs.uniq!
+ encs.length <= 1
+ end
+
+ # tests start
+
+ def test_str_new
+ STRINGS.each {|s|
+ t = String.new(s)
+ assert_strenc(a(s), s.encoding, t)
+ }
+ end
+
+ def test_str_plus
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if s1.encoding != s2.encoding && !s1.ascii_only? && !s2.ascii_only?
+ assert_raise(ArgumentError) { s1 + s2 }
+ else
+ t = s1 + s2
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert_equal(a(s1) + a(s2), a(t))
+ assert_str_enc_propagation(t, s1, s2)
+ end
+ }
+ end
+
+ def test_str_times
+ STRINGS.each {|s|
+ [0,1,2].each {|n|
+ t = s * n
+ assert(t.valid_encoding?) if s.valid_encoding?
+ assert_strenc(a(s) * n, s.encoding, t)
+ }
+ }
+ end
+
+ def test_sprintf_s
+ STRINGS.each {|s|
+ assert_strenc(a(s), s.encoding, "%s".force_encoding(s.encoding) % s)
+ if !s.empty? # xxx
+ assert_strenc(a(s), s.encoding, a("%s") % s)
+ end
+ }
+ end
+
+ def test_str_eq_reflexive
+ STRINGS.each {|s|
+ assert(s == s, "#{encdump s} == #{encdump s}")
+ }
+ end
+
+ def test_str_eq_symmetric
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if s1 == s2
+ assert(s2 == s1, "#{encdump s2} == #{encdump s1}")
+ else
+ assert(!(s2 == s1), "!(#{encdump s2} == #{encdump s1})")
+ end
+ }
+ end
+
+ def test_str_eq_transitive
+ combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
+ if s1 == s2 && s2 == s3
+ assert(s1 == s3, "transitive: #{encdump s1} == #{encdump s2} == #{encdump s3}")
+ end
+ }
+ end
+
+ def test_str_eq
+ combination(STRINGS, STRINGS) {|s1, s2|
+ desc_eq = "#{encdump s1} == #{encdump s2}"
+ if s1.ascii_only? && s2.ascii_only? && a(s1) == a(s2)
+ assert(s1 == s2, desc_eq)
+ elsif s1.encoding == s2.encoding && a(s1) == a(s2)
+ assert(s1 == s2, desc_eq)
+ assert(!(s1 != s2))
+ assert_equal(0, s1 <=> s2)
+ else
+ assert(!(s1 == s2), "!(#{desc_eq})")
+ assert(s1 != s2)
+ assert_not_equal(0, s1 <=> s2)
+ end
+ }
+ end
+
+ def test_str_concat
+ combination(STRINGS, STRINGS) {|s1, s2|
+ s = s1.dup
+ if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
+ s << s2
+ assert(s.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert_equal(a(s), a(s1) + a(s2))
+ assert_str_enc_propagation(s, s1, s2)
+ else
+ assert_raise(ArgumentError) { s << s2 }
+ end
+ }
+ end
+
+ def test_str_aref
+
+ STRINGS.each {|s|
+ t = ''
+ 0.upto(s.length-1) {|i|
+ u = s[i]
+ assert(u.valid_encoding?) if s.valid_encoding?
+ t << u
+ }
+ assert_equal(t, s)
+ }
+
+ end
+
+ def test_str_aref_len
+
+ STRINGS.each {|s|
+ t = ''
+ 0.upto(s.length-1) {|i|
+ u = s[i,1]
+ assert(u.valid_encoding?) if s.valid_encoding?
+ t << u
+ }
+ assert_equal(t, s)
+ }
+
+ STRINGS.each {|s|
+ t = ''
+ 0.step(s.length-1, 2) {|i|
+ u = s[i,2]
+ assert(u.valid_encoding?) if s.valid_encoding?
+ t << u
+ }
+ assert_equal(t, s)
+ }
+ end
+
+ def test_str_aref_substr
+
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
+ t = s1[s2]
+ if t != nil
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert_equal(s2, t)
+ assert_match(/#{Regexp.escape(a(s2))}/, a(s1))
+ if s1.valid_encoding?
+ assert_match(/#{Regexp.escape(s2)}/, s1)
+ end
+ end
+ else
+ assert_raise(ArgumentError) { s1[s2] }
+ end
+ }
+ end
+
+ def test_str_aref_range2
+ combination(STRINGS, -2..2, -2..2) {|s, first, last|
+ t = s[first..last]
+ if first < 0
+ first += s.length
+ if first < 0
+ assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
+ next
+ end
+ end
+ if s.length < first
+ assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
+ next
+ end
+ assert(t.valid_encoding?) if s.valid_encoding?
+ if last < 0
+ last += s.length
+ end
+ t2 = ''
+ first.upto(last) {|i|
+ c = s[i]
+ t2 << c if c
+ }
+ assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]")
+ }
+ end
+
+ def test_str_aref_range3
+ combination(STRINGS, -2..2, -2..2) {|s, first, last|
+ t = s[first...last]
+ if first < 0
+ first += s.length
+ if first < 0
+ assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
+ next
+ end
+ end
+ if s.length < first
+ assert_nil(t, "#{s.inspect}[#{first}..#{last}]")
+ next
+ end
+ if last < 0
+ last += s.length
+ end
+ assert(t.valid_encoding?) if s.valid_encoding?
+ t2 = ''
+ first.upto(last-1) {|i|
+ c = s[i]
+ t2 << c if c
+ }
+ assert_equal(t2, t, "#{s.inspect}[#{first}..#{last}]")
+ }
+ end
+
+ def test_str_assign
+ combination(STRINGS, STRINGS) {|s1, s2|
+ (-2).upto(2) {|i|
+ t = s1.dup
+ if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
+ if i < -s1.length || s1.length < i
+ assert_raise(IndexError) { t[i] = s2 }
+ else
+ t[i] = s2
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert(a(t).index(a(s2)))
+ if s1.valid_encoding? && s2.valid_encoding?
+ if i == s1.length && s2.empty?
+ assert_nil(t[i])
+ elsif i < 0
+ assert_equal(s2, t[i-s2.length+1,s2.length],
+ "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i-s2.length+1},#{s2.length}]")
+ else
+ assert_equal(s2, t[i,s2.length],
+ "t = #{encdump(s1)}; t[#{i}] = #{encdump(s2)}; t[#{i},#{s2.length}]")
+ end
+ end
+ end
+ else
+ assert_raise(ArgumentError) { t[i] = s2 }
+ end
+ }
+ }
+ end
+
+ def test_str_assign_len
+ combination(STRINGS, -2..2, 0..2, STRINGS) {|s1, i, len, s2|
+ t = s1.dup
+ if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
+ if i < -s1.length || s1.length < i
+ assert_raise(IndexError) { t[i,len] = s2 }
+ else
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ t[i,len] = s2
+ assert(a(t).index(a(s2)))
+ if s1.valid_encoding? && s2.valid_encoding?
+ if i == s1.length && s2.empty?
+ assert_nil(t[i])
+ elsif i < 0
+ if -i < len
+ len = -i
+ end
+ assert_equal(s2, t[i-s2.length+len,s2.length],
+ "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i-s2.length+len},#{s2.length}]")
+ else
+ assert_equal(s2, t[i,s2.length],
+ "t = #{encdump(s1)}; t[#{i},#{len}] = #{encdump(s2)}; t[#{i},#{s2.length}]")
+ end
+ end
+ end
+ else
+ assert_raise(ArgumentError) { t[i,len] = s2 }
+ end
+ }
+ end
+
+ def test_str_assign_substr
+ combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
+ t = s1.dup
+ encs = [
+ !s1.ascii_only? ? s1.encoding : nil,
+ !s2.ascii_only? ? s2.encoding : nil,
+ !s3.ascii_only? ? s3.encoding : nil].uniq.compact
+ if 1 < encs.length
+ assert_raise(ArgumentError, IndexError) { t[s2] = s3 }
+ else
+ if encs.empty?
+ encs = [
+ s1.encoding,
+ s2.encoding,
+ s3.encoding].uniq.reject {|e| e == Encoding.find("ASCII-8BIT") }
+ if encs.empty?
+ encs = [Encoding.find("ASCII-8BIT")]
+ end
+ end
+ if !t[s2]
+ else
+ t[s2] = s3
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding? && s3.valid_encoding?
+ end
+ end
+ }
+ end
+
+ def test_str_assign_range2
+ combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2|
+ t = s1.dup
+ if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
+ if first < -s1.length || s1.length < first
+ assert_raise(RangeError) { t[first..last] = s2 }
+ else
+ t[first..last] = s2
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert(a(t).index(a(s2)))
+ if s1.valid_encoding? && s2.valid_encoding?
+ if first < 0
+ assert_equal(s2, t[s1.length+first, s2.length])
+ else
+ assert_equal(s2, t[first, s2.length])
+ end
+ end
+ end
+ else
+ assert_raise(ArgumentError, RangeError,
+ "t=#{encdump(s1)};t[#{first}..#{last}]=#{encdump(s2)}") {
+ t[first..last] = s2
+ }
+ end
+ }
+ end
+
+ def test_str_assign_range3
+ combination(STRINGS, -2..2, -2..2, STRINGS) {|s1, first, last, s2|
+ t = s1.dup
+ if s1.ascii_only? || s2.ascii_only? || s1.encoding == s2.encoding
+ if first < -s1.length || s1.length < first
+ assert_raise(RangeError) { t[first...last] = s2 }
+ else
+ t[first...last] = s2
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert(a(t).index(a(s2)))
+ if s1.valid_encoding? && s2.valid_encoding?
+ if first < 0
+ assert_equal(s2, t[s1.length+first, s2.length])
+ else
+ assert_equal(s2, t[first, s2.length])
+ end
+ end
+ end
+ else
+ assert_raise(ArgumentError, RangeError,
+ "t=#{encdump(s1)};t[#{first}...#{last}]=#{encdump(s2)}") {
+ t[first...last] = s2
+ }
+ end
+ }
+ end
+
+ def test_str_cmp
+ combination(STRINGS, STRINGS) {|s1, s2|
+ desc = "#{encdump s1} <=> #{encdump s2}"
+ r = s1 <=> s2
+ if s1 == s2
+ assert_equal(0, r, desc)
+ else
+ assert_not_equal(0, r, desc)
+ end
+ }
+ end
+
+ def test_str_capitalize
+ STRINGS.each {|s|
+ begin
+ t1 = s.capitalize
+ rescue ArgumentError
+ assert(!s.valid_encoding?)
+ next
+ end
+ assert(t1.valid_encoding?) if s.valid_encoding?
+ assert(t1.casecmp(s))
+ t2 = s.dup
+ t2.capitalize!
+ assert_equal(t1, t2)
+ assert_equal(s.downcase.sub(/\A[a-z]/) {|ch| a(ch).upcase }, t1)
+ }
+ end
+
+ def test_str_casecmp
+ combination(STRINGS, STRINGS) {|s1, s2|
+ #puts "#{encdump(s1)}.casecmp(#{encdump(s2)})"
+ begin
+ r = s1.casecmp(s2)
+ rescue ArgumentError
+ assert(!s1.valid_encoding? || !s2.valid_encoding?)
+ next
+ end
+ #assert_equal(s1.upcase <=> s2.upcase, r)
+ }
+ end
+
+ def test_str_center
+
+ combination(STRINGS, [0,1,2,3,10]) {|s1, width|
+ t = s1.center(width)
+ assert(a(t).index(a(s1)))
+ }
+ combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2|
+ if s2.empty?
+ assert_raise(ArgumentError) { s1.center(width, s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.center(width, s2) }
+ next
+ end
+ t = s1.center(width, s2)
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert(a(t).index(a(s1)))
+ assert_str_enc_propagation(t, s1, s2) if (t != s1)
+ }
+ end
+
+ def test_str_ljust
+ combination(STRINGS, [0,1,2,3,10]) {|s1, width|
+ t = s1.ljust(width)
+ assert(a(t).index(a(s1)))
+ }
+ combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2|
+ if s2.empty?
+ assert_raise(ArgumentError) { s1.ljust(width, s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.ljust(width, s2) }
+ next
+ end
+ t = s1.ljust(width, s2)
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert(a(t).index(a(s1)))
+ assert_str_enc_propagation(t, s1, s2) if (t != s1)
+ }
+ end
+
+ def test_str_rjust
+ combination(STRINGS, [0,1,2,3,10]) {|s1, width|
+ t = s1.rjust(width)
+ assert(a(t).index(a(s1)))
+ }
+ combination(STRINGS, [0,1,2,3,10], STRINGS) {|s1, width, s2|
+ if s2.empty?
+ assert_raise(ArgumentError) { s1.rjust(width, s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.rjust(width, s2) }
+ next
+ end
+ t = s1.rjust(width, s2)
+ assert(t.valid_encoding?) if s1.valid_encoding? && s2.valid_encoding?
+ assert(a(t).index(a(s1)))
+ assert_str_enc_propagation(t, s1, s2) if (t != s1)
+ }
+ end
+
+ def test_str_chomp
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.chomp(s2) }
+ next
+ end
+ t = s1.chomp(s2)
+ assert(t.valid_encoding?, "#{encdump(s1)}.chomp(#{encdump(s2)})") if s1.valid_encoding? && s2.valid_encoding?
+ assert_equal(s1.encoding, t.encoding)
+ t2 = s1.dup
+ t2.chomp!(s2)
+ assert_equal(t, t2)
+ }
+ end
+
+ def test_str_chop
+ STRINGS.each {|s|
+ s = s.dup
+ desc = "#{encdump s}.chop"
+ if !s.valid_encoding?
+ #assert_raise(ArgumentError, desc) { s.chop }
+ begin
+ s.chop
+ rescue ArgumentError
+ e = $!
+ end
+ next if e
+ end
+ t = nil
+ assert_nothing_raised(desc) { t = s.chop }
+ assert(t.valid_encoding?) if s.valid_encoding?
+ assert(a(s).index(a(t)))
+ t2 = s.dup
+ t2.chop!
+ assert_equal(t, t2)
+ }
+ end
+
+ def test_str_clear
+ STRINGS.each {|s|
+ t = s.dup
+ t.clear
+ assert(t.valid_encoding?)
+ assert(t.empty?)
+ }
+ end
+
+ def test_str_clone
+ STRINGS.each {|s|
+ t = s.clone
+ assert_equal(s, t)
+ assert_equal(s.encoding, t.encoding)
+ assert_equal(a(s), a(t))
+ }
+ end
+
+ def test_str_dup
+ STRINGS.each {|s|
+ t = s.dup
+ assert_equal(s, t)
+ assert_equal(s.encoding, t.encoding)
+ assert_equal(a(s), a(t))
+ }
+ end
+
+ def test_str_count
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_raise(ArgumentError) { s1.count(s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.count(s2) }
+ next
+ end
+ n = s1.count(s2)
+ n0 = a(s1).count(a(s2))
+ assert_operator(n, :<=, n0)
+ }
+ end
+
+ def test_str_crypt
+ combination(STRINGS, STRINGS) {|str, salt|
+ if a(salt).length < 2
+ assert_raise(ArgumentError) { str.crypt(salt) }
+ next
+ end
+ t = str.crypt(salt)
+ assert_equal(a(str).crypt(a(salt)), t)
+ assert_encoding('ASCII-8BIT', t.encoding)
+ }
+ end
+
+ def test_str_delete
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_raise(ArgumentError) { s1.delete(s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.delete(s2) }
+ next
+ end
+ t = s1.delete(s2)
+ assert(t.valid_encoding?)
+ assert_equal(t.encoding, s1.encoding)
+ assert_operator(t.length, :<=, s1.length)
+ t2 = s1.dup
+ t2.delete!(s2)
+ assert_equal(t, t2)
+ }
+ end
+
+ def test_str_downcase
+ STRINGS.each {|s|
+ if !s.valid_encoding?
+ assert_raise(ArgumentError) { s.downcase }
+ next
+ end
+ t = s.downcase
+ assert(t.valid_encoding?)
+ assert_equal(t.encoding, s.encoding)
+ assert(t.casecmp(s))
+ t2 = s.dup
+ t2.downcase!
+ assert_equal(t, t2)
+ }
+ end
+
+ def test_str_dump
+ STRINGS.each {|s|
+ t = s.dump
+ assert(t.valid_encoding?)
+ assert(t.ascii_only?)
+ u = eval(t)
+ assert_equal(a(s), a(u))
+ }
+ end
+
+ def test_str_each_line
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_raise(ArgumentError) { s1.each_line(s2) {} }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.each_line(s2) {} }
+ next
+ end
+ lines = []
+ s1.each_line(s2) {|line|
+ assert(line.valid_encoding?)
+ assert_equal(s1.encoding, line.encoding)
+ lines << line
+ }
+ next if lines.size == 0
+ s2 = lines.join('')
+ assert_equal(s1.encoding, s2.encoding)
+ assert_equal(s1, s2)
+ }
+ end
+
+ def test_str_each_byte
+ STRINGS.each {|s|
+ bytes = []
+ s.each_byte {|b|
+ bytes << b
+ }
+ a(s).split(//).each_with_index {|ch, i|
+ assert_equal(ch.ord, bytes[i])
+ }
+ }
+ end
+
+ def test_str_empty?
+ STRINGS.each {|s|
+ if s.length == 0
+ assert(s.empty?)
+ else
+ assert(!s.empty?)
+ end
+ }
+ end
+
+ def test_str_hex
+ STRINGS.each {|s|
+ t = s.hex
+ t2 = a(s)[/\A[0-9a-fA-Fx]*/].hex
+ assert_equal(t2, t)
+ }
+ end
+
+ def test_str_include?
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.include?(s2) }
+ assert_raise(ArgumentError) { s1.index(s2) }
+ assert_raise(ArgumentError) { s1.rindex(s2) }
+ next
+ end
+ t = s1.include?(s2)
+ if t
+ assert(a(s1).include?(a(s2)))
+ assert(s1.index(s2))
+ assert(s1.rindex(s2))
+ else
+ assert(!s1.index(s2))
+ assert(!s1.rindex(s2), "!#{encdump(s1)}.rindex(#{encdump(s2)})")
+ end
+ if s2.empty?
+ assert_equal(true, t)
+ next
+ end
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_equal(false, t, "#{encdump s1}.include?(#{encdump s2})")
+ next
+ end
+ if t && s1.valid_encoding? && s2.valid_encoding?
+ assert_match(/#{Regexp.escape(s2)}/, s1)
+ else
+ assert_no_match(/#{Regexp.escape(s2)}/, s1)
+ end
+ }
+ end
+
+ def test_str_index
+ combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos|
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.index(s2) }
+ next
+ end
+ t = s1.index(s2, pos)
+ if s2.empty?
+ if pos < 0 && pos+s1.length < 0
+ assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
+ elsif pos < 0
+ assert_equal(s1.length+pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
+ elsif s1.length < pos
+ assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
+ else
+ assert_equal(pos, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
+ end
+ next
+ end
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_equal(nil, t, "#{encdump s1}.index(#{encdump s2}, #{pos})");
+ next
+ end
+ if t
+ re = /#{Regexp.escape(s2)}/
+ assert(re.match(s1, pos))
+ assert_equal($`.length, t, "#{encdump s1}.index(#{encdump s2}, #{pos})")
+ else
+ assert_no_match(/#{Regexp.escape(s2)}/, s1[pos..-1])
+ end
+ }
+ end
+
+ def test_str_rindex
+ combination(STRINGS, STRINGS, -2..2) {|s1, s2, pos|
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.rindex(s2) }
+ next
+ end
+ t = s1.rindex(s2, pos)
+ if s2.empty?
+ if pos < 0 && pos+s1.length < 0
+ assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
+ elsif pos < 0
+ assert_equal(s1.length+pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
+ elsif s1.length < pos
+ assert_equal(s1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
+ else
+ assert_equal(pos, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
+ end
+ next
+ end
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_equal(nil, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
+ next
+ end
+ if t
+ #puts "#{encdump s1}.rindex(#{encdump s2}, #{pos}) => #{t}"
+ assert(a(s1).index(a(s2)))
+ pos2 = pos
+ pos2 += s1.length if pos < 0
+ re = /\A(.{0,#{pos2}})#{Regexp.escape(s2)}/m
+ assert(re.match(s1), "#{re.inspect}.match(#{encdump(s1)})")
+ assert_equal($1.length, t, "#{encdump s1}.rindex(#{encdump s2}, #{pos})")
+ else
+ re = /#{Regexp.escape(s2)}/
+ n = re =~ s1
+ if n
+ if pos < 0
+ assert_operator(n, :>, s1.length+pos)
+ else
+ assert_operator(n, :>, pos)
+ end
+ end
+ end
+ }
+ end
+
+ def test_str_insert
+ combination(STRINGS, 0..2, STRINGS) {|s1, nth, s2|
+ t1 = s1.dup
+ t2 = s1.dup
+ begin
+ t1[nth, 0] = s2
+ rescue ArgumentError, IndexError => e1
+ end
+ begin
+ t2.insert(nth, s2)
+ rescue ArgumentError, IndexError => e2
+ end
+ assert_equal(t1, t2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t")
+ assert_equal(e1.class, e2.class, "begin #{encdump s1}.insert(#{nth},#{encdump s2}); rescue ArgumentError, IndexError => e; e end")
+ }
+ combination(STRINGS, -2..-1, STRINGS) {|s1, nth, s2|
+ next if s1.length + nth < 0
+ next unless s1.valid_encoding?
+ next unless s2.valid_encoding?
+ t1 = s1.dup
+ begin
+ t1.insert(nth, s2)
+ slen = s2.length
+ assert_equal(t1[nth-slen+1,slen], s2, "t=#{encdump s1}; t.insert(#{nth},#{encdump s2}); t")
+ rescue ArgumentError, IndexError => e
+ end
+ }
+ end
+
+ def test_str_intern
+ STRINGS.each {|s|
+ if /\0/ =~ a(s)
+ assert_raise(ArgumentError) { s.intern }
+ else
+ sym = s.intern
+ assert_equal(s, sym.to_s)
+ end
+ }
+ end
+
+ def test_str_length
+ STRINGS.each {|s|
+ assert_operator(s.length, :<=, s.bytesize)
+ }
+ end
+
+ def test_str_oct
+ STRINGS.each {|s|
+ t = s.oct
+ t2 = a(s)[/\A[0-9a-fA-FxXbB]*/].oct
+ assert_equal(t2, t)
+ }
+ end
+
+ def test_str_replace
+ combination(STRINGS, STRINGS) {|s1, s2|
+ t = s1.dup
+ t.replace s2
+ assert_equal(s2, t)
+ assert_equal(s2.encoding, t.encoding)
+ }
+ end
+
+ def test_str_reverse
+ STRINGS.each {|s|
+ t = s.reverse
+ assert_equal(s.bytesize, t.bytesize)
+ if !s.valid_encoding?
+ assert_operator(t.length, :<=, s.length)
+ next
+ end
+ assert_equal(s, t.reverse)
+ }
+ end
+
+ def test_str_scan
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s2.valid_encoding?
+ assert_raise(RegexpError) { s1.scan(s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.scan(s2) }
+ next
+ end
+ if !s1.valid_encoding?
+ assert_raise(ArgumentError) { s1.scan(s2) }
+ next
+ end
+ r = s1.scan(s2)
+ r.each {|t|
+ assert_equal(s2, t)
+ }
+ }
+ end
+
+ def test_str_slice
+ each_slice_call {|obj, *args|
+ assert_same_result(lambda { obj[*args] }, lambda { obj.slice(*args) })
+ }
+ end
+
+ def test_str_slice!
+ each_slice_call {|s, *args|
+ t = s.dup
+ begin
+ r = t.slice!(*args)
+ rescue
+ e = $!
+ end
+ if e
+ assert_raise(e.class) { s.slice(*args) }
+ next
+ end
+ if !r
+ assert_nil(s.slice(*args))
+ next
+ end
+ assert_equal(s.slice(*args), r)
+ assert_equal(s.bytesize, r.bytesize + t.bytesize)
+ if args.length == 1 && String === args[0]
+ assert_equal(args[0].encoding, r.encoding,
+ "#{encdump s}.slice!#{encdumpargs args}.encoding")
+ else
+ assert_equal(s.encoding, r.encoding,
+ "#{encdump s}.slice!#{encdumpargs args}.encoding")
+ end
+ if [s, *args].all? {|o| !(String === o) || o.valid_encoding? }
+ assert(r.valid_encoding?)
+ assert(t.valid_encoding?)
+ assert_equal(s.length, r.length + t.length)
+ end
+ }
+ end
+
+ def test_str_split
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s2.valid_encoding?
+ assert_raise(RegexpError) { s1.split(s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.split(s2) }
+ next
+ end
+ if !s1.valid_encoding?
+ assert_raise(ArgumentError) { s1.split(s2) }
+ next
+ end
+ t = s1.split(s2)
+ t.each {|r|
+ assert(a(s1).include?(a(r)))
+ assert_equal(s1.encoding, r.encoding)
+ }
+ assert(a(s1).include?(t.map {|u| a(u) }.join(a(s2))))
+ if s1.valid_encoding? && s2.valid_encoding?
+ t.each {|r|
+ assert(r.valid_encoding?)
+ }
+ end
+ }
+ end
+
+ def test_str_squeeze
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if !s1.valid_encoding? || !s2.valid_encoding?
+ assert_raise(ArgumentError, "#{encdump s1}.squeeze(#{encdump s2})") { s1.squeeze(s2) }
+ next
+ end
+ if !s1.ascii_only? && !s2.ascii_only? && s1.encoding != s2.encoding
+ assert_raise(ArgumentError) { s1.squeeze(s2) }
+ next
+ end
+ t = s1.squeeze(s2)
+ assert_operator(t.length, :<=, s1.length)
+ t2 = s1.dup
+ t2.squeeze!(s2)
+ assert_equal(t, t2)
+ }
+ end
+
+ def test_str_strip
+ STRINGS.each {|s|
+ if !s.valid_encoding?
+ assert_raise(ArgumentError, "#{encdump s}.strip") { s.strip }
+ next
+ end
+ t = s.strip
+ l = s.lstrip
+ r = s.rstrip
+ assert_operator(l.length, :<=, s.length)
+ assert_operator(r.length, :<=, s.length)
+ assert_operator(t.length, :<=, l.length)
+ assert_operator(t.length, :<=, r.length)
+ t2 = s.dup
+ t2.strip!
+ assert_equal(t, t2)
+ l2 = s.dup
+ l2.lstrip!
+ assert_equal(l, l2)
+ r2 = s.dup
+ r2.rstrip!
+ assert_equal(r, r2)
+ }
+ end
+
+ def test_str_sum
+ STRINGS.each {|s|
+ assert_equal(a(s).sum, s.sum)
+ }
+ end
+
+ def test_str_swapcase
+ STRINGS.each {|s|
+ if !s.valid_encoding?
+ assert_raise(ArgumentError, "#{encdump s}.swapcase") { s.swapcase }
+ next
+ end
+ t1 = s.swapcase
+ assert(t1.valid_encoding?) if s.valid_encoding?
+ assert(t1.casecmp(s))
+ t2 = s.dup
+ t2.swapcase!
+ assert_equal(t1, t2)
+ t3 = t1.swapcase
+ assert_equal(s, t3);
+ }
+ end
+
+
+ def test_str_to_f
+ STRINGS.each {|s|
+ assert_nothing_raised { s.to_f }
+ }
+ end
+
+ def test_str_to_i
+ STRINGS.each {|s|
+ assert_nothing_raised { s.to_i }
+ 2.upto(36) {|radix|
+ assert_nothing_raised { s.to_i(radix) }
+ }
+ }
+ end
+
+ def test_str_to_s
+ STRINGS.each {|s|
+ assert_same(s, s.to_s)
+ assert_same(s, s.to_str)
+ }
+ end
+
+ def test_tr
+ combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
+ desc = "#{encdump s1}.tr(#{encdump s2}, #{encdump s3})"
+ if s1.empty?
+ assert_equal(s1, s1.tr(s2, s3), desc)
+ next
+ end
+ if !str_enc_compatible?(s1, s2, s3)
+ assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
+ next
+ end
+ if !s1.valid_encoding?
+ assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
+ next
+ end
+ if s2.empty?
+ assert_equal(s1, s1.tr(s2, s3), desc)
+ next
+ end
+ if !s2.valid_encoding? || !s3.valid_encoding?
+ assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
+ next
+ end
+ t = s1.tr(s2, s3)
+ assert_operator(s1.length, :>=, t.length, desc)
+ }
+ end
+
+ def test_tr_s
+ combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
+ desc = "#{encdump s1}.tr_s(#{encdump s2}, #{encdump s3})"
+ if s1.empty?
+ assert_equal(s1, s1.tr_s(s2, s3), desc)
+ next
+ end
+ if !s1.valid_encoding?
+ assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) }
+ next
+ end
+ if !str_enc_compatible?(s1, s2, s3)
+ assert_raise(ArgumentError, desc) { s1.tr(s2, s3) }
+ next
+ end
+ if s2.empty?
+ assert_equal(s1, s1.tr_s(s2, s3), desc)
+ next
+ end
+ if !s2.valid_encoding? || !s3.valid_encoding?
+ assert_raise(ArgumentError, desc) { s1.tr_s(s2, s3) }
+ next
+ end
+
+ t = nil
+ assert_nothing_raised(desc) { t = s1.tr_s(s1, s3) }
+ assert_operator(s1.length, :>=, t.length, desc)
+ }
+ end
+
+ def test_str_upcase
+ STRINGS.each {|s|
+ desc = "#{encdump s}.upcase"
+ if !s.valid_encoding?
+ assert_raise(ArgumentError, desc) { s.upcase }
+ next
+ end
+ t1 = s.upcase
+ assert(t1.valid_encoding?)
+ assert(t1.casecmp(s))
+ t2 = s.dup
+ t2.upcase!
+ assert_equal(t1, t2)
+ }
+ end
+
+ def test_str_succ
+ starts = [
+ e("\xA1\xA1"),
+ e("\xFE\xFE")
+ ]
+ STRINGS.each {|s0|
+ next if s0.empty?
+ s = s0.dup
+ n = 1000
+ h = {}
+ n.times {|i|
+ if h[s]
+ assert(false, "#{encdump s} cycle with succ! #{i-h[s]} times")
+ end
+ h[s] = i
+ assert_operator(s.length, :<=, s0.length + Math.log2(i+1) + 1, "#{encdump s0} succ! #{i} times => #{encdump s}")
+ s.succ!
+ }
+ }
+ end
+
+ def test_str_hash
+ combination(STRINGS, STRINGS) {|s1, s2|
+ if s1.eql?(s2)
+ assert_equal(s1.hash, s2.hash, "#{encdump s1}.hash == #{encdump s2}.dump")
+ end
+ }
+ end
+
+ def test_marshal
+ STRINGS.each {|s|
+ m = Marshal.dump(s)
+ t = Marshal.load(m)
+ assert_equal(s, t)
+ }
+ end
+
+ def test_str_sub
+ combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
+ if !s2.valid_encoding?
+ assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) }
+ next
+ end
+ r2 = Regexp.new(Regexp.escape(s2))
+ [
+ [
+ "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { s1.sub(r2, s3) }
+ ],
+ [
+ "#{encdump s1}.sub(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { s1.sub(r2) { s3 } }
+ ],
+ [
+ "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { s1.gsub(r2, s3) }
+ ],
+ [
+ "#{encdump s1}.gsub(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { s1.gsub(r2) { s3 } }
+ ]
+ ].each {|desc, doit|
+ if !s1.valid_encoding?
+ assert_raise(ArgumentError, desc) { doit.call }
+ next
+ end
+ if !str_enc_compatible?(s1, s2)
+ assert_raise(ArgumentError, desc) { doit.call }
+ next
+ end
+ if !s1.include?(s2)
+ assert_equal(s1, doit.call)
+ next
+ end
+ if !str_enc_compatible?(s1, s3)
+ assert_raise(ArgumentError, desc) { doit.call }
+ next
+ end
+ t = nil
+ assert_nothing_raised(desc) {
+ t = doit.call
+ }
+ if s2 == s3
+ assert_equal(s1, t, desc)
+ else
+ assert_not_equal(s1, t, desc)
+ end
+ }
+ }
+ end
+
+ def test_str_sub!
+ combination(STRINGS, STRINGS, STRINGS) {|s1, s2, s3|
+ if !s2.valid_encoding?
+ assert_raise(RegexpError) { Regexp.new(Regexp.escape(s2)) }
+ next
+ end
+ r2 = Regexp.new(Regexp.escape(s2))
+ [
+ [
+ "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { t=s1.dup; [t, t.sub!(r2, s3)] }
+ ],
+ [
+ "t=#{encdump s1}.dup;t.sub!(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { t=s1.dup; [t, t.sub!(r2) { s3 }] }
+ ],
+ [
+ "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { t=s1.dup; [t, t.gsub!(r2, s3)] }
+ ],
+ [
+ "t=#{encdump s1}.dup;t.gsub!(Regexp.new(#{encdump s2}), #{encdump s3})",
+ lambda { t=s1.dup; [t, t.gsub!(r2) { s3 }] }
+ ]
+ ].each {|desc, doit|
+ if !s1.valid_encoding?
+ assert_raise(ArgumentError, desc) { doit.call }
+ next
+ end
+ if !str_enc_compatible?(s1, s2)
+ assert_raise(ArgumentError, desc) { doit.call }
+ next
+ end
+ if !s1.include?(s2)
+ assert_equal([s1, nil], doit.call)
+ next
+ end
+ if !str_enc_compatible?(s1, s3)
+ assert_raise(ArgumentError, desc) { doit.call }
+ next
+ end
+ t = ret = nil
+ assert_nothing_raised(desc) {
+ t, ret = doit.call
+ }
+ assert(ret)
+ if s2 == s3
+ assert_equal(s1, t, desc)
+ else
+ assert_not_equal(s1, t, desc)
+ end
+ }
+ }
+ end
+
+end