summaryrefslogtreecommitdiff
path: root/test/ruby/enc/test_cesu8.rb
blob: d9debe76cdb9caf85aacedb394a16951a6c76d44 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
# frozen_string_literal: false
require 'test/unit'

class TestCESU8 < Test::Unit::TestCase

  def encdump(obj)
    case obj
    when String
      obj.dump
    when Regexp
      "Regexp.new(#{encdump(obj.source)}, #{obj.options})"
    else
      raise Argument, "unexpected: #{obj.inspect}"
    end
  end

  def enccall(recv, meth, *args)
    desc = ''
    if String === recv
      desc << encdump(recv)
    else
      desc << recv.inspect
    end
    desc << '.' << meth.to_s
    if !args.empty?
      desc << '('
      args.each_with_index {|a, i|
        desc << ',' if 0 < i
        if String === a
          desc << encdump(a)
        else
          desc << a.inspect
        end
      }
      desc << ')'
    end
    result = nil
    assert_nothing_raised(desc) {
      result = recv.send(meth, *args)
    }
    result
  end

  def assert_str_equal(expected, actual, message=nil)
    full_message = build_message(message, <<EOT)
#{encdump expected} expected but not equal to
#{encdump actual}.
EOT
    assert_equal(expected, actual, full_message)
  end

  # tests start

  def test_cesu8_valid_encoding
    all_assertions do |a|
      [
        "\x00",
        "\x7f",
        "\u0080",
        "\u07ff",
        "\u0800",
        "\ud7ff",
        "\xed\xa0\x80\xed\xb0\x80",
        "\xed\xaf\xbf\xed\xbf\xbf",
        "\ue000",
        "\uffff",
      ].each {|s|
        s.force_encoding("cesu-8")
        a.for(s) {
          assert_predicate(s, :valid_encoding?, "#{encdump s}.valid_encoding?")
        }
      }
      [
        "\x80",
        "\xc0\x80",
        "\xc0",
        "\xe0\x80\x80",
        "\xed\xa0\x80",
        "\xed\xb0\x80\xed\xb0\x80",
        "\xe0",
        "\xff",
      ].each {|s|
        s.force_encoding("cesu-8")
        a.for(s) {
          assert_not_predicate(s, :valid_encoding?, "#{encdump s}.valid_encoding?")
        }
      }
    end
  end

  def test_cesu8_ord
    [
      ["\x00", 0],
      ["\x7f", 0x7f],
      ["\u0080", 0x80],
      ["\u07ff", 0x7ff],
      ["\u0800", 0x800],
      ["\ud7ff", 0xd7ff],
      ["\xed\xa0\x80\xed\xb0\x80", 0x10000],
      ["\xed\xaf\xbf\xed\xbf\xbf", 0x10ffff],
      ["\xee\x80\x80", 0xe000],
      ["\xef\xbf\xbf", 0xffff],
    ].each do |chr, ord|
      chr.force_encoding("cesu-8")
      assert_equal ord, chr.ord
      assert_equal chr, ord.chr("cesu-8")
    end
  end
end