2d69d2f3f28d11a0ca5721107b03316e65b3b8fb
[chise/ruby.git] / test / test-rbchise.rb
1 #!/usr/bin/env ruby
2 # Copyright (C) 2002-2004 Kouichirou Eto, All rights reserved.
3
4 require "common"
5
6 class TestRbChise < Test::Unit::TestCase
7   include CHISE::ChiseValue
8
9   def test_rbchise
10     @ds = CHISE::DataSource.new
11     assert_instance_of(CHISE::DataSource, @ds)
12     assert_match(/chise-db\Z/, @ds.location.to_s)
13
14     @ct = @ds.get_ccs("=daikanwa")
15     assert_instance_of(CHISE::CCSTable, @ct)
16     char_id = @ct.decode(364) # get a character by Daikanwa number 364.
17     assert_equal(20175, char_id)
18     str = format_char_id(20175)
19     assert_equal("?\344\273\217", str)
20
21     char_id = @ds.decode_char("=daikanwa", 364)
22     assert_equal(20175, char_id)
23
24     @ft = @ds.get_feature("ideographic-structure")
25     assert_instance_of(CHISE::FeatureTable, @ft)
26     value = @ft.get_value(char_id)
27     assert_instance_of(String, value)
28     assert_equal("(?\342\277\260 ?\344\272\273 ?\345\216\266)", value)
29
30     value = @ds.load_feature("ideographic-structure", char_id)
31     assert_equal("(?\342\277\260 ?\344\272\273 ?\345\216\266)", value)
32
33     @ds.each_feature {|f|
34       #qp f
35       assert_instance_of(String, f)
36     }
37
38     @ft.each {|k, v|
39       #qp k, v
40       assert_kind_of(Integer, k)
41       assert_instance_of(String, v)
42     }
43
44     ft = @ds.get_feature("numeric-value")
45     ft.each {|k, v|
46       #qp k, v
47       assert_kind_of(Integer, k)
48       assert_instance_of(String, v)
49     }
50   end
51
52   def test_each_ccs
53     @ds = CHISE::DataSource.new
54     @ds.each_ccs {|ccs|
55       #qp ccs
56       assert_instance_of(String, ccs)
57       ct = @ds.get_ccs(ccs)
58       assert_instance_of(CHISE::CCSTable, ct)
59     }
60
61     ct = @ds.get_ccs("=ascii")
62     ct.each {|k, v|
63       #qp k, v
64       assert_kind_of(Integer, k)
65       assert_kind_of(Integer, v)
66     }
67     ct.close
68   end
69
70   def test_error
71     @ds = CHISE::DataSource.new
72     @ft = @ds.get_feature("nosuchfeature")
73     v = @ft.get_value(20175)
74     assert_equal(nil, v)
75   end
76
77   def test_chisedb
78     @cd = CHISE::ChiseDB.instance
79
80     char_id = @cd.decode_char("=daikanwa", 364)
81     assert_equal(20175, char_id)
82
83     value = @cd.load_feature("ideographic-structure", char_id)
84     assert_equal("(?\342\277\260 ?\344\272\273 ?\345\216\266)", value)
85
86     value = @cd.load_feature("=ucs", char_id)
87     assert_equal(20175, value)
88
89     @cd.each_feature {|f|
90       assert_instance_of(String, f)
91     }
92
93     ft = @cd.get_feature("numeric-value")
94     ft.each {|k, v|
95       assert_kind_of(Integer, k)
96       assert_instance_of(String, v)
97     }
98   end
99
100   def test_ascii
101     @cd = CHISE::ChiseDB.instance
102     ct = @cd.get_ccs("ascii")
103     char_id = ct.decode(65)
104     assert_equal(65, char_id)
105     assert_equal("A", CHISE::Character.get(char_id).to_s)
106 #    assert_equal("A", char.to_s)
107   end
108
109
110   def test_parse_c_string
111     u8 = "字"
112     assert_equal(23383, u8.u8to_i)
113     assert_equal(23383, parse_c_string("?"+u8))
114     assert_equal(0,     parse_c_string("?\\^@"))
115     assert_equal(9,     parse_c_string("?\t"))
116     assert_equal(10,    parse_c_string("?\n"))
117     assert_equal(13,    parse_c_string("?\r"))
118     assert_equal(94,    parse_c_string("?^\\"))
119     assert_equal(31,    parse_c_string("?\\^_"))
120     assert_equal(32,    parse_c_string("?\\ "))
121     assert_equal(34,    parse_c_string("?\\\""))
122     assert_equal(126,   parse_c_string("?~"))
123     assert_equal(127,   parse_c_string("?\\^?\000"))
124     assert_equal(131,   parse_c_string("?\\^\303\237"))
125     assert_equal(0x7FF, parse_c_string("?\337\277"))
126     assert_equal(0xFFFF,        parse_c_string("?\357\277\277"))
127     assert_equal(0x1FFFFF,      parse_c_string("?\367\277\277\277"))
128     assert_equal(0x3FFFFFF,     parse_c_string("?\373\277\277\277\277"))
129     assert_equal(0xFFFFFFF,     parse_c_string("?\374\217\277\277\277\277"))
130     assert_raise(RuntimeError) { parse_c_string("nosuch") }
131   end
132
133   def test_format_char_id
134     u8 = "字"
135     assert_equal(u8, CHISE.i_tou8(23383))
136     assert_equal("?\345\255\227",       format_char_id(23383))
137     assert_equal("?"+u8,                format_char_id(23383))
138     assert_equal("?\\^@",       format_char_id(0))
139     assert_equal("?\t",         format_char_id(?\t))
140     assert_equal("?\n",         format_char_id(?\n))
141     assert_equal("?\r",         format_char_id(?\r))
142     assert_equal("?^\\",        format_char_id(0x1C))
143     assert_equal("?\\^_",       format_char_id(0x1F))
144     assert_equal("?\\ ",        format_char_id(?\s))
145     assert_equal("?\\\"",       format_char_id(?\"))
146     assert_equal("?~",          format_char_id(0x7E))
147     assert_equal("?\\^?\000",   format_char_id(0x7F))
148     assert_equal("?\\^\303\237",        format_char_id(0x9F))
149     assert_equal("?\337\277",   format_char_id(0x7FF))
150     assert_equal("?\357\277\277",       format_char_id(0xFFFF))
151     assert_equal("?\367\277\277\277",   format_char_id(0x1FFFFF))
152     assert_equal("?\373\277\277\277\277",       format_char_id(0x3FFFFFF))
153     assert_equal("?\374\217\277\277\277\277",   format_char_id(0xFFFFFFF))
154   end
155 end