X-Git-Url: http://git.chise.org/gitweb/?a=blobdiff_plain;f=src%2Fchise.rb;h=f14b59fffb17c9a41968539b924f26d9ca9be978;hb=66837463b5d1d847c8f8043c1e08615aa7bbd8e3;hp=cb547a5497286bc8381d7f16c516109f269a2458;hpb=545951c3f879a03a861ddb6ebaa643c0f1a05b19;p=chise%2Fruby.git

diff --git a/src/chise.rb b/src/chise.rb
index cb547a5..f14b59f 100755
--- a/src/chise.rb
+++ b/src/chise.rb
@@ -1,13 +1,17 @@
-#!c:/ruby/bin/ruby.exe
-# Ruby/UTF-2000 module by eto 2002-1114
+#!/usr/bin/env ruby
+# Ruby/CHISE module by eto 2002-1114
 
 require 'bdb'
 require 'uconv'
 require 'singleton'
+require 'rbchise'
+require 'db'
+require 'ids'
 
 $KCODE = 'u' #ä»ã®ã¨ããããä»¥å¤ã§ã¯åããªããString.splitãå½±é¿å¤§ãinspectãå½±é¿ã
+$debug = false #ããã¯ãã¹ãç¨
 $debug = true #ããã¯ãã¹ãç¨
-#$stdout.binmode if $debug
+$stdout.binmode if $debug
 $stdout.sync = true if $debug
 
 class String #======================================================================
@@ -18,8 +22,8 @@ class String #==================================================================
   def char_at(n) to_a()[n] end
   def char() Character.get(to_a[0]) end
   #alias to_c char #æ©ã¿ä¸­
-  def char_id() char.char_id() end
-  def get_char_attribute(a) char.get_char_attribute(a) end
+  #def char_id() char.char_id() end #ãªãã¨ãªãå»æ­¢
+  #def get_char_attribute(a) char.get_char_attribute(a) end #ãªãã¨ãªãå»æ­¢
   #def ucs() char.ucs() end
   def to_utf8()
     return to_a.map {|ch|
@@ -27,6 +31,23 @@ class String #==================================================================
     }.join('')
   end
 
+  def map_char(block = Proc.new)
+    return unless block_given?
+    return self.to_a.map {|ch| (block.call(ch)).to_s }.join("")
+  end
+  def map_char!(block = Proc.new)
+    return unless block_given?
+    self.replace(self.map_char {|ch| block.call(ch)})
+  end
+  def map_character(block = Proc.new)
+    return unless block_given?
+    return self.to_a.map {|ch| (block.call(ch.char)).to_s }.join("")
+  end
+  def map_character!(block = Proc.new)
+    return unless block_given?
+    self.replace(self.map_char {|ch| block.call(ch.char)})
+  end
+
   def method_missing(mid, *args)
     if char_length == 1 #çç¥å½¢ãæå¹ãªã®ã¯ãä¸æå­ã®æã ã
       char.method_missing(mid, *args)
@@ -50,17 +71,14 @@ class String #==================================================================
   end
   def de_er() return self.dup.de_er!; end
 
-  def map_char(block = Proc.new)
-    return unless block_given?
-    return self.to_a.map {|ch| (block.call(ch)).to_s }.join("")
-  end
-  def map_char!(block = Proc.new)
-    return unless block_given?
-    self.replace(self.map_char {|ch| block.call(ch)})
-  end
   def inspect_all() map_char {|ch| ch.char.inspect_all } end
   def inspect_x()   map_char {|ch| ch.char.inspect_x   } end
 
+  def to_euc()   map_char {|ch| ch.char.to_euc   } end
+  def map_euc()  map_char {|ch| ch.char.map_euc  } end
+  def to_sjis()  map_char {|ch| ch.char.to_sjis  } end
+  def map_sjis() map_char {|ch| ch.char.map_sjis } end
+
   def decompose() map_char {|ch| ch.char.decompose } end
   def decompose!() self.replace(self.decompose); self; end
   def decompose_all_nu(level=nil)
@@ -92,12 +110,12 @@ class String #==================================================================
     }
     str = ""
     h.each {|k, v|
-#      p [k, v]
+      #      p [k, v]
       if length == v #å¨é¨ã«é¡ãåºãã¦ããã
 	str += k
       end
     }
-#    p str
+    #    p str
     str
   end
   def compose()
@@ -113,15 +131,15 @@ class String #==================================================================
     return "" #attributeãæã¤ãã®ãä¸ã¤ãç¡ãã£ããã""ã«ãã
   end
   def aggregate()
-#selfã§ããæå­åãIDSã ã¨ä»®å®ãããããå®å¨ã«composeããããªãã§ã
-#ãã®é¨åéåã ããã¨ãã ãã¦ãcomposeå¯è½ã§ããã°ã§ããã ãcomposeããã
+    #selfã§ããæå­åãIDSã ã¨ä»®å®ãããããå®å¨ã«composeããããªãã§ã
+    #ãã®é¨åéåã ããã¨ãã ãã¦ãcomposeå¯è½ã§ããã°ã§ããã ãcomposeããã
     tree = IDS_Tree.new(self)
     return self if tree.depth <= 1 #sub_nodesãç¡ãå ´åã¯ããã§ãããªã
     tree.sub_nodes.each {|node|
       c = node.compose
       next if c.nil? || c == ""
-#      print "#{self}	#{node}	#{c}\n"
-#      p [self, node, c]
+      #      print "#{self}	#{node}	#{c}\n"
+      #      p [self, node, c]
       n = self.gsub(node, c)
       return n.aggregate
     }
@@ -136,34 +154,60 @@ module CHISE #==================================================================
   module_function :windows?
   if windows?()
     DB_DIR = 'd:/work/chise/char-db' #ãã®å¾ã«/sysmtem-char-id/ucsã¨ããæãã«ç¶ã
+    IDS_DB_DIR = 'd:/work/chise/ids/' #ãã®å¾ã«IDS-JIS-X0208-1990.txtã¨ããæãã«ç¶ã
   else
-    DB_DIR = '/usr/local/lib/xemacs-21.4.10/i686-pc-linux/char-db' #ãã®å¾ã«/sysmtem-char-id/ucsã¨ããæãã«ç¶ã
+    DB_DIR = '/usr/local/lib/xemacs-21.4.12/i686-pc-linux/char-db' #ãã®å¾ã«/sysmtem-char-id/ucsã¨ããæãã«ç¶ã
+    IDS_DB_DIR = '/home/eto/work/chise/ids/' #ãã®å¾ã«IDS-JIS-X0208-1990.txtã¨ããæãã«ç¶ã
   end
 
   class EntityReference #======================================================================
     #ç¶æ³ã«ãã£ã¦ã©ã®ERã«å¤æããããç°ãªãå¯è½æ§ãããã®ã§ãæ®éã®classã¨ãã¦å®è£ããã»ãããã?
+#    CODESYS_TABLE = [
+#      %w( chinese-big5-cdp	CDP- 4 X),
+#      %w( ideograph-daikanwa	M-   5 d),
+#      %w( ideograph-cbeta	CB   5 d),
+#      %w( ideograph-gt		GT-  5 d),
+#      %w( ideograph-gt-k	GT-K 5 d),
+#      %w( japanese-jisx0208-1990 J90- 4 X),
+#      %w( japanese-jisx0208	J83- 4 X),
+#      %w( japanese-jisx0213-1	JX1- 4 X),
+#      %w( japanese-jisx0213-2	JX2- 4 X),
+#      %w( japanese-jisx0212	JSP- 4 X),
+#      %w( japanese-jisx0208-1978 J78- 4 X),
+#      %w( chinese-cns11643-1	C1-  4 X),
+#      %w( chinese-cns11643-2	C2-  4 X),
+#      %w( chinese-cns11643-3	C3-  4 X),
+#      %w( chinese-cns11643-4	C4-  4 X),
+#      %w( chinese-cns11643-5	C5-  4 X),
+#      %w( chinese-cns11643-6	C6-  4 X),
+#      %w( chinese-cns11643-7	C7-  4 X),
+#      %w( korean-ksc5601	K0- 4 X),
+#    ]
+#    CODESYS_ORDER = %w(japanese chinese korean ideograph)
     CODESYS_TABLE = [
-      %w( chinese-big5-cdp	CDP- 4 X),
-      %w( ideograph-daikanwa	M-   5 d),
-      %w( ideograph-cbeta	CB   5 d),
-      %w( ideograph-gt		GT-  5 d),
-      %w( ideograph-gt-k	GT-K 5 d),
-      %w( japanese-jisx0208-1990 J90- 4 X),
-      %w( japanese-jisx0208	J83- 4 X),
-      %w( japanese-jisx0213-1	JX1- 4 X),
-      %w( japanese-jisx0213-2	JX2- 4 X),
-      %w( japanese-jisx0212	JSP- 4 X),
-      %w( japanese-jisx0208-1978 J78- 4 X),
-      %w( chinese-cns11643-1	C1-  4 X),
-      %w( chinese-cns11643-2	C2-  4 X),
-      %w( chinese-cns11643-3	C3-  4 X),
-      %w( chinese-cns11643-4	C4-  4 X),
-      %w( chinese-cns11643-5	C5-  4 X),
-      %w( chinese-cns11643-6	C6-  4 X),
-      %w( chinese-cns11643-7	C7-  4 X),
-      %w( korean-ksc5601	K0- 4 X),
+      %w( =jis-x0208-1990	J90- 4 X),
+      %w( =jis-x0208-1983	J83- 4 X),
+      %w( =jis-x0208-1978	J78- 4 X),
+      %w( =jis-x0208		J90- 4 X), #ç¶æ¿ã®ã¢ãããã¯ãªå®è£
+      %w( =jis-x0208		J83- 4 X), #ç¶æ¿ã®ã¢ãããã¯ãªå®è£
+      %w( =jis-x0208		J78- 4 X), #ç¶æ¿ã®ã¢ãããã¯ãªå®è£
+      %w( =jis-x0213-1-2000	JX1- 4 X),
+      %w( =jis-x0213-2-2000	JX2- 4 X),
+      %w( =jis-x0212		JSP- 4 X),
+      %w( =big5-cdp		CDP- 4 X),
+      %w( =cns11643-1		C1-  4 X),
+      %w( =cns11643-2		C2-  4 X),
+      %w( =cns11643-3		C3-  4 X),
+      %w( =cns11643-4		C4-  4 X),
+      %w( =cns11643-5		C5-  4 X),
+      %w( =cns11643-6		C6-  4 X),
+      %w( =cns11643-7		C7-  4 X),
+      %w( =ks-x1001		K0-  4 X),
+      %w( =daikanwa		M-   5 d),
+      %w( =cbeta		CB   5 d),
+      %w( =gt			GT-  5 d),
+      %w( =gt-k			GT-K 5 d),
     ]
-    CODESYS_ORDER = %w(japanese chinese korean ideograph)
     REGEXP_PART = "&([-+0-9A-Za-z#]+);"
     REGEXP_ALL = "^#{REGEXP_PART}$"
 
@@ -173,7 +217,7 @@ module CHISE #==================================================================
       return "" unless er =~ Regexp.new(REGEXP_ALL) #ãªãããééã£ã¦ã?
       er = $1 #ã¤ãã§ã«ä¸­èº«ã®é¨åãåãåºã
       return $1.hex if er =~ /^MCS-([0-9A-Fa-f]+)/ #MCS
-#      if er =~ /^U[-+]?([0-9A-Fa-f]+)/ #Unicodeç´æã¡
+      #      if er =~ /^U[-+]?([0-9A-Fa-f]+)/ #Unicodeç´æã¡
       if er =~ /^U[-+]?([0-9A-Fa-f]+)/ || er =~ /^#x([0-9A-Fa-f]+)/ #Unicodeç´æã¡
 	return $1.hex 
       end
@@ -182,13 +226,14 @@ module CHISE #==================================================================
       each_codesys {|codesys, er_prefix, keta, numtype|	#p [codesys, er_prefix, keta, numtype]
 	numtyperegex = '\d' #if numtype == 'd'
 	numtyperegex = '[0-9A-Fa-f]' if numtype == 'X'
-	regexpstr = "^#{er_prefix}(#{numtyperegex}{#{keta},#{keta}})$"	#p regexpstr
+	regexpstr = "^#{er_prefix}(#{numtyperegex}{#{keta},#{keta}})$"
 	if er =~ Regexp.new(regexpstr)
 	  codestr = $1
 	  code = codestr.to_i #if numtype == 'd'
 	  code = codestr.hex if numtype == 'X'
 	  char_id_u8 = EntityReference.get_database(codesys, code)
 	  char_id_num = Character.parse_char_id(char_id_u8)
+	  next if char_id_num == nil
 	  return char_id_num
 	end
       }
@@ -196,21 +241,24 @@ module CHISE #==================================================================
     end
 
     def self.each_codesys()
-      CODESYS_ORDER.each {|lang|
-	CODESYS_TABLE.each {|codesys, er_prefix, keta, numtype| #æ®éããããæ¸ãæ¹ã¯ããªããã«ã¼ãä¸åã«ããã
-	  next unless codesys =~ lang
-	  yield(codesys, er_prefix, keta, numtype)
-	}
+#      CODESYS_ORDER.each {|lang|
+#	CODESYS_TABLE.each {|codesys, er_prefix, keta, numtype| #æ®éããããæ¸ãæ¹ã¯ããªããã«ã¼ãä¸åã«ããã
+#	  next unless codesys =~ lang
+#	  yield(codesys, er_prefix, keta, numtype)
+#	}
+#      }
+      CODESYS_TABLE.each {|codesys, er_prefix, keta, numtype|
+	yield(codesys, er_prefix, keta, numtype)
       }
     end
     def self.get_database(codesys, code)
       c = CodesysDB.instance.get(codesys, code)
       return c if c != nil
-      if codesys =~ /-jisx0208/
-	#return self.get_database("=jis-x0208", code) #åå¸°ã§ã©ãã ?
-	c = CodesysDB.instance.get("=jis-x0208", code)
-	return c
-      end
+#      if codesys =~ /-jisx0208/
+#	#return self.get_database("=jis-x0208", code) #åå¸°ã§ã©ãã ?
+#	c = CodesysDB.instance.get("=jis-x0208", code)
+#	return c
+#      end
       return nil
     end
   end
@@ -241,11 +289,6 @@ module CHISE #==================================================================
   end
 
   class Character #=============================================================== æå­ãªãã¸ã§ã¯ã
-    BASIC_KANJI = "äººå­å¥³æ¯ç¶çå£è³æè¶³åç®é¦æ¯å¿ç¬çé³¥è²è§ç¾½è«é¦¬é­ç¾èç®ç±³ç«¹æ¨éº¦è±å±±å·é¨é¢¨æ°´åç³éç°ç©´æ¥æç«é³ç³¸åèéæ¸è¡£ç¢å¼è»ç¿ä¸äºä¸åäºå­ä¸å«ä¹åç¾åä¸å¯¸å°ºä¸ä¸­ä¸æ¬çç«åé£è¡æ­¢äº¤åæ­©èå¥ç¤ºèµ°çåºæ¥æ¸è¨å¤§å°ç½éå¤å°é«é·"
-    def is_basic_kanji?
-      BASIC_KANJI.include?(self.to_s)
-    end
-
     def initialize(char_id=nil)
       @char_id = Character.parse_char_id(char_id)
       @attributes = Hash.new
@@ -263,6 +306,7 @@ module CHISE #==================================================================
     def normalize_attribute_name(b)
       a = b.dup
       a.gsub!(/_/, '-') #underlineã¯-ã«ç½®æ
+      a.sub!(/-at-/,  '@')
       a.sub!(/^map-/,  '=>')
       a.sub!(/^to-/,   '->')
       a.sub!(/^from-/, '<-')
@@ -272,11 +316,14 @@ module CHISE #==================================================================
       a = normalize_attribute_name(b)
       #p [a, b]
       atr = @attributes[a]
-      return atr if atr != nil
+      return atr if atr
       atr = check_database(a)
-      @attributes[a] = atr if atr != nil
-      return get_char_attribute("=jis-x0208") if a =~ /jisx0208/ #ããã ãç¹æ®å½¢
-      return @attributes[a]
+      if atr
+	@attributes[a] = atr
+	return atr
+      end
+      return get_char_attribute("="+a) unless a =~ /^=/ #é ­ã«=ãã¤ãã¦ãªãå ´åã¯ãããçç¥ããã¦ãããã¨ãä»®å®ãã¦ãåå¸°ãã
+      nil
     end
     def put_char_attribute(b,v)
       a = normalize_attribute_name(b)
@@ -380,1031 +427,182 @@ module CHISE #==================================================================
       ar = %w{ucs-jis ucs =>ucs-jis}
       #ä¸¦ã³é ã¯æ£æçã§ãucs-jisãåã«åºãã¦ãããæ¬æ¥ã¯ãããæå®ã§ããããã«ããã¹ãã
       ar.each {|a|	#p [a]
-	 u = get_char_attribute(a)
-	 return u if u != nil
-       }
-       return nil
-     end
-
-     #----------------------------------------------------------------------CCSé¢ä¿
-     def to_utf8() Uconv.u4tou8(Character.u4itou4(ucs())) end #UTF8æå­åãè¿ã
-     #alias to_s to_utf8
-     alias to_s mcs_utf8
-     def map_utf8()
-       u = ucs()
-       if u.nil? || 0xffff < u
-	 return to_er()
-       else
-	 return to_utf8()
-       end
-     end
-     alias map_ucs map_utf8
-     def map_ucs_er()
-       u = ucs()
-       if u.nil? || 0xffff < u
-	 return to_er()
-       else
-	 return Character.get(u).to_er()
-       end
-     end
-     def to_euc()
-       u = ucs()
-       return "" if u.nil? || 0xffff < u
-       Uconv.u16toeuc(Uconv.u4tou16(Character.u4itou4(ucs())))
-     end
-     def map_euc()
-       e = to_euc()
-       return e if e != ""
-       return to_er()
-     end
-     def to_sjis()
-       u = ucs()
-       return "" if u.nil? || 0xffff < u
-       Uconv.u16tosjis(Uconv.u4tou16(Character.u4itou4(ucs())))
-     end
-     def map_sjis()
-       e = to_sjis()
-       return e if e != ""
-       return to_er()
-     end
-
-     #----------------------------------------------------------------------
-     def to_er(codesys=nil) #å®ä½åç§ãè¿ããå¸æããcodesysãå¼æ°(æªå®è£)
-       return "" if @char_id == nil
-       return sprintf("&#x%04x;", @char_id) if @char_id <= 0xffff
-       return sprintf("&#x%05x;", @char_id) if @char_id <= 0xfffff
-       EntityReference.each_codesys {|codesys, er_prefix, keta, numtype|
-	 code = self[codesys]
-	 next if code == nil
-	 return sprintf("&#{er_prefix}%0#{keta}#{numtype};", code)
-       }
-       return sprintf("&MCS-%08X;", @char_id) #æ¬å½ã¯ããã¯ç¡ãã«ããã
-     end
-     def to_er_list()
-       ar = []
-       EntityReference.each_codesys {|codesys, er_prefix, keta, numtype|
-	 er = to_er(codesys)
-	 ar << er if er != nil
-       }
-       ar
-     end
-
-     def inspect_x()
-       return "<>" if @char_id == nil
-       ar = [to_utf8(), to_er().sub(/^&/,'').chop]
-       "<"+ar.join(',')+">"
-     end
-     alias inspect inspect_x
-     def inspect_all_codesys() #æªå®æ
-       #to_erãå¨ã¦ã®codesysã«ããã¦å®è¡ããããã®çµæãã³ã³ãã¯ãã«ã¾ã¨ãã
-     end
-     def inspect_all()
-       ar = [inspect.chop]
-       alist.to_a.sort.each {|a, v| ar << "#{a}:#{v}" }
-       return ar.join(',')+">"
-     end
-     def get_attributes()
-       str = ""
-       alist.to_a.sort.each {|a, v|
-	 str += "#{a}: #{v}\n"
-       }
-       str
-     end
-
-     def inspect_ids(hex_flag=false)
-       ids = decompose
-       ar = []
-       ar << (hex_flag ? "x"+mcs_hex : to_utf8)
-       if to_s != ids #idsãé¨åãã®ãã®ã ã£ããé¨åè¿½å ã¯ããªã
-	 ids.each_char {|ch|
-	   char = ch.char
-	   next if char.is_ids?
-	   if hex_flag then
-	     ar << "x"+char.mcs_hex
-	   else
-	     u = char.to_utf8
-	     if u != ""
-	       ar << u
-	     else
-	       ar << char.to_er
-	     end
-	   end
-         }
-       end
-       return "("+ar.join("\t")+")"
-     end
-
-     #----------------------------------------------------------------------IDSé¢ä¿
-     def decompose
-       k = self.to_s
-#       idss = self['ids']
-#       return idss if idss
-#       return k if self.is_basic_kanji? #åºæ¬æ¼¢å­ã¯stop kanjiã¨ãããã¨ã
-       return self['ids-represent'] if self['ids-represent'] #ids_representãæã£ã¦ããå ´åã¯ãã®å¤ã¨ããã
-       return self['ids-element'] if self['ids-element'] #ids_elementãæã£ã¦ããå ´åã¯ãã®å¤ã¨ããã
-
-       idss = self['ids-meaning']
-       return idss if idss != nil && 0 < idss.length && k != idss
-       idss = self['ids-aggregated']
-       return idss if idss != nil && 0 < idss.length && k != idss
-       idss = self['ids']
-       return idss if idss != nil && 0 < idss.length && k != idss
-       return k
-#       return k if idss.nil? || idss.length == 0 || k == idss
-#       if idss.char_length == 2
-#	p ['What???', k, idss, k.inspect_all]
-#	 #return idssx[1] #äºåç®ã ãè¿ãã¨ã?
-#	 return k #IDSã«å±éããæ¹æ³ãç¡ãã¨ã
-#       end
-#       return k if k == idss
-#       if idss.include?(k) #<C5-4C4D><C6-4A37>ãã®äºæå­ã®BUGå¯¾ç­
-#	 #return idss.sub(k, '')
-#	 return k #IDSã«å±éããæ¹æ³ãç¡ãã¨ã
-#       end
-#       return idss
-     end
-     def decompose_all
-       pde = ""
-       de = self.decompose #åºçºç¹
-       level = 0
-       while true
-	 pde = de
-	 de = pde.decompose #ããä¸åº¦åè§£ããã¦ã¿ãã
-	 break if pde == de #ã«ã¼ããæãã ã
-	 exit if 10 < level #p ['too many recursive', self] 
-	 level += 1
-       end
-       return de
-     end
-     def decompose_all_nu(level=nil)
-       level = 0 if level.nil?
-       if 10 < level
-	 p ['too many recursive', self] 
-	 exit
-       end
-       de = self.decompose
-       return de.decompose_all(level+1) if de != self #ãªã«ãå¤åããã£ãããåå¸°
-       return de #ããããä»¥ä¸å¤åã¯ç¡ãããã ãã¨ã
-     end
-     def is_ids?() 0x2ff0 <= @char_id && @char_id <= 0x2fff end
-     def ids_operator_argc()
-       return 0 unless is_ids?
-       return 3 if @char_id == 0x2ff2 || @char_id == 0x2ff3
-       return 2
-     end
-   end
-
-   class DBS #======================================================================è¤æ°ã®DBãéããclassãæªå®æ
-   end
-
-   class ADB < BDB::Hash #======================================================================ä¸ã¤ã®DB
-     def initialize(*args)
-       super
-       @modified = false
-       at_exit {
-	 if @modified
-	   self.close #ããããªãã¨ããã¾ããã¼ã¿ãã¼ã¹ãã»ã¼ããããªãã®ã§ãã
-	 end
-       }
-     end
-     def self.open_create(filename)
-       ADB.open(filename, nil, BDB::CREATE | BDB::EXCL) #ä¸æ¸ãã¯ããªã
-     end
-     def mykey(key)
-       if key.is_a?(String)
-	 if key.char_length == 1
-	   return '?'+key  #Stringã ã£ããå¼ãåã«?ãè¶³ã
-	 end
-       end
-       #key = key.to_s if key.is_a?(Numeric) #Numberã ã£ããStringã«ããã
-       #ããã§ && key ! =~ /^\?/ ããããã¨ã?èªèº«ãæ¤ç´¢ã§ããªããªã£ã¦ãã¾ãã
-       return key
-     end
-     def myvalue(v)
-       return v if v == nil
-       return v.to_i if v =~ /^\d+$/ #æ°å­ã ã£ããããã§å¤æãã¦ãã
-       return v.sub(/^\?/, '') if v =~ /^\?/ #åé ­ã®?ã¯åãé¤ã
-       return $1 if v =~ /^"(.+)"$/ #æåã¨æå¾ã«"ãã¤ãã¦ããããåãé¤ã
-       #p ['get', v, t, key, db]
-       #return parse_sexp(v) if v =~ /^\(.+\)$/ #æåã¨æå¾ã()ã®æã¯ãSå¼ã«parseãã
-       return v #ããä»¥å¤ã£ã¦ä½?
-     end
-     def myget(key) #keyã­ã¼ãå¼ãã¦è¿ã
-       key = mykey(key)
-       v = get(key) #å­å¨ããªãã£ããnilãè¿ããã¨ã«ãªã
-       return myvalue(v)
-     end
-     def myput(key, v) #keyã«vãããã
-       key = mykey(key)
-       put(key, v) #putãã
-       @modified = true
-     end
-   end
-
-   class DB #======================================================= ãã¼ã¿ãã¼ã¹ç¾¤ã®abstract class
-     def self.unix_to_win(unix) #Windowsãã¡ã¤ã«åå¶éã®ãããå¤æãã
-       win = unix.gsub(/</, '(')
-       win.gsub!(/>/, ')')
-       win.gsub!(/\*/, '+')
-       win.gsub!(/\?/, '!')
-       return win
-     end
-     def self.win_to_unix(win)
-       unix = win.gsub(%r|\)|, '>')
-       unix.gsub!(%r|\(|, '<')
-       unix.gsub!(%r|!|, '?')
-       unix.gsub!(%r|\+|, '*')
-       return unix
-     end
-     def get_filename(t)
-       return @pre + DB.unix_to_win(t) + @post if windows?
-       return @pre + t + @post
-     end
-     def get_dirname(t) File.dirname(get_filename(t)) end
-     def open_dbs()
-       @dbs = Hash.new
-       keys = find_keys()
-       keys.each {|key| open_db(key) }
-     end
-     def find_keys()
-       files = []
-       Dir.glob(@glob){|f|
-	 next if ! File.file?(f)
-	 next if f =~ /.txt$/
-	 files << f
-       }
-       keys = []
-       files.each {|f|
-	 t = DB.win_to_unix(f)
-	 t.sub!(%r|^#{@pre}|, '')
-	 t.sub!(%r|#{@post}$|, '') if @post != ""
-	 keys << t
-       }
-       return keys
-     end
-     def close_db(t)
-       db = get(t)
-       return nil if db.nil?
-       db.close
-       @dbs.delete(t)
-     end
-     def open_db(t)
-       return nil if get(t) #ãã§ã«openãã¦ãããåopenã¯ããªãã
-       begin
-	 bdb = ADB.open(get_filename(t), nil, 0)
-	 @dbs[t] = bdb if bdb != nil
-       rescue
-	 p ["open error", get_filename(t)]; return nil
-       end
-       return true
-     end
-     def make_db(t, h=nil) #tã¨ããååã§hã¨ããä¸­èº«ã®ãã¼ã¿ãã¼ã¹ãä½ã
-       return nil if get(t) #ãã§ã«ããå ´åã¯return
-       Dir.mkdir(get_dirname(t)) unless FileTest.exist?(get_dirname(t))
-       db = nil
-       begin
-	 db = ADB.open_create(get_filename(t)) #ä¸æ¸ãã¯ããªã
-	 if h != nil
-	   h.each {|k, v|
-	     k = '?'+k if k.is_a?(String)
-	     db[k] = v
-	   }
-	 end
-	 db.close
-       rescue
-	 p ["make error", get_filename(t)]; return nil
-       end
-       return true
-     end
-     def make_db_no_question_mark(t, h=nil) #tã¨ããååã§hã¨ããä¸­èº«ã®ãã¼ã¿ãã¼ã¹ãä½ã
-       return nil if get(t) #ãã§ã«ããå ´åã¯return
-       Dir.mkdir(get_dirname(t)) unless FileTest.exist?(get_dirname(t))
-       db = nil
-       begin
-	 db = ADB.open_create(get_filename(t)) #ä¸æ¸ãã¯ããªã
-	 if h != nil
-	   h.each {|k, v|
-#	     k = '?'+k if k.is_a?(String)
-	     db[k] = v
-	   }
-	 end
-	 db.close
-       rescue
-	 p ["make error", get_filename(t)]; return nil
-       end
-       return true
-     end
-     def remove_db(t) #tã¨ããååã®ãã¼ã¿ãã¼ã¹ãæ¶å»ãã
-       db = get(t)
-       if db
-	 db.close
-	 @dbs.delete(t)
-       end
-       begin
-	 File.unlink(get_filename(t)) if FileTest.file?(get_filename(t))
-       rescue
-	 p ["unlink error", get_filename(t)]; return nil
-       end
-       dn = get_dirname(t)
-       Dir.rmdir(dn) if FileTest.directory?(dn) && Dir.entries(dn).length <= 2 #ç©ºdirectoryã ã£ããæ¶ã
-       return true
-     end
-     def to_num(s)
-       return s.to_i if s =~ /^\d+$/
-       return s
-     end
-     def dump_db(t)
-       db = get(t)
-       return nil unless db
-       file = get_filename(t)
-       open("#{file}.txt", "w"){|out|
-#	 out.binmode.sync = true
-	 ar = db.to_a
-	 ar.map! {|k, v| [to_num(k), to_num(v)] }
-	 ar.sort.each {|k, v|
-	   out.printf("%s\t%s\n", k, v)
-	 }
-       }
-       return true
-     end
-     def each_db()  @dbs.to_a.sort.each {|t, db| yield(t, db) } end
-     def dump_all()  each_db {|t, db| dump_db(t) } end
-     def close_all() each_db {|t, db| db.close   } end
-     def keys() @dbs.keys end
-     def each(t)
-       return unless block_given?
-       db = @dbs[t]
-       return nil unless db
-       db.each {|k, v|
-	 k = to_num(k)
-	 v = to_num(v)
-	 k.sub!(/^\?/, '') if k =~ /^\?/ #åé ­ã®?ã¯åãé¤ã
-	 vv = get(t, k)	#p ['each', t, k, v, vv]
-	 yield(k, vv)
-       }
-     end
-     def each_sort(t)
-       return unless block_given?
-       db = @dbs[t]
-       return nil unless db
-       ar = db.to_a
-       ar.map! {|k, v| [to_num(k), to_num(v)] }
-       ar.sort.each {|k, v|
-	 k.sub!(/^\?/, '') if k =~ /^\?/ #åé ­ã®?ã¯åãé¤ã
-	 vv = get(t, k)	#p ['each', t, k, v, vv]
-	 yield(k, vv)
-       }
-     end
-     #----------------------------------------------------------------------
-     def get(t, key=nil) #tã¨ãããã¼ã¿ãã¼ã¹ã®keyã­ã¼ãå¼ãã¦è¿ã
-       db = @dbs[t]
-       return db if key.nil?
-       return nil unless db
-       return db.myget(key)
-     end
-     def put(t, key, v) #tã¨ãããã¼ã¿ãã¼ã¹ã®keyã«vãããã
-       db = @dbs[t]
-       if db == nil
-	 db = make_db(t) 
-	 db = open_db(t) 
-	 db = @dbs[t]
-       end
-       db.myput(key, v) #putãã
-     end
-   end
-
-   class CharDB < DB #------------------------------------ MCS-UTF8ãã­ã¼ã¨ããå±æ§ã¸ã®ãã¼ã¿ãã¼ã¹
-     include Singleton
-     def initialize()
-       super
-       @glob, @pre, @post = "#{DB_DIR}/system-char-id/*", "#{DB_DIR}/system-char-id/", ""
-       open_dbs()
-     end
-     def get_all(u8) #å¨ãã¼ã¿ãã¼ã¹ã®u8ã­ã¼ãå¼ãã¦Hashã«ã¾ã¨ãã¦è¿ã
-       atrs = Hash.new
-       @dbs.each {|t, db|
-	 v = get(t, u8)
-	 atrs[t] = v if v != nil
-       }
-       return atrs
-     end
-   end
-
-   class CodesysDB < DB #----------------------------------------------------------------------
-     include Singleton
-     def initialize()
-       super
-       @glob, @pre, @post = "#{DB_DIR}/*/system-char-id", "#{DB_DIR}/", "/system-char-id"
-       open_dbs()
-     end
-     #def keys() @dbs.keys.sort end #ã©ããªCodesysã®æå ±ãæã£ã¦ãããã®ä¸è¦§
-     def keys() @dbs.keys end #ã©ããªCodesysã®æå ±ãæã£ã¦ãããã®ä¸è¦§
-     def get_codesys(t)
-       db = get(t)
-       return nil unless db
-       return Codesys.new(t)
-     end
-   end
-
-   class Codesys < DB #======================================================================
-     def initialize(name)
-#       super
-       @name = name
-       @dbs = CodesysDB.instance
-     end
-     def keys() #ã©ããªã³ã¼ããã¤ã³ãã®æå ±ãæã£ã¦ãããã®ä¸è¦§
-       ks = @dbs.get(@name).keys
-       if @name =~ /jisx0208/ #ç¹å¥å¦ç
-	 n = @dbs.get('=jis-x0208').keys 
-	 #	 p ['keys', @name, ks, n]
-	 ks += n
-       end
-       ks.map! {|k| to_num(k) }
-       ks
-     end
-     def get(key)
-       v = @dbs.get(@name, key)
-       return v if v
-       if @name =~ /jisx0208/ #jisx0208ãå«ã¾ãã¦ããå ´åã ãç¹å¥å¦çãã
-	 return @dbs.get('=jis-x0208', key)
-       end
-       return nil
-     end
-     def each()
-       return unless block_given?
-       db = @dbs.get(@name)
-       return nil unless db
-       db.each {|k, v|
-	 k = to_num(k)
-	 v = to_num(v)
-	 k.sub!(/^\?/, '') if k =~ /^\?/ #åé ­ã®?ã¯åãé¤ã
-	 vv = @dbs.get(@name, k)	#p ['each', t, k, v, vv]
-	 yield(k, vv)
-       }
-     end
-     def each_sort()
-       return unless block_given?
-       db = @dbs.get(@name)
-       return nil unless db
-       ar = db.to_a
-       ar.map! {|k, v| [to_num(k), to_num(v)] }
-       ar.sort.each {|k, v|
-	 k.sub!(/^\?/, '') if k =~ /^\?/ #åé ­ã®?ã¯åãé¤ã
-	 vv = @dbs.get(@name, k)	#p ['each', t, k, v, vv]
-	 yield(k, vv)
-       }
-     end
-   end
-
-  class IDS_TEXT_DB < DB #======================================================================
-    include Singleton
-    if CHISE.windows?()
-      IDS_DB_DIR = 'd:/work/chise/ids/' #ãã®å¾ã«IDS-JIS-X0208-1990.txtã¨ããæãã«ç¶ã
-    else
-      IDS_DB_DIR = '/home/eto/work/chise/ids/' #ãã®å¾ã«IDS-JIS-X0208-1990.txtã¨ããæãã«ç¶ã
-    end
-    IDS_LIST = "
-IDS-UCS-Basic.txt
-#IDS-UCS-Compat-Supplement.txt
-#IDS-UCS-Compat.txt
-IDS-UCS-Ext-A.txt
-IDS-UCS-Ext-B-1.txt
-IDS-UCS-Ext-B-2.txt
-IDS-UCS-Ext-B-3.txt
-IDS-UCS-Ext-B-4.txt
-IDS-UCS-Ext-B-5.txt
-IDS-UCS-Ext-B-6.txt
-IDS-JIS-X0208-1990.txt
-IDS-Daikanwa-01.txt
-IDS-Daikanwa-02.txt
-IDS-Daikanwa-03.txt
-IDS-Daikanwa-04.txt
-IDS-Daikanwa-05.txt
-IDS-Daikanwa-06.txt
-IDS-Daikanwa-07.txt
-IDS-Daikanwa-08.txt
-IDS-Daikanwa-09.txt
-IDS-Daikanwa-10.txt
-IDS-Daikanwa-11.txt
-IDS-Daikanwa-12.txt
-IDS-Daikanwa-dx.txt
-IDS-Daikanwa-ho.txt
-IDS-CBETA.txt
-".split
-    def initialize()
-      super
-      @ids_list = IDS_LIST
-      @chars = []
-      @glob, @pre, @post = "#{IDS_DB_DIR}/db/*", "#{IDS_DB_DIR}/db/", ""
-      dir = File.dirname(@pre)
-      Dir.mkdir(dir) unless FileTest.exist?(dir)
-      open_dbs()
-    end
-    def each_file()
-      return unless block_given?
-      @ids_list.each {|file|
-	next if file =~ /^#/
-	yield(IDS_DB_DIR+file)
-      }
-    end
-    def each_line(file)
-      open(file){|f|
-	while line = f.gets
-	  next if line =~ /^;/ #ã³ã¡ã³ãã¯ã¨ã°ã
-	  line.chomp!
-	  code, char, ids = line.split
-	  yield(code, char, ids)
-	end
-      }
-    end
-    def dump_text_all
-      each_file {|file|
-	dir = File.dirname(file) + '/../ids-new/'
-	Dir.mkdir(dir) if ! FileTest.directory?(dir)
-	newfile = dir + File.basename(file)
-	p [file, newfile]
-	open(newfile, "w"){|out|
-	  out.binmode.sync = true
-	  each_line(file){|code, ch, ids|
-	    char = Character.get(ch)
-	    ids = char.decompose
-	    out.print "#{code}	#{ch}	#{ids}\n"
-	  }
-	}
+	u = get_char_attribute(a)
+	return u if u != nil
       }
+      return nil
     end
-    def make_ids_error
-      each_file {|file|
-	dir = File.dirname(file) + '/../ids-error'
-	Dir.mkdir(dir) unless FileTest.exist?(dir)
-	errfile = dir + '/' + File.basename(file)
-#	p [file, errfile]
-	open(errfile, "w"){|out|
-	  out.binmode.sync = true
-	  each_line(file){|code, ch, ids|
-	    char = Character.get(ch)
-	    ids_error = char['ids-error']
-	    next if ids_error.nil?
-	    out.print "#{code}	#{ch}	#{ids}	#{ids_error}\n"
-	  }
-	}
-      }
-    end
-  end
-
-  class IDS_DB < DB #======================================================================BDBåããIDS DBãæ±ã
-    include Singleton
-    def initialize
-      @dbs = CharDB.instance
-    end
-    def make_ids_db
-      db = IDS_TEXT_DB.instance
-      db.each_file {|file|
-	@char_counter = 0
-	@same_ids_counter = 0
-	@good_ids_counter = 0
-	@conflict_ids_counter = 0
-	db.each_line(file){|code, ch, ids|
-	  @char_counter += 1
 
-	  ids = "" if ids == nil
-	  next if ids == "" #IDSãå®ç¾©ããã¦ããªãå ´åã¯ããã£ããã¨ç¡è¦ããã¹ããã
-
-	  charimg = Character.get(ch) #å®ä½åç§ã§ããå¯è½æ§ããã
-
-	  next if code =~ /'$/ || code =~ /"$/ #å¤§æ¼¢åçªå·ã®ããã·ã¥ä»ãã¯ç¡è¦ãã
-	  char = Character.get("&"+code+";") #codeè¡¨è¨ãåã«å®ä½åç§ãä½ã£ã¦è§£éãã
-	  if char.nil? || char.to_s == "" #ãã¾ãæå­ã«ãªããªãã£ã
-	    print "char == null	#{char.inspect}	#{code}	#{ch}	#{ids}\n" unless code =~ /^M-/ || code =~ /^CB/
-	    #å¤§æ¼¢åãCBETAä»¥å¤ã®å ´åã¯ãã¨ã©ã¼ã¡ãã»ã¼ã¸ã
-	    next
-	  end
-	  if char != charimg #codeè¡¨è¨ã¨æå­ãä¸è´ãã¦ããªã?
-	    unless code =~ /^M-/ || code =~ /^MH-/ || code =~ /^CB/ #é£ãéã£ã¦ãã¦å½ç¶ã§ããã®ã§ä½ãããªã
-	      print "unknown char	#{char.inspect}	#{code}	#{ch}	#{ids}\n"
-	      next #ããä»¥å¤ã®å ´åã¯ã¨ã©ã¼ã¡ãã»ã¼ã¸ãã ãã¦ãæ¬¡ã¸ã
-	    end
-	  end
-	  #next if !char.has_attribute? #isolated characterã¯ã¾ãããã¾ããªãã
-
-	  ids.de_er! #å®ä½åç§ãè§£é¤ãã
-	  next if ids == char.to_s #ããæå­ã¨ã¾ã£ããä¸ç·ãªããæå³ãç¡ãã®ã§æå ±ãæããªã
-	  next if ids.char_length == 1
-
-	  idstree = IDS_Tree.new(ids)
-	  c = idstree.check_integrity
-	  c = "contains self" if ids.include?(char.to_s)
-	  if c #ã¡ãã£ã¨ã§ãã¨ã©ã¼ãããå ´åã¯ã
-	    char['ids-error'] = c #ã¨ã©ã¼ãè¨é²ãã¦ããã¼ã¿ã¨ãã¦ã¯ä¿æããªã
-	    next
-	  end
-
-	  if char['ids'].nil? || char['ids'] == "" #åãIDSãç¡ãã£ãå ´åã¯ã
-	    char['ids'] = ids #æ®éã«ä»£å¥ããã°ããã§ããã§ãã
-	    @good_ids_counter += 1
-	  else #ããããã¾ã¾ã§ã«ãã§ã«IDSãå®ç¾©ããã¦ããå ´åã¯?
-	    if char['ids'] == ids #æ°ããIDSã¨å¤ãIDSãå®å¨ã«ä¸è´ãããªãç¡è¦ãã¾ãããã
-	      @same_ids_counter += 1
-	    else #ããããã¾ã¾ã§ã®IDSã¨æ°ããIDSãé£ãéã£ãå ´åã¯?
-	      @conflict_ids_counter += 1
-#	      print "conflict	#{char.inspect}	#{code}	#{ids}	#{char['ids']}\n"
-	    end
-	  end
-	}
-	print "#{file}	#{@char_counter}	#{@same_ids_counter}	#{@conflict_ids_counter}	#{@good_ids_counter}\n"
-	CharacterFactory.instance.reset()
-      }
-      @dbs.dump_db('ids-error') #ãã­ã¹ãåãã
-      @dbs.dump_db('ids') #ãã­ã¹ãåãã
-    end
-    def make_ids_reverse
-      h = Hash.new
-      @dbs.each('ids') {|k, v|
-	char = k.char
-	ids = char.decompose
-	h[ids] = "" if h[ids].nil?
-	h[ids] += k #è¿½å ãã
-      }
-      h.each {|k, v|
-	h[k] = char_sort(v) #æå­ã®é çªããããä½¿ãã£ã½ããã®ããã®é çªã«ãã
-      }
-      h.delete_if {|k, v| #h[k]ã""ã«ãªãå¯è½æ§ãããããããã¯keyã¨ãã¦å¥ããªããã¨ã«ããã
-	v == ""
-      }
-      print "length	#{h.length}\n"
-      cdb = CodesysDB.instance
-      cdb.make_db_no_question_mark('ids', h)
-      cdb.open_db('ids') #ãããç¡ãã¨ãdump_dbããã¾ããã
-      cdb.dump_db('ids')
-    end
-    def char_sort(composed)
-      return composed if composed.char_length == 1
-      ar = composed.to_a
-      arorg = ar.dup
-      ar2 = []
-      ar.dup.each {|ch|
-	char = ch.char
-	if char.char_id < 0xfffff #Unicodeã£ã½ã?
-	  ar2 << ch
-	  ar.delete(ch)
-	end
-      }
-      if 0 < ar.length
-	EntityReference.each_codesys{|codesys, er_prefix, keta, numtype|
-	  ar.each {|ch|
-	    char = ch.char
-	    v = char[codesys]
-#	    p [codesys, v] if v
-	    if v #EntityReferenceã®é çªã«æºæ ããã
-	      ar2 << ch
-	      ar.delete(ch)
-	    end
-	  }
-	}
-      end
-      if 0 < ar.length
-#	p ['yokuwakaran character', ar, ar[0].inspect_all, arorg]
-	EntityReference.each_codesys{|codesys, er_prefix, keta, numtype|
-	  ar.dup.each {|ch|
-	    char = ch.char
-	    v = char[codesys]
-#	    p [codesys, v] if v
-	  }
-	}
+    #----------------------------------------------------------------------CCS related
+    def to_utf8() Uconv.u4tou8(Character.u4itou4(ucs())) end # Returns this character as a UTF-8 string: ucs() passed through Character.u4itou4, then Uconv.u4tou8.
+    #alias to_s to_utf8
+    alias to_s mcs_utf8
+    def map_utf8() # Returns to_utf8() when ucs() is at most 0xffff; when ucs() is nil or larger, falls back to to_er().
+      u = ucs()
+      if u.nil? || 0xffff < u
+	return to_er()
+      else
+	return to_utf8()
       end
-      return ar2.join("")
     end
-    def dump_ids_duplicated
-      open('ids-duplicated.txt', 'w'){|out|
-	#out.binmode
-	CodesysDB.instance.each('ids') {|k, v|
-	  if v.nil?
-	    out.print "nil	#{k}	#{v}\n"
-	    next
-	  end
-	  n = v.char_length
-	  next if n == 1
-	  out.print "#{n}	#{k}	#{v}"
-	  v.each_char {|ch|
-	    char = ch.char
-	    out.print "	#{char.inspect}"
-	  }
-	  out.print "\n"
-	}
-      }
-    end
-    def make_ids_aggregated
-      @dbs.each('ids') {|k, v|
-	char = k.char
-	ids = char.decompose
-	ag = ids.aggregate
-	char['ids-aggregated'] = ag
-      }
-      @dbs.dump_db('ids-aggregated')
+    alias map_ucs map_utf8
+    def map_ucs_er() # Returns an entity reference: self.to_er() when ucs() is nil or above 0xffff, otherwise the to_er() of Character.get(u).
+      u = ucs()
+      if u.nil? || 0xffff < u
+	return to_er()
+      else
+	return Character.get(u).to_er()
+      end
     end
-    def dump_ids_aggregated
-      open('ids-aggregated.txt', 'w'){|out|
-	#out.binmode
-	@dbs.each('ids') {|k, v|
-	  char = k.char
-	  ids = char['ids']
-	  ag  = char['ids-aggregated']
-	  out.print "#{char.to_s}	#{ag}	#{ids}\n" if ids != ag
-	}
-      }
+    def to_euc() # Returns "" when ucs() is nil or above 0xffff; otherwise the result of Uconv.u16toeuc (presumably an EUC-JP string -- confirm).
+      u = ucs()
+      return "" if u.nil? || 0xffff < u
+      Uconv.u16toeuc(Uconv.u4tou16(Character.u4itou4(ucs())))
     end
-    def make_ids_parts
-      @dbs.each('ids') {|k, v|
-	char = k.char
-	pids = char.to_s
-	ar = []
-	counter = 0
-	loop {
-	  ids = pids.decompose
-	  break if ids == pids #ããä»¥ä¸åå²ã§ããªãããã ã£ããçµäºãã
-	  ar += ids.to_a
-	  counter += 1
-	  p [char.to_s, pids, ids, ar] if 10 < counter #ããã¯ä½ããããããã¨
-	  pids = ids
-	}
-	ar.sort!
-	ar.uniq!
-#ãã£ã±ãIDSæå­ãå ãããã¨ã«ãã. by eto 2003-02-05
-#	ar.delete_if {|ch|
-#	  ch.char.is_ids? #IDSæå­ã¯ã¾ãããã¾ããªãã
-#	}
-	str = ar.join('')
-	char['ids-parts'] = str
-      }
-      @dbs.dump_db('ids-parts')
+    def map_euc() # Returns to_euc(), or to_er() when to_euc() yields "".
+      e = to_euc()
+      return e if e != ""
+      return to_er()
     end
-    def make_ids_contained
-      h = Hash.new
-      @dbs.each('ids-parts') {|k, v|
-	char = k.char
-	parts = char.ids_parts
-	parts.each_char {|ch|
-#	  part = ch.char
-	  h[ch] = [] if h[ch].nil?
-	  h[ch] << k
-#	  h[ch] += k
-#	  part['ids-contained'] = "" if part['ids-contained'].nil?
-#	  part['ids-contained'] += k
-	}
-      }
-      h.each {|k, v|
-	char = k.char
-	v.sort!
-	char['ids-contained'] = v.join('')
-	
-      }
-      @dbs.dump_db('ids-contained')
+    def to_sjis() # Returns "" when ucs() is nil or above 0xffff; otherwise the result of Uconv.u16tosjis (presumably a Shift_JIS string -- confirm).
+      u = ucs()
+      return "" if u.nil? || 0xffff < u
+      Uconv.u16tosjis(Uconv.u4tou16(Character.u4itou4(ucs())))
     end
-    def make_ids_decomposed
-      @dbs.each('ids') {|k, v|
-	char = k.char
-	de= char.decompose_all
-	char['ids-decomposed'] = de
-      }
-      @dbs.dump_db('ids-decomposed')
+    def map_sjis() # Returns to_sjis(), or to_er() when to_sjis() yields "".
+      e = to_sjis()
+      return e if e != ""
+      return to_er()
     end
-  end
 
-  class Node < Array #=======================================================æ¨æ§é ã®ä¸­ã®ä¸ã¤ã®æ
-    def initialize(nodeleaf=nil, nodenum=nil)
-      super()
-      @nodeleaf = nodeleaf
-      @nodenum = nodenum
-      if @nodeleaf
-	original_add(@nodeleaf)
-      end
-    end
-    attr_reader :nodenum
-    alias original_add <<
-    private :original_add
-    def <<(obj)
-      original_add(obj)
-      @nodenum -= 1 if @nodenum
+    #----------------------------------------------------------------------
+    def to_er(codesys=nil) # Returns an entity reference string for this character. The codesys argument (the preferred codesys) is not implemented: its value is never read.
+      return "" if @char_id == nil
+      return sprintf("&#x%04x;", @char_id) if @char_id <= 0xffff
+      return sprintf("&#x%05x;", @char_id) if @char_id <= 0xfffff
+      EntityReference.each_codesys {|codesys, er_prefix, keta, numtype| # the block parameter reuses the name codesys; keta is the zero-padded field width
+	code = self[codesys]
+	next if code == nil
+	return sprintf("&#{er_prefix}%0#{keta}#{numtype};", code) # the first codesys that has a value for this character wins
+      }
+      return sprintf("&MCS-%08X;", @char_id) # last-resort form; the author would prefer to get rid of it
     end
-    def nodes
+    def to_er_list() # Returns an array holding one to_er(codesys) result per codesys yielded by EntityReference.each_codesys.
       ar = []
-      ar << self.to_s
-      self.each {|n|
-	ar += n.nodes if n.is_a? Node
+      EntityReference.each_codesys {|codesys, er_prefix, keta, numtype|
+	er = to_er(codesys) # NOTE(review): to_er never reads its codesys argument, so every entry looks identical -- confirm intent
+	ar << er if er != nil
       }
-      return ar
+      ar
     end
-  end
 
-  class Tree #======================================================================æ¨æ§é ãæ±ã
-    def initialize()
-      @root = Node.new()
-      @stack = [@root]
-      @leafnum = 0
-      @depth = 1 #stackã®æ·±ããæå¤§ã«ãªã£ãã¨ããã®å¤ãæ¨æ§é ãç¡ãã¨ãã¯1ã¨ãªã
-    end
-    def depth() @depth - 1 end
-    def add_node(nodeleaf=nil, nodenum=nil) #æãè¿½å 
-      new_node = Node.new(nodeleaf, nodenum)
-      @stack.last << new_node
-      @stack << new_node
-      if @depth < @stack.length
-	@depth = @stack.length
-      end
-      self
-    end
-    def end_node() #ãã®æã¯çµã
-      @stack.pop
-      self
+    def inspect_x() # Short debug form "<utf8,er>", where er is to_er() without its leading "&" and its last character; "<>" when @char_id is nil.
+      return "<>" if @char_id == nil
+      ar = [to_utf8(), to_er().sub(/^&/,'').chop]
+      "<"+ar.join(',')+">"
     end
-    def add_leaf(a) #èãè¿½å 
-      @stack.last << a
-      end_check()
-      self
+    alias inspect inspect_x
+    def inspect_all_codesys() # Unfinished stub: the body is empty, so it returns nil.
+      # Intended: run to_er for every codesys and summarize the results compactly.
     end
-    def end_check()
-      n = @stack.last.nodenum
-      if n && n == 0
-	end_node()
-	end_check() #åå¸°
-      end
-    end
-    def check_integrity
-      n = @stack.last.nodenum
-      return nil if @root.length == 0 #no tree is good tree
-      return "unmatch leaves" if n && n != 0
-      return "extra nodes" if @root.first.is_a?(Node) && @root.length != 1
-      return "extra leaves" if @root.length != 1
-      return nil
-    end
-    def nodes
-      r = @root.nodes
-      r.shift
-      r
-    end
-    def sub_nodes
-      r = nodes
-      r.shift
-      r
+    def inspect_all() # Returns the inspect text with ",attr:value" appended for every alist entry (sorted), closed by a single ">".
+      ar = [inspect.chop] # chop removes the last character of inspect so the attributes can be appended before ">"
+      alist.to_a.sort.each {|a, v| ar << "#{a}:#{v}" }
+      return ar.join(',')+">"
     end
-    def to_s()    @root.to_s    end
-    def inspect() @root.inspect end
-  end
-
-  class IDS_Tree < Tree #======================================================================
-    def initialize(str)
-      @str = str
-      super()
-      parse()
+    def dump_all() # Multi-line dump: the inspect string, then one "attr:value" line per alist entry (sorted); every line ends with a newline.
+      ar = [inspect]
+      alist.to_a.sort.each {|a, v| ar << "#{a}:#{v}" }
+      return ar.join("\n")+"\n" # double quotes are required: '\n' in single quotes is a literal backslash followed by n
     end
-    def parse()
-      @str.each_char {|ch|
-	char = Character.new(ch)
-	if is_ids?(char)
-	  add_node(char, ids_operator_argc(char))
-	else
-	  add_leaf(char)
-	end
+    def get_attributes() # Returns every alist entry, sorted, as "attr: value" lines concatenated into one string.
+      str = ""
+      alist.to_a.sort.each {|a, v|
+	str += "#{a}: #{v}\n"
       }
+      str
     end
-    def is_ids?(obj)
-      return true if "+*".include?(obj.to_s) #ãã¹ãç¨ã§ããã­
-      return true if obj.is_ids?
-      return false
-    end
-    def ids_operator_argc(obj)
-      return obj.ids_operator_argc if 0 < obj.ids_operator_argc
-      return 2 #ãã¹ãç¨ã£ã¦ãã¨ã§
-    end
-    def check_integrity
-      r = super
-      return r if r #ä¸å®å¨ããã§ã«ããã£ã¦ãããªãreturn
-      return "contains ques" if @str =~ /\?/ #?ãå«ã¾ãã¦ãã?
-      return nil
-    end
-
-  end
-
-  class IDS #======================================================================IDSãã®ãã®ãæ±ãclass
-    def initialize(str) #IDSæå­åãããã¨ãã
-      @str = str
-    end
-    def parse
-    end
-    def parse_x #æè»åã®Parse. IDSã­ã£ã©ã¯ã¿ã¼ãåã«ãã¦ãªãã¦ãããããªã©ãªã©ã
-    end
-  end
 
-  class Counter #======================================================================
-    #ä½¿ãæ¹
-    #counter = Counter.new(50) { exit }
-    #counter.count
-    def initialize(max)
-      @max = max
-      @count = 0
-      @proc = proc
-    end
-    def count
-      @count += 1
-      if @max <= @count
-	@proc.call
+    def inspect_ids(hex_flag=false) # Returns "(...)" holding this character followed by the non-IDS-operator characters of decompose, tab-separated.
+      ids = decompose
+      ar = []
+      ar << (hex_flag ? "x"+mcs_hex : to_utf8) # hex_flag selects "x"+mcs_hex instead of the UTF-8 text
+      if to_s != ids # when the IDS is just the character itself, no parts are added
+	ids.each_char {|ch|
+	  char = ch.char
+	  next if char.is_ids? # skip IDS operator characters
+	  if hex_flag then
+	    ar << "x"+char.mcs_hex
+	  else
+	    u = char.to_utf8
+	    if u != ""
+	      ar << u
+	    else
+	      ar << char.to_er # no UTF-8 form available: fall back to the entity reference
+	    end
+	  end
+	}
       end
+      return "("+ar.join("\t")+")"
+    end
+
+    #----------------------------------------------------------------------IDS related
+    def decompose # Returns the first usable decomposition found among several attributes, or self.to_s when none applies.
+      k = self.to_s
+      #       idss = self['ids']
+      #       return idss if idss
+      #       return k if self.is_basic_kanji? # basic kanji are treated as "stop kanji"
+      return self['ids-represent'] if self['ids-represent'] # an ids-represent value, when present, is used as is
+      return self['ids-element'] if self['ids-element'] # an ids-element value, when present, is used as is
+
+      idss = self['ids-meaning'] # then ids-meaning, ids-aggregated, ids in that order: the first non-empty value that differs from k
+      return idss if idss != nil && 0 < idss.length && k != idss
+      idss = self['ids-aggregated']
+      return idss if idss != nil && 0 < idss.length && k != idss
+      idss = self['ids']
+      return idss if idss != nil && 0 < idss.length && k != idss
+      return k
+      #       return k if idss.nil? || idss.length == 0 || k == idss
+      #       if idss.char_length == 2
+      #	p ['What???', k, idss, k.inspect_all]
+      #	 #return idssx[1] # return only the second one?
+      #	 return k # when there is no way to expand into an IDS
+      #       end
+      #       return k if k == idss
+      #       if idss.include?(k) # workaround for a bug with the two characters <C5-4C4D><C6-4A37>
+      #	 #return idss.sub(k, '')
+      #	 return k # when there is no way to expand into an IDS
+      #       end
+      #       return idss
+    end
+    def decompose_all # Applies decompose repeatedly until the result stops changing, then returns that result.
+      pde = ""
+      de = self.decompose # starting point
+      level = 0
+      while true
+	pde = de
+	de = pde.decompose # try decomposing once more
+	break if pde == de # nothing changed: leave the loop
+	exit if 10 < level # NOTE(review): terminates the whole process without any message; was: p ['too many recursive', self]
+	level += 1
+      end
+      return de
     end
-  end
-
-  class DBS_Management #======================================================================ãã¡ã¤ã«ç®¡ç
-    OBSOLETE_ATTRIBUTES = "
-cns-radical
-cns-radical?
-kangxi-radical
-daikanwa-radical
-unicode-radical
-
-cns-strokes
-kangxi-strokes
-daikanwa-strokes
-shinjigen-1-radical
-gb-original-radical
-japanese-strokes
-jis-strokes-a
-jis-strokes-b
-jisx0208-strokes
-jis-x0213-strokes
-jisx0213-strokes
-unicode-strokes
-
-totalstrokes
-cns-total-strokes
-jis-total-strokes-b
-
-non-morohashi
-
-=>ucs*
-#=>mojikyo
-#=mojikyo
-->identical
-
-ancient-ideograph-of
-ancient-char-of-shinjigen-1
-original-ideograph-of
-original-char-of-shinjigen-1
-simplified-ideograph-of
-vulgar-ideograph-of
-vulgar-char-of-shinjigen-1
-ideograph=
-ideographic-variants
-variant-of-shinjigen-1
-
-iso-10646-comment
-".split
-    def initialize
-      @odir = DB_DIR+"/system-char-id/obsolete" #ç´æã¡ãã¦ããã
-    end
-    def move_obsolete_files # å»æ­¢äºå®ã®bdbãã¡ã¤ã«ãobsoleteãã£ã¬ã¯ããªã¼ã«ã¤ã£ãã
-      db = CharDB.instance
-      db.close_all
-      Dir.mkdir(@odir) unless FileTest.directory? @odir
-      OBSOLETE_ATTRIBUTES.each {|attr|
-	next if attr =~ /^#/
-	filename = db.get_filename(attr)
-	move_to_obsolete(filename)
-	move_to_obsolete(filename+".txt")
-      }
-    end
-    def move_to_obsolete(file)
-      cmd = "mv #{file} #{@odir}"
-#      p cmd
-      system cmd
-    end
-  end
-
-  class JoyoList #======================================================================
-    include Singleton
-    #JP_JOYO_FILE = DB_DIR+"/../jp-joyo.txt" #EUC-jisx0213
-    JP_JOYO_FILE = DB_DIR+"/../joyo-ucs.txt" #UCS
-    COMPOSIT_KANJI = "é³´åå åå¤ç¥åéèååè¦ååç²è²§ææ£®æ ¡æ±æä½ä½å¥½å²©ç éç·çç¿ä¼ç­ç©ºåå³¶åç¾å­èµ¤çåååªåè§£æ°æ­èªè©±å¼µå¼·å¿æ²ç­æ´ç¾æ­£å­å®å®ç°ç§ç§å°å½å»åååèå±å³å·¦åååéè¿è¿·è±èéæºä¸»å¤ªæ°·å·ç¹åºåº«ä»å¸³å¹¼é²å¼éæ©ç´ç­ç­éçªååæ¯æ­»å¤å¾é²éç¦ç§å®¶ä¸åè°·åååå¯ºæé»é²æ°å¸æè¡æ³£"
-#    COMPOSIT_KANJI = "é³´åå åå¤"
-    def initialize
-      @nchars = []
-      read_file
-    end
-    attr_reader :nchars
-    def read_file
-      open(JP_JOYO_FILE) {|f|
-	while line = f.gets
-	  next if line =~ /^;/ #ã³ã¡ã³ãã¯ã¨ã°ã
-	  line.chomp!
-	  #stroke, nchar, ochar = line.split #new char, old char, old charã¯nilãå¤ã
-	  stroke, nchar = line.split
-	  @nchars << nchar
-	end
-      }
-    end
-    def dump_ids(ar)
-      ar.each {|ch|
-	char = ch.char
-	print char.inspect_ids(true), "\t;", char.inspect_ids(false), "\n"
-      }
+    def decompose_all_nu(level=nil) # Recursive variant of decompose_all; prints a message and exits once level exceeds 10.
+      level = 0 if level.nil?
+      if 10 < level
+	p ['too many recursive', self] 
+	exit
+      end
+      de = self.decompose
+      return de.decompose_all(level+1) if de != self # recurse if anything changed. NOTE(review): calls decompose_all, not decompose_all_nu, with one argument -- confirm the receiver accepts it
+      return de # no further change is expected
+    end
+    def is_ids?() !@char_id.nil? && 0x2ff0 <= @char_id && @char_id <= 0x2fff end # true when @char_id lies in 0x2ff0..0x2fff; false (instead of NoMethodError) when @char_id is nil
+    def ids_operator_argc() # Operand count of this character as an IDS operator: 0 when is_ids? is false, 3 for 0x2ff2 and 0x2ff3, otherwise 2.
+      return 0 unless is_ids?
+      return 3 if @char_id == 0x2ff2 || @char_id == 0x2ff3
+      return 2
     end
   end