From 1fcb1467ee6ef47f5948268ebdfd0a57037d9f4c Mon Sep 17 00:00:00 2001
From: eto <eto>
Date: Mon, 10 Nov 2003 08:10:12 +0000
Subject: [PATCH] change directory

---
 doc/index.html |    4 +-
 src/chise.rb   |  627 +-------------------------------------------------------
 t/tc_ids.rb    |   92 +++++++++
 3 files changed, 103 insertions(+), 620 deletions(-)
diff --git a/doc/index.html b/doc/index.html
index 0f19b59..ddf1d66 100755
--- a/doc/index.html
+++ b/doc/index.html
@@ -46,13 +46,13 @@ Rubyã¸ç§»æ¤ãããã¨ãè©¦ã¿ãã¢ã¸ã¥ã¼ã«ã§ããã<br>
 <li>2003-0312	<a href="http://eto.com/2003/ruby/ruby-chise-20030312.tar.bz2" class="s">ruby-chise-20030312.tar.bz2</a><br>
 æ§ããªã©ã¤ãã©ãªãè¿½å ã
 <li>2003-1004	<a href="http://eto.com/2003/ruby/ruby-chise-20031004.tar.bz2" class="s">ruby-chise-20031004.tar.bz2</a><br>
-æ°ããç´ æ§åã«å¯¾å¿ãããCopyright noticeããã¡ãã¨ãããã
+æ°ããç´ æ§åã«å¯¾å¿ãããCopyright noticeããããã
 </ul>
 <hr>
 <h3>â <a href="http://cvs.m17n.org/cgi-bin/viewcvs/ruby/?cvsroot=chise">CVS access</a></h3>
 <hr>
 <h3>â ã©ã¤ã»ã³ã¹</h3>
-GPLã§ããä»å±ã®COPYINGããããä¸ããã
+<p>GPLã§ããCOPYINGãããããã ããã</p>
 <p>
 </div>
 
diff --git a/src/chise.rb b/src/chise.rb
index f2ef8da..28b0b98 100755
--- a/src/chise.rb
+++ b/src/chise.rb
@@ -1,619 +1,10 @@
 #!/usr/bin/env ruby
-#
-# Ruby/CHISE module by eto 2002-1114
-# Copyright (C) 2002-2003 Kouichirou Eto
-#     All rights reserved.
-#     This is free software with ABSOLUTELY NO WARRANTY.
-#
-# You can redistribute it and/or modify it under the terms of 
-# the GNU General Public License version 2.
-#
-
-require 'bdb'
-require 'uconv'
-require 'singleton'
-require 'rbchise'
-require 'db'
-require 'ids'
-
-$KCODE = 'u' #ä»ã®ã¨ããããä»¥å¤ã§ã¯åããªããString.splitãå½±é¿å¤§ãinspectãå½±é¿ã
-$debug = false #ããã¯ãã¹ãç¨
-$debug = true #ããã¯ãã¹ãç¨
-$stdout.binmode if $debug
-$stdout.sync = true if $debug
-
-class String #======================================================================
-  def to_a() self.split(//) end #$KCODEãè¨­å®ããã¦ããã®ã§ãUTF-8çãªä¸æå­ã¥ã¤ãchã«ã¯ãã
-  def each_char() to_a.each {|ch| yield ch } end
-  def each_character() to_a.each {|ch| yield ch.char } end
-  def char_length() to_a.length end
-  def char_at(n) to_a()[n] end
-  def char() Character.get(to_a[0]) end
-  #alias to_c char #æ©ã¿ä¸­
-  #def char_id() char.char_id() end #ãªãã¨ãªãå»æ­¢
-  #def get_char_attribute(a) char.get_char_attribute(a) end #ãªãã¨ãªãå»æ­¢
-  #def ucs() char.ucs() end
-  def to_utf8()
-    return to_a.map {|ch|
-      ch.char.to_utf8
-    }.join('')
-  end
-
-  def map_char(block = Proc.new)
-    return unless block_given?
-    return self.to_a.map {|ch| (block.call(ch)).to_s }.join("")
-  end
-  def map_char!(block = Proc.new)
-    return unless block_given?
-    self.replace(self.map_char {|ch| block.call(ch)})
-  end
-  def map_character(block = Proc.new)
-    return unless block_given?
-    return self.to_a.map {|ch| (block.call(ch.char)).to_s }.join("")
-  end
-  def map_character!(block = Proc.new)
-    return unless block_given?
-    self.replace(self.map_char {|ch| block.call(ch.char)})
-  end
-
-  def method_missing(mid, *args)
-    if char_length == 1 #çç¥å½¢ãæå¹ãªã®ã¯ãä¸æå­ã®æã ã
-      char.method_missing(mid, *args)
-    else
-      raise NameError, "undefined method `#{mid.id2name}'", caller(1)
-    end
-  end
-
-  def map_utf8() map_char {|ch| ch.char.map_utf8 } end
-  alias map_ucs map_utf8
-  def map_ucs_er() map_char {|ch| ch.char.map_ucs_er } end
-  def to_er() map_char {|ch| ch.char.to_er } end
-
-  #puté¢ä¿ã[]é¢ä¿ã¯ç¨æããªããã¨ã«ããã
-  def de_er!() #EntityReferenceãåãé¤ã
-    return self unless self =~ Regexp.new(EntityReference::REGEXP_PART) #ãããããã®ãç¡ããã°ä½ãããªã
-    er = "&"+$1+";"      
-    self.sub!(Regexp.new(Regexp.escape(er)), Character.new(er).mcs_utf8) #å¤æèªä½ã¯Characterã«ã¾ããã
-    return self.de_er! if self =~ Regexp.new(EntityReference::REGEXP_PART) #ã¾ã ãã£ããåå¸°
-    return self
-  end
-  def de_er() return self.dup.de_er!; end
-
-  def inspect_all() map_char {|ch| ch.char.inspect_all } end
-  def inspect_x()   map_char {|ch| ch.char.inspect_x   } end
-
-  def to_euc()   map_char {|ch| ch.char.to_euc   } end
-  def map_euc()  map_char {|ch| ch.char.map_euc  } end
-  def to_sjis()  map_char {|ch| ch.char.to_sjis  } end
-  def map_sjis() map_char {|ch| ch.char.map_sjis } end
-
-  def decompose() map_char {|ch| ch.char.decompose } end
-  def decompose!() self.replace(self.decompose); self; end
-  def decompose_all_nu(level=nil)
-    level = 0 if level.nil?
-    if 10 < level
-      p ['too many recursive', self] 
-      exit
-    end
-    de = self.decompose
-    return de.decompose_all(level+1) if de != self #ãªã«ãå¤åããã£ãããåå¸°
-    de #ããããä»¥ä¸å¤åã¯ç¡ãããã ãã¨ã
-  end
-  def decompose_all() map_char {|ch| ch.char.decompose_all } end
-  def decompose_all!() self.replace(self.decompose_all); self; end
-
-  def find() #"æ¥é²"â"æ"ã¨ãããæãã®æä½
-    ar = []
-    length = char_length()
-    each_char {|ch|
-      char = ch.char
-      ar << char.ids_contained #ãã®æå­ãå«ãã§ããæ¼¢å­ã®ãªã¹ã
-    }
-    h = Hash.new(0)
-    ar.each {|list|
-      next if list.nil?
-      list.each_char {|ch|
-	h[ch] += 1
-      }
-    }
-    str = ""
-    h.each {|k, v|
-      #      p [k, v]
-      if length == v #å¨é¨ã«é¡ãåºãã¦ããã
-	str += k
-      end
-    }
-    #    p str
-    str
-  end
-  def compose()
-    db = CodesysDB.instance
-    composed = db.get('ids', self)
-    return "" if composed.nil? #ãªãã£ããã¨ã
-    return "" if composed.char_length == 0 #ãªã«ãã¨?
-    return composed if composed.char_length == 1
-    composed.each_char {|ch|
-      char = ch.char
-      return ch if char.has_attribute? #ã¨ããããæåã«ã¿ã¤ãã£ããã®ãè¿ãã¨ãããã«ãä»æ§
-    }
-    return "" #attributeãæã¤ãã®ãä¸ã¤ãç¡ãã£ããã""ã«ãã
-  end
-  def aggregate()
-    #selfã§ããæå­åãIDSã ã¨ä»®å®ãããããå®å¨ã«composeããããªãã§ã
-    #ãã®é¨åéåã ããã¨ãã ãã¦ãcomposeå¯è½ã§ããã°ã§ããã ãcomposeããã
-    tree = IDS_Tree.new(self)
-    return self if tree.depth <= 1 #sub_nodesãç¡ãå ´åã¯ããã§ãããªã
-    tree.sub_nodes.each {|node|
-      c = node.compose
-      next if c.nil? || c == ""
-      #      print "#{self}	#{node}	#{c}\n"
-      #      p [self, node, c]
-      n = self.gsub(node, c)
-      return n.aggregate
-    }
-    return self #ããããããããã®ãã¾ã£ãããªãã£ãããèªåããããã
-  end
-end
-
-module CHISE #======================================================================
-  def windows?()
-    (RUBY_PLATFORM =~ /cygwin/ || RUBY_PLATFORM =~ /mswin32/ || RUBY_PLATFORM =~ /mingw32/)
-  end
-  module_function :windows?
-  if windows?()
-    DB_DIR = 'd:/work/chise/char-db' #ãã®å¾ã«/sysmtem-char-id/ucsã¨ããæãã«ç¶ã
-    IDS_DB_DIR = 'd:/work/chise/ids/' #ãã®å¾ã«IDS-JIS-X0208-1990.txtã¨ããæãã«ç¶ã
-  else
-    DB_DIR = '/usr/local/lib/xemacs-21.4.12/i686-pc-linux/char-db' #ãã®å¾ã«/sysmtem-char-id/ucsã¨ããæãã«ç¶ã
-    IDS_DB_DIR = '/home/eto/work/chise/ids/' #ãã®å¾ã«IDS-JIS-X0208-1990.txtã¨ããæãã«ç¶ã
-  end
-
-  class EntityReference #======================================================================
-    #ç¶æ³ã«ãã£ã¦ã©ã®ERã«å¤æããããç°ãªãå¯è½æ§ãããã®ã§ãæ®éã®classã¨ãã¦å®è£ããã»ãããã?
-#    CODESYS_TABLE = [
-#      %w( chinese-big5-cdp	CDP- 4 X),
-#      %w( ideograph-daikanwa	M-   5 d),
-#      %w( ideograph-cbeta	CB   5 d),
-#      %w( ideograph-gt		GT-  5 d),
-#      %w( ideograph-gt-k	GT-K 5 d),
-#      %w( japanese-jisx0208-1990 J90- 4 X),
-#      %w( japanese-jisx0208	J83- 4 X),
-#      %w( japanese-jisx0213-1	JX1- 4 X),
-#      %w( japanese-jisx0213-2	JX2- 4 X),
-#      %w( japanese-jisx0212	JSP- 4 X),
-#      %w( japanese-jisx0208-1978 J78- 4 X),
-#      %w( chinese-cns11643-1	C1-  4 X),
-#      %w( chinese-cns11643-2	C2-  4 X),
-#      %w( chinese-cns11643-3	C3-  4 X),
-#      %w( chinese-cns11643-4	C4-  4 X),
-#      %w( chinese-cns11643-5	C5-  4 X),
-#      %w( chinese-cns11643-6	C6-  4 X),
-#      %w( chinese-cns11643-7	C7-  4 X),
-#      %w( korean-ksc5601	K0- 4 X),
-#    ]
-#    CODESYS_ORDER = %w(japanese chinese korean ideograph)
-    CODESYS_TABLE = [
-      %w( =jis-x0208-1990	J90- 4 X),
-      %w( =jis-x0208-1983	J83- 4 X),
-      %w( =jis-x0208-1978	J78- 4 X),
-      %w( =jis-x0208		J90- 4 X), #ç¶æ¿ã®ã¢ãããã¯ãªå®è£
-      %w( =jis-x0208		J83- 4 X), #ç¶æ¿ã®ã¢ãããã¯ãªå®è£
-      %w( =jis-x0208		J78- 4 X), #ç¶æ¿ã®ã¢ãããã¯ãªå®è£
-      %w( =jis-x0213-1-2000	JX1- 4 X),
-      %w( =jis-x0213-2-2000	JX2- 4 X),
-      %w( =jis-x0212		JSP- 4 X),
-      %w( =big5-cdp		CDP- 4 X),
-      %w( =cns11643-1		C1-  4 X),
-      %w( =cns11643-2		C2-  4 X),
-      %w( =cns11643-3		C3-  4 X),
-      %w( =cns11643-4		C4-  4 X),
-      %w( =cns11643-5		C5-  4 X),
-      %w( =cns11643-6		C6-  4 X),
-      %w( =cns11643-7		C7-  4 X),
-      %w( =ks-x1001		K0-  4 X),
-      %w( =daikanwa		M-   5 d),
-      %w( =cbeta		CB   5 d),
-      %w( =gt			GT-  5 d),
-      %w( =gt-k			GT-K 5 d),
-    ]
-    REGEXP_PART = "&([-+0-9A-Za-z#]+);"
-    REGEXP_ALL = "^#{REGEXP_PART}$"
-
-    def self.match?(er) (er =~ Regexp.new(REGEXP_PART)) != nil end
-
-    def self.parse(er) #char_idãFIXNUMã§è¿ã
-      return "" unless er =~ Regexp.new(REGEXP_ALL) #ãªãããééã£ã¦ã?
-      er = $1 #ã¤ãã§ã«ä¸­èº«ã®é¨åãåãåºã
-      return $1.hex if er =~ /^MCS-([0-9A-Fa-f]+)/ #MCS
-      #      if er =~ /^U[-+]?([0-9A-Fa-f]+)/ #Unicodeç´æã¡
-      if er =~ /^U[-+]?([0-9A-Fa-f]+)/ || er =~ /^#x([0-9A-Fa-f]+)/ #Unicodeç´æã¡
-	return $1.hex 
-      end
-
-      er.sub!(/^I-/, '') if er =~ /^I-/ #I-ãã¤ãã¦ãã¨ã©ãéãã®ãã¯ããããããªã
-      each_codesys {|codesys, er_prefix, keta, numtype|	#p [codesys, er_prefix, keta, numtype]
-	numtyperegex = '\d' #if numtype == 'd'
-	numtyperegex = '[0-9A-Fa-f]' if numtype == 'X'
-	regexpstr = "^#{er_prefix}(#{numtyperegex}{#{keta},#{keta}})$"
-	if er =~ Regexp.new(regexpstr)
-	  codestr = $1
-	  code = codestr.to_i #if numtype == 'd'
-	  code = codestr.hex if numtype == 'X'
-	  char_id_u8 = EntityReference.get_database(codesys, code)
-	  char_id_num = Character.parse_char_id(char_id_u8)
-	  next if char_id_num == nil
-	  return char_id_num
-	end
-      }
-      return ""
-    end
-
-    def self.each_codesys()
-#      CODESYS_ORDER.each {|lang|
-#	CODESYS_TABLE.each {|codesys, er_prefix, keta, numtype| #æ®éããããæ¸ãæ¹ã¯ããªããã«ã¼ãä¸åã«ããã
-#	  next unless codesys =~ lang
-#	  yield(codesys, er_prefix, keta, numtype)
-#	}
-#      }
-      CODESYS_TABLE.each {|codesys, er_prefix, keta, numtype|
-	yield(codesys, er_prefix, keta, numtype)
-      }
-    end
-    def self.get_database(codesys, code)
-      c = CodesysDB.instance.get(codesys, code)
-      return c if c != nil
-#      if codesys =~ /-jisx0208/
-#	#return self.get_database("=jis-x0208", code) #åå¸°ã§ã©ãã ?
-#	c = CodesysDB.instance.get("=jis-x0208", code)
-#	return c
-#      end
-      return nil
-    end
-  end
-
-  class CharacterFactory #============================================æå­ãªãã¸ã§ã¯ãã®çæãcache
-    include Singleton
-    MAX = 10000
-    def initialize
-      @max = MAX
-      reset()
-    end
-    def get(char_id)
-      check_max()
-      n = Character.parse_char_id(char_id)
-      c = @chars[n]
-      @chars[n] = Character.new(n) if @chars[n] == nil
-      return @chars[n]
-    end
-    def reset()
-      @chars = nil
-      @chars = Hash.new
-      GC.start #ã¬ã¼ãã¼ã¸ã³ã¬ã¯ã·ã§ã³
-    end
-    def length() @chars.length; end
-    def check_max()
-      reset if @max < @chars.length #MAXãè¶ãããresetãã¦ãã¾ããä¹±æ´ãããcacheãªã®ã§ããã§ããã®ã ã
-    end
-  end
-
-  class Character #=============================================================== æå­ãªãã¸ã§ã¯ã
-    def initialize(char_id=nil)
-      @char_id = Character.parse_char_id(char_id)
-      @attributes = Hash.new
-      @check_all_database = false
-    end
-    attr_reader :char_id
-    def to_i() @char_id end
-    def mcs_utf8() Character.u4itou8(@char_id) end
-    def mcs_hex() sprintf("%x", @char_id) end
-
-    #----------------------------------------------------------------------
-    def self.get(char_id) CharacterFactory.instance.get(char_id) end #flyweightãã¿ã¼ã³
-
-    #----------------------------------------------------------------------
-    def normalize_attribute_name(b)
-      a = b.dup
-      a.gsub!(/_/, '-') #underlineã¯-ã«ç½®æ
-      a.sub!(/-at-/,  '@')
-      a.sub!(/^map-/,  '=>')
-      a.sub!(/^to-/,   '->')
-      a.sub!(/^from-/, '<-')
-      a
-    end
-    def get_char_attribute(b) # XEmacs UTF-2000äºæAPIç¾¤
-      a = normalize_attribute_name(b)
-      #p [a, b]
-      atr = @attributes[a]
-      return atr if atr
-      atr = check_database(a)
-      if atr
-	@attributes[a] = atr
-	return atr
-      end
-      return get_char_attribute("="+a) unless a =~ /^=/ #é ­ã«=ãã¤ãã¦ãªãå ´åã¯ãããçç¥ããã¦ãããã¨ãä»®å®ãã¦ãåå¸°ãã
-      nil
-    end
-    def put_char_attribute(b,v)
-      a = normalize_attribute_name(b)
-      @attributes[a] = v;
-      CharDB.instance.put(a, mcs_utf8(), v)
-    end
-    def char_attribute_alist() check_all_database(); @attributes; end
-    def char_attribute_list()  check_all_database(); @attributes.keys; end
-    alias [] get_char_attribute  #ãã®ç¥ç§°
-    alias []= put_char_attribute
-    alias alist char_attribute_alist
-    alias list  char_attribute_list
-
-    def method_missing(mid, *args) #åè:ostruct.rb
-      mname = mid.id2name
-      return get_char_attribute(mname) if args.length == 0
-      put_char_attribute(mname.chop, args[0]) if mname =~ /=$/ #ä»£å¥
-    end
-
-    def has_attribute?() #æå³ã®ããattributeãæã£ã¦ã¾ãã?
-      keys = list
-      keys.delete_if {|k|
-	k =~ /ids/
-      }
-      return (keys.length != 0)
-    end
-
-    #----------------------------------------------------------------------
-    def ==(ch)
-      return false if ch == nil
-      return false unless ch.is_a? Character
-      self.char_id == ch.char_id
-    end
-
-    #----------------------------------------------------------------------
-    def self.parse_char_id(char_id) #FIXNUMãè¿ã
-      return nil if char_id == nil
-      if char_id.is_a?(Numeric)	#p [char_id]
-	char_id = 0x80000000 + char_id if char_id < 0  #è£æ°è¡¨ç¾
-	return char_id.to_i
-      elsif char_id.is_a?(String)
-	return char_id.to_i if char_id =~ /^\d+$/ && 1 < char_id.length #æå­åã«ããæ°å­ã ã£ããæ°å¤åãã¦return
-	return EntityReference.parse(char_id) if char_id =~ Regexp.new(EntityReference::REGEXP_ALL) #å®ä½åç§?
-	char_id.sub!(/^\?/, '') if char_id =~ /^\?/ #ããåé ­ã«?ãã¤ãã¦ãããåé¤
-	#ãã®ã¸ãæ¬å½ã¯ãã£ã¨ã¡ããã¨ãã§ãã¯ããã¹ã
-	begin
-	  u4 = Uconv.u8tou4(char_id) #UCS-4æå­åã«å¤æ
-	rescue
-	  p $!
-	  p char_id
-	  return 0
-	end
-	return Character.u4tou4i(u4) #UCS-4æ°å¤ã«ãã¦return
-      else
-	raise ArgumentError, "unknown object for char_id", caller(1)
-      end
-    end
-    def self.u4tou4i(u4)
-      return 0 if u4 == nil || u4 == ""
-      return (u4[3] << 24 | u4[2] << 16 | u4[1] << 8 | u4[0]) #UCS-4æ°å¤ã«ãã¦return
-    end
-    def self.u4itou4(num)
-      return "" unless num.is_a?(Integer)
-      return sprintf("%c%c%c%c", num&0xff, (num >> 8)&0xff, (num >> 16)&0xff, (num >> 24)&0xff) #UCS-4æ°å¤ãæå­åã«ãã¦return
-    end
-    def self.u4itou8(char_id) #ucsã®æ°å¤ãåãã¨ããUTF-8ã®æå­ä¸æå­ãè¿ã
-      begin
-	u4 = Character.u4itou4(char_id)
-	u8 = Uconv.u4tou8(u4)
-	return u8
-      rescue
-	#raise ArgumentError, "invalid char_id (#{char_id})", caller(1)
-	#print "error\n"
-	return ""
-      end
-    end
-
-    #----------------------------------------------------------------------
-    def check_database(a)
-      db = CharDB.instance
-      u8 = mcs_utf8()
-      v = db.get(a, u8) #u8ã§è¡¨ãããæå­ã®aã¢ããªãã¥ã¼ããèª¿ã¹ãã
-      return v
-    end
-    def check_all_database() #ç¾å¨ã®@char_idãããæå­ãã¼ã¿ãã¼ã¹ãåç§ãã
-      return if @check_all_database
-      return if @char_id == nil
-      db = CharDB.instance
-      u8 = mcs_utf8()
-      atrs = db.get_all(u8) #u8ã§è¡¨ãããæå­ã®ã¢ããªãã¥ã¼ããå¨é¨æã£ã¦ãã
-      atrs.each {|a,v|
-	@attributes[a] = v #ã¨ãããæãã§ä»£å¥ããã®ã§ããããª?
-      }
-      @check_all_database = true #éãå¦çãªã®ã§ä¸å¿checkãã
-    end
-
-    #----------------------------------------------------------------------
-    def ucs()      #p 'ucs'
-      #ar = %w{ucs ucs-big5 ucs-cdp ucs-cns ucs-jis ucs-ks =>ucs =>ucs* =>ucs-jis}
-      #ar = %w{ucs ucs-jis ucs-big5 ucs-cdp ucs-cns ucs-ks =>ucs =>ucs* =>ucs-jis}
-      ar = %w{ucs-jis ucs =>ucs-jis}
-      #ä¸¦ã³é ã¯æ£æçã§ãucs-jisãåã«åºãã¦ãããæ¬æ¥ã¯ãããæå®ã§ããããã«ããã¹ãã
-      ar.each {|a|	#p [a]
-	u = get_char_attribute(a)
-	return u if u != nil
-      }
-      return nil
-    end
-
-    #----------------------------------------------------------------------CCSé¢ä¿
-    def to_utf8() Uconv.u4tou8(Character.u4itou4(ucs())) end #UTF8æå­åãè¿ã
-    #alias to_s to_utf8
-    alias to_s mcs_utf8
-    def map_utf8()
-      u = ucs()
-      if u.nil? || 0xffff < u
-	return to_er()
-      else
-	return to_utf8()
-      end
-    end
-    alias map_ucs map_utf8
-    def map_ucs_er()
-      u = ucs()
-      if u.nil? || 0xffff < u
-	return to_er()
-      else
-	return Character.get(u).to_er()
-      end
-    end
-    def to_euc()
-      u = ucs()
-      return "" if u.nil? || 0xffff < u
-      Uconv.u16toeuc(Uconv.u4tou16(Character.u4itou4(ucs())))
-    end
-    def map_euc()
-      e = to_euc()
-      return e if e != ""
-      return to_er()
-    end
-    def to_sjis()
-      u = ucs()
-      return "" if u.nil? || 0xffff < u
-      Uconv.u16tosjis(Uconv.u4tou16(Character.u4itou4(ucs())))
-    end
-    def map_sjis()
-      e = to_sjis()
-      return e if e != ""
-      return to_er()
-    end
-
-    #----------------------------------------------------------------------
-    def to_er(codesys=nil) #å®ä½åç§ãè¿ããå¸æããcodesysãå¼æ°(æªå®è£)
-      return "" if @char_id == nil
-      return sprintf("&#x%04x;", @char_id) if @char_id <= 0xffff
-      return sprintf("&#x%05x;", @char_id) if @char_id <= 0xfffff
-      EntityReference.each_codesys {|codesys, er_prefix, keta, numtype|
-	code = self[codesys]
-	next if code == nil
-	return sprintf("&#{er_prefix}%0#{keta}#{numtype};", code)
-      }
-      return sprintf("&MCS-%08X;", @char_id) #æ¬å½ã¯ããã¯ç¡ãã«ããã
-    end
-    def to_er_list()
-      ar = []
-      EntityReference.each_codesys {|codesys, er_prefix, keta, numtype|
-	er = to_er(codesys)
-	ar << er if er != nil
-      }
-      ar
-    end
-
-    def inspect_x()
-      return "<>" if @char_id == nil
-      ar = [to_utf8(), to_er().sub(/^&/,'').chop]
-      "<"+ar.join(',')+">"
-    end
-    alias inspect inspect_x
-    def inspect_all_codesys() #æªå®æ
-      #to_erãå¨ã¦ã®codesysã«ããã¦å®è¡ããããã®çµæãã³ã³ãã¯ãã«ã¾ã¨ãã
-    end
-    def inspect_all()
-      ar = [inspect.chop]
-      alist.to_a.sort.each {|a, v| ar << "#{a}:#{v}" }
-      return ar.join(',')+">"
-    end
-    def dump_all()
-      ar = [inspect]
-      alist.to_a.sort.each {|a, v| ar << "#{a}:#{v}" }
-      return ar.join('\n')+'\n'
-    end
-    def get_attributes()
-      str = ""
-      alist.to_a.sort.each {|a, v|
-	str += "#{a}: #{v}\n"
-      }
-      str
-    end
-
-    def inspect_ids(hex_flag=false)
-      ids = decompose
-      ar = []
-      ar << (hex_flag ? "x"+mcs_hex : to_utf8)
-      if to_s != ids #idsãé¨åãã®ãã®ã ã£ããé¨åè¿½å ã¯ããªã
-	ids.each_char {|ch|
-	  char = ch.char
-	  next if char.is_ids?
-	  if hex_flag then
-	    ar << "x"+char.mcs_hex
-	  else
-	    u = char.to_utf8
-	    if u != ""
-	      ar << u
-	    else
-	      ar << char.to_er
-	    end
-	  end
-	}
-      end
-      return "("+ar.join("\t")+")"
-    end
-
-    #----------------------------------------------------------------------IDSé¢ä¿
-    def decompose
-      k = self.to_s
-      #       idss = self['ids']
-      #       return idss if idss
-      #       return k if self.is_basic_kanji? #åºæ¬æ¼¢å­ã¯stop kanjiã¨ãããã¨ã
-      return self['ids-represent'] if self['ids-represent'] #ids_representãæã£ã¦ããå ´åã¯ãã®å¤ã¨ããã
-      return self['ids-element'] if self['ids-element'] #ids_elementãæã£ã¦ããå ´åã¯ãã®å¤ã¨ããã
-
-      idss = self['ids-meaning']
-      return idss if idss != nil && 0 < idss.length && k != idss
-      idss = self['ids-aggregated']
-      return idss if idss != nil && 0 < idss.length && k != idss
-      idss = self['ids']
-      return idss if idss != nil && 0 < idss.length && k != idss
-      return k
-      #       return k if idss.nil? || idss.length == 0 || k == idss
-      #       if idss.char_length == 2
-      #	p ['What???', k, idss, k.inspect_all]
-      #	 #return idssx[1] #äºåç®ã ãè¿ãã¨ã?
-      #	 return k #IDSã«å±éããæ¹æ³ãç¡ãã¨ã
-      #       end
-      #       return k if k == idss
-      #       if idss.include?(k) #<C5-4C4D><C6-4A37>ãã®äºæå­ã®BUGå¯¾ç­
-      #	 #return idss.sub(k, '')
-      #	 return k #IDSã«å±éããæ¹æ³ãç¡ãã¨ã
-      #       end
-      #       return idss
-    end
-    def decompose_all
-      pde = ""
-      de = self.decompose #åºçºç¹
-      level = 0
-      while true
-	pde = de
-	de = pde.decompose #ããä¸åº¦åè§£ããã¦ã¿ãã
-	break if pde == de #ã«ã¼ããæãã ã
-	exit if 10 < level #p ['too many recursive', self] 
-	level += 1
-      end
-      return de
-    end
-    def decompose_all_nu(level=nil)
-      level = 0 if level.nil?
-      if 10 < level
-	p ['too many recursive', self] 
-	exit
-      end
-      de = self.decompose
-      return de.decompose_all(level+1) if de != self #ãªã«ãå¤åããã£ãããåå¸°
-      return de #ããããä»¥ä¸å¤åã¯ç¡ãããã ãã¨ã
-    end
-    def is_ids?() 0x2ff0 <= @char_id && @char_id <= 0x2fff end
-    def ids_operator_argc()
-      return 0 unless is_ids?
-      return 3 if @char_id == 0x2ff2 || @char_id == 0x2ff3
-      return 2
-    end
-  end
-
-end
-
-#----------------------------------------------------------------------çµäº
+# $Id: chise.rb,v 1.18 2003-11-10 08:10:12 eto Exp $
+# Copyright (C) 2002-2003 Kouichirou Eto, All rights reserved.
+# This is free software with ABSOLUTELY NO WARRANTY.
+# You can redistribute it and/or modify it under the terms of the GNU GPL2.
+
+require 'chise/char'    # NOTE(review): presumably holds the String/Character code that used to live in this file -- confirm
+require 'chise/rbchise' # replaces the former top-level require 'rbchise'
+require 'chise/db'      # replaces the former top-level require 'db'
+require 'chise/ids'     # replaces the former top-level require 'ids'
diff --git a/t/tc_ids.rb b/t/tc_ids.rb
index 288e513..884472d 100755
--- a/t/tc_ids.rb
+++ b/t/tc_ids.rb
@@ -171,6 +171,98 @@ class TC_IDS < Test::Unit::TestCase
     assert_equal("â¿°æ¨æ¨", "â¿°æ¨æ¨".compose.decompose)
     assert_equal("æ".ucs, "â¿°æ¨æ¨".compose.ucs)
   end
+  def test_idc_shortcut
+    assert_equal(IDC_LR, "æ".decompose.first_char)
+    assert_equal(IDC_LR+"æ¨æ¨", "æ".decompose)
+
+    assert_equal(IDC_AB, "æ£®".decompose.first_char)
+    assert_equal(IDC_AB+"æ¨æ", "æ£®".decompose)
+    assert_equal(IDC_AB+"ç«ç«", "ç".decompose)
+
+    assert_equal(IDC_LMR, "ç­".decompose.first_char)
+    assert_equal(IDC_LMR+"å½³"+IDC_AB+"å±±ç"+"æµ", "å¾´".decompose) #meaning?
+
+    assert_equal(IDC_AMB, "é¼»".decompose.first_char)
+    assert_equal(IDC_AMB+"èªç°å»¾", "é¼»".decompose)
+    assert_equal(IDC_AMB+"å£«åå", "å£±".decompose)
+    assert_equal(IDC_AMB+"ç©´å¶å¿", "çª".decompose)
+    assert_equal(IDC_AMB+"ä¸åå·¾", "å¸¯".decompose)
+
+    assert_equal(IDC_FS, "å²".decompose.first_char)
+    assert_equal(IDC_FS+"åäº", "å²".decompose)
+    assert_equal(IDC_FS+"è¡é", "è¡".decompose)
+    assert_equal(IDC_FS+"è¡å­", "è¡".decompose)
+    assert_equal(IDC_FS+"è¡é", "è¡".decompose)
+    assert_equal(IDC_FS+IDC_AB+"ä¸åµç°", "ç»".decompose)
+
+    assert_equal(IDC_FA, "å".decompose.first_char)
+    assert_equal(IDC_FA+"éå£", "å".decompose)
+    assert_equal(IDC_FA+"é"+IDC_LR+"è±å¯¸", "é".decompose)
+    assert_equal(IDC_FA+"æå¥³", "å¨".decompose)
+    assert_equal(IDC_FA+"èè£", "èµ".decompose)
+    assert_equal(IDC_FA+"å°ºæ¦", "æ¼".decompose)
+    assert_equal(IDC_FA+"åå¥", "å".decompose)
+    assert_equal(IDC_FA+"å ä¸¶", "å¡".decompose)
+    assert_equal(IDC_FA+"å "+IDC_AB+"ä¸¿è«", "é¢¨".decompose)
+
+    assert_equal(IDC_FB, "å¶".decompose.first_char)
+    assert_equal(IDC_AB+"æ­¢"+IDC_FB+"åµç±³", "æ­¯".decompose)
+
+    assert_equal(IDC_FL, "å ".decompose.first_char)
+    assert_equal(IDC_FL+"åæ¤", "å ".decompose)
+    assert_equal(IDC_FL+"åç¢", "å»".decompose)
+    assert_equal(IDC_FL+"åè¥", "å¿".decompose)
+    assert_equal(IDC_FL+"åå¿", "å¹".decompose)
+
+    assert_equal(IDC_FUL, "åº".decompose.first_char)
+    assert_equal(IDC_FUL+"å¹¿ä¸", "åº".decompose)
+    assert_equal(IDC_FUL+"æ­¹å", "æ­»".decompose)
+    assert_equal(IDC_FUL+"å°¹å£", "å".decompose)
+    assert_equal(IDC_FUL+"éº»é¬¼", "é­".decompose)
+    assert_equal(IDC_FUL+"åºè", "è".decompose)
+    assert_equal(IDC_FUL+"éº»æ", "æ©".decompose)
+    assert_equal(IDC_FUL+"èæ", "æ®".decompose)
+    assert_equal(IDC_FUL+"é£å£", "å".decompose)
+    assert_equal(IDC_AB+"æ¥"+IDC_FUL+"è³å", "æ".decompose)
+    assert_equal(IDC_FUL+"æç®", "ç".decompose) #meaning
+    assert_equal(IDC_FUL+"è¾°å£", "å".decompose) #?
+
+    assert_equal(IDC_FUR, "å¥".decompose.first_char)
+    assert_equal(IDC_FUR+"å¹å£", "å¥".decompose)
+    assert_equal(IDC_FUR+"å¹ä¸¶", "åº".decompose)
+    assert_equal(IDC_FUR+"å¹æ¥", "æ¬".decompose)
+    assert_equal(IDC_FUR+"æå»¾", "æ".decompose)
+    assert_equal(IDC_FUR+"å¼å·¥", "å¼".decompose)
+    assert_equal(IDC_FUR+"åä¸¿", "å".decompose)
+    assert_equal(IDC_FUR+"é³¥å±±", "å³¶".decompose) #meaning
+
+    assert_equal(IDC_FLL, "é".decompose.first_char)
+    assert_equal(IDC_FLL+"å»´è¿", "å»º".decompose)
+    assert_equal(IDC_FLL+"èµ°æ", "è¶".decompose)
+    assert_equal(IDC_FLL+"èµ°å·³", "èµ·".decompose)
+    assert_equal(IDC_FLL+"èµ°å", "è¶£".decompose)
+    assert_equal(IDC_FLL+"èµ°å¬", "è¶".decompose)
+    assert_equal(IDC_FLL+"æ¯é ", "é¡".decompose)
+    assert_equal(IDC_FLL+"åå", "å".decompose)
+    assert_equal(IDC_FLL+"é¬¼æª", "é­".decompose)
+    assert_equal(IDC_FLL+"é»ç¬", "é»".decompose)
+
+    assert_equal(IDC_O, "å¤ª".decompose.first_char)
+    assert_equal(IDC_O+"å¤§ä¸¶", "å¤ª".decompose)
+    assert_equal(IDC_O+"è¡£ä¸­", "è¡·".decompose)
+    assert_equal(IDC_O+"è¡£é", "è£".decompose)
+    assert_equal(IDC_O+"å¹å·³", "å".decompose)
+    assert_equal(IDC_O+"å¹ä¹", "å".decompose)
+    assert_equal(IDC_O+"æ¨æ¥", "æ±".decompose)
+    assert_equal(IDC_O+"å¼ä¸", "å¼".decompose)
+    assert_equal(IDC_O+"è¡£ä¿", "è¤".decompose)
+  end
+  def test_glyph_decompose
+    assert_equal("é³", "é³".decompose)
+#    assert_equal(IDC_AB+"ç«æ¥", "é³".glyph_decompose)
+    assert_equal(IDC_FLL, "ä¸".decompose.first_char)
+    assert_equal("ä¸", "ä¸".glyph_decompose)
+  end
   def test_find
 #    p "æ¥é²".find #"æ"
     assert(4 <= "æ¥é²".find .char_length) #"æ"
-- 
1.7.10.4