1 ;; -*- coding: utf-8-mcs-er -*-
2 (require 'char-db-util)
3 ;; (require 'concord-images)
;; File names are encoded with the same coding system that this file
;; declares for itself in its coding cookie.
(setq file-name-coding-system 'utf-8-mcs-er)

;; Hand every genre to `concord-assign-genre' together with the database
;; directory it lives in.  Genres sharing a directory are grouped; the
;; overall call order is unchanged.
(dolist (genre '(image-resource
		 glyph-image))
  (concord-assign-genre genre "/usr/local/var/photo/db"))

(dolist (genre '(creator@ruimoku
		 person-name@ruimoku
		 journal-volume@ruimoku
		 article@ruimoku
		 book@ruimoku
		 classification@ruimoku
		 region@ruimoku
		 era@ruimoku
		 period@ruimoku
		 journal@ruimoku
		 journal-name@ruimoku
		 publisher@ruimoku
		 publisher-name@ruimoku))
  (concord-assign-genre genre "/usr/local/var/ruimoku/db"))

(mount-char-attribute-table '*instance@ruimoku/bibliography/title)
;; Currently disabled:
;; (mount-char-attribute-table '*instance@ruimoku/bibliography/content*note)

(dolist (genre '(entry@zh-classical
		 word-class@zh-classical
		 morpheme@zh-classical
		 sentence@zh-classical))
  (concord-assign-genre genre "/usr/local/var/kanbun/db"))
;; Currently disabled:
;; (concord-assign-genre 'morpheme-entry@zh-classical "/usr/local/var/kanbun/db")
;; (concord-assign-genre 'sentence-entry@zh-classical "/usr/local/var/kanbun/db")

(mount-char-attribute-table '*instance@morpheme-entry/zh-classical)

(concord-assign-genre 'hng-card "/usr/local/var/hng-card/db")

(dolist (feature '(->HNG <-HNG))
  (mount-char-attribute-table feature))
(defvar est-hide-cgi-mode nil
  "Non-nil selects path-style URLs instead of CGI query-string URLs.
`www-uri-make-feature-name-url' consults this to choose between a
\"../feature/...\" path and a `chise-wiki-view-url' query.")

(defvar est-view-url-prefix ".."
  "Prefix string, presumably prepended to view URLs.
Its consumers are not part of the visible code; confirm before relying
on this description.")

(defvar chise-wiki-view-url "view.cgi"
  "URL of the view CGI.
Used as the base of query-style URLs when `est-hide-cgi-mode' is nil.")

(defvar chise-wiki-edit-url "edit.cgi"
  "URL of the edit CGI (presumably; not referenced in the visible code).")

(defvar chise-wiki-bitmap-glyphs-url
  "http://www.chise.org/glyphs"
  "Base URL substituted into the src of bitmap glyph <img> tags.")

(defvar chise-wiki-hng-bitmap-glyphs-url
  "http://hng.chise.org/glyphs/HNG"
  "Base URL substituted into the src of HNG glyph <img> tags.")

(defvar chise-wiki-glyph-cgi-url
  "http://www.chise.org/chisewiki/glyph.cgi"
  "URL of the glyph CGI, used as \"URL?char=ID\" in <img> src attributes.")

(defvar chise-wiki-displayed-features nil
  "Initially nil; its meaning is defined by code outside the visible part.")
;; Ordered list of coded-charset (CCS) feature names.
;; `www-uri-encode-object' pops entries from the front of this list and
;; uses the first CCS for which `encode-char' (with `defined-only')
;; returns a code point, so earlier entries take precedence.
;; NOTE(review): the opening and closing of the list, and some entries,
;; are on lines missing from this listing.
62 (defvar est-coded-charset-priority-list
64 =cns11643-1 =cns11643-2 =cns11643-3
65 =cns11643-4 =cns11643-5 =cns11643-6 =cns11643-7
67 =jis-x0208 =jis-x0208@1990
72 =jis-x0213-1@2000 =jis-x0213-1@2004
73 =jis-x0208@1983 =jis-x0208@1978
74 =zinbun-oracle =>zinbun-oracle
78 =>>>jis-x0208 =>>>jis-x0213-1 =>>>jis-x0213-2
79 =>>jis-x0208 =>>jis-x0213-1 =>>jis-x0213-2
81 =+>jis-x0208 =+>jis-x0213-1 =+>jis-x0213-2
84 =>jis-x0208 =>jis-x0213-1
86 =>ucs@iso =>ucs@unicode
87 =>ucs@jis =>ucs@cns =>ucs@ks
88 =>>ucs@iso =>>ucs@unicode
89 =>>ucs@jis =>>ucs@cns =>>ucs@ks
90 =>>>ucs@iso =>>>ucs@unicode
91 =>>>ucs@jis =>>>ucs@cns =>>>ucs@ks
;; Decode a percent-escaped STRING: each %XX escape is converted from its
;; two hex digits, and the assembled text is passed to
;; `decode-coding-string'.
;; NOTE(review): several lines of this definition are missing from this
;; listing (including where CODING-SYSTEM is consumed and what is returned
;; for an empty STRING); the comments describe only the visible code.
114 (defun decode-uri-string (string &optional coding-system)
115 (if (> (length string) 0)
119 (mapconcat (lambda (char)
122 (char-to-string char)))
;; For every %XX found at or after position i: keep the text that precedes
;; the escape, then add the value parsed from the two hex digits.
;; The character class lists only 0-9 and A-F; whether lower-case digits
;; also match depends on `case-fold-search'.
124 (while (string-match "%\\([0-9A-F][0-9A-F]\\)" string i)
125 (setq dest (concat dest
126 (substring string i (match-beginning 0))
129 (string-to-int (match-string 1 string) 16))))
;; The text after the last escape is appended unchanged before decoding.
131 (decode-coding-string
132 (concat dest (substring string i))
;; Return the type of FEATURE-NAME: its explicit `type' property when one
;; is set, otherwise a type derived from the spelling of the feature name.
;; NOTE(review): the result expression of each `cond' clause is on lines
;; missing from this listing; only the tests are visible.
135 (defun www-feature-type (feature-name)
136 (or (char-feature-property feature-name 'type)
137 (let ((str (symbol-name feature-name)))
;; Name ends in "*note", optionally followed by an "@..." part.
139 ((string-match "\\*note\\(@[^*]+\\)?$" str)
;; Name ends in "*sources", optionally followed by an "@..." part.
141 ((string-match "\\*sources\\(@[^*]+\\)?$" str)
;; Any other name containing "*".
143 ((string-match "\\*" str)
;; Name starts with "->" or "<-".
145 ((string-match "^\\(->\\|<-\\)" str)
;; Name is "ideographic-structure", bare or followed by "@...".
147 ((string-match "^ideographic-structure\\(@\\|$\\)" str)
;; Return the presentation format of FEATURE-NAME.
;; Lookup order visible here: the feature's own `presentation-format'
;; property, then its `format' property, then a search that walks up the
;; parents given by `char-feature-name-parent', and finally the default
;; format ((name) " : " (value)).
;; NOTE(review): parts of the parent walk are on lines missing from this
;; listing.
151 (defun www-feature-format (feature-name)
152 (or (char-feature-property feature-name 'presentation-format)
153 (char-feature-property feature-name 'format)
155 (setq fn feature-name)
156 (while (and (setq parent (char-feature-name-parent fn))
158 (char-feature-property
;; Default used when nothing above produced a format.
162 '((name) " : " (value))))
;; Return the format used to present the value of FEATURE-NAME.
;; Lookup order visible here: the feature's own `value-presentation-format'
;; or `value-format' property, the same two properties on its parents
;; (via `char-feature-name-parent'), a format chosen from the result of
;; `www-feature-type', and finally a code-point format when FEATURE-NAME
;; names a charset.
;; NOTE(review): some lines of this definition are missing from this
;; listing, including the result for the `relation' type.
164 (defun www-feature-value-format (feature-name)
165 (or (char-feature-property feature-name 'value-presentation-format)
166 (char-feature-property feature-name 'value-format)
168 (setq fn feature-name)
;; Walk up the parent chain until a parent supplies one of the properties.
169 (while (and (setq parent (char-feature-name-parent fn))
171 (or (char-feature-property
172 parent 'value-presentation-format)
173 (char-feature-property
174 parent 'value-format)))))
177 (let ((type (www-feature-type feature-name)))
178 (cond ((eq type 'relation)
180 ((eq type 'structure)
181 'space-separated-ids)
;; Charset features: sets of dimension 2 with 94 chars per dimension get a
;; format that also includes a (ku-ten) element; all other charsets get
;; hex plus decimal.
185 (if (find-charset feature-name)
186 (if (and (= (charset-dimension feature-name) 2)
187 (= (charset-chars feature-name) 94))
189 " (" (decimal) ") <" (ku-ten) "> " (prev-char) (next-char))
190 '("0x" (HEX) " (" (decimal) ") " (prev-char) (next-char))))
;; Build the name of FEATURE-NAME qualified by DOMAIN and return it as an
;; interned symbol.
;; NOTE(review): some lines (including the `cond' head and at least one
;; clause test) are missing from this listing.
193 (defun char-feature-name-at-domain (feature-name domain)
195 (let ((name (symbol-name feature-name)))
;; The name already ends in an "@..." part: append DOMAIN after a "/".
197 ((string-match "@[^*]+$" name)
198 (intern (format "%s/%s" name domain))
;; Otherwise DOMAIN is attached with "@" (the clause test is not visible).
201 (intern (format "%s@%s" name domain))
(defun char-feature-name-parent (feature-name)
  "Return the parent of FEATURE-NAME as a symbol, or nil if it has none.
The parent is obtained by dropping the last component of the trailing
\"@DOMAIN/SUB/...\" part: the final \"/SUB\" when there is one, otherwise
the whole \"@DOMAIN\".  A name without such a trailing part has no parent."
  (let* ((full (symbol-name feature-name))
	 (domain-start (string-match "@[^@/*]+\\(/[^@/*]+\\)*$" full)))
    (when domain-start
      ;; Group 1 holds the last "/SUB" component when one was matched;
      ;; without it, cut at the "@" itself.
      (intern (substring full 0 (or (match-beginning 1) domain-start))))))
(defun char-feature-name-domain (feature-name)
  "Return the domain part of FEATURE-NAME as a symbol, or nil if absent.
The domain is everything after the \"@\" of a trailing \"@DOMAIN/SUB/...\"
part of the feature name."
  (let* ((full (symbol-name feature-name))
	 (at-pos (string-match "@[^@/*]+\\(/[^@/*]+\\)*$" full)))
    ;; Skip the "@" itself; the remainder is the domain.
    (and at-pos
	 (intern (substring full (1+ at-pos))))))
;; Strip a trailing "@$rev=latest" or "/$rev=latest" from the name of
;; FEATURE and return the shortened name as an interned symbol.
;; NOTE(review): the else branch and the closing of this definition are on
;; lines missing from this listing.
215 (defun char-feature-name-sans-versions (feature)
216 (let ((feature-name (symbol-name feature)))
217 (if (string-match "[@/]\\$rev=latest$" feature-name)
218 (intern (substring feature-name 0 (match-beginning 0)))
;; Return the genre of OBJECT.  Non-character objects are delegated to
;; `concord-object-genre'.
;; NOTE(review): the value returned for characters is on a line missing
;; from this listing.
221 (defun est-object-genre (object)
222 (if (characterp object)
224 (concord-object-genre object)))
;; Return the value of FEATURE for OBJECT, preferring the "$rev=latest"
;; variant of the feature (built with `char-feature-name-at-domain') and
;; falling back to FEATURE itself.
;; NOTE(review): the tests selecting between the two paths below, and the
;; `condition-case' handlers, are on lines missing from this listing.
226 (defun www-get-feature-value (object feature)
227 (let ((latest-feature (char-feature-name-at-domain feature '$rev=latest)))
;; Path using `char-feature': the latest-revision table is mounted first.
230 (mount-char-attribute-table latest-feature)
231 (or (char-feature object latest-feature)
232 (char-feature object feature))
;; Path using `concord-object-get'; the lookup of the latest revision is
;; wrapped in `condition-case'.
235 (or (condition-case nil
236 (concord-object-get object latest-feature)
239 (concord-object-get object feature)
;; Compute the code point that precedes CODE in the coded charset CCS.
;; CODE is split into one byte per charset dimension, the lowest byte is
;; decremented with borrow into higher bytes, and the bytes are recombined.
;; NOTE(review): the computation of mask, byte-min and byte-max and the
;; loop heads are on lines missing from this listing.
243 (defun get-previous-code-point (ccs code)
244 (let ((chars (charset-chars ccs))
245 (dim (charset-dimension ccs))
247 mask byte-min byte-max
270 (setq bytes (make-vector dim 0))
;; Byte i of CODE is stored at index i (index 0 = least significant).
272 (aset bytes i (logand (lsh code (* i -8)) mask))
;; Decrement byte i; while the result falls below byte-min, wrap that byte
;; to byte-max (the step to the next byte is not visible here).
275 (while (and (< i dim)
277 (aset bytes i (1- (aref bytes i)))
278 (< (aref bytes i) byte-min)))
279 (aset bytes i byte-max)
;; Reassemble the integer from the byte vector.
282 (setq dest (aref bytes 0)
285 (setq dest (logior dest (lsh (aref bytes i) (* i 8)))
;; Compute the code point that follows CODE in the coded charset CCS.
;; CODE is split into one byte per charset dimension, the lowest byte is
;; incremented with carry into higher bytes, and the bytes are recombined.
;; NOTE(review): the computation of mask, byte-min and byte-max and the
;; loop heads are on lines missing from this listing.
289 (defun get-next-code-point (ccs code)
290 (let ((chars (charset-chars ccs))
291 (dim (charset-dimension ccs))
293 mask byte-min byte-max
316 (setq bytes (make-vector dim 0))
;; Byte i of CODE is stored at index i (index 0 = least significant).
318 (aset bytes i (logand (lsh code (* i -8)) mask))
;; Increment byte i; while the result exceeds byte-max, wrap that byte to
;; byte-min (the step to the next byte is not visible here).
321 (while (and (< i dim)
323 (aset bytes i (1+ (aref bytes i)))
324 (> (aref bytes i) byte-max)))
325 (aset bytes i byte-min)
;; Reassemble the integer from the byte vector.
328 (setq dest (aref bytes 0)
331 (setq dest (logior dest (lsh (aref bytes i) (* i 8)))
;; Starting just below CODE, step backwards through CCS with
;; `get-previous-code-point' for as long as `decode-char' yields nil.
;; NOTE(review): the loop head, its bounds and the return value are on
;; lines missing from this listing.
335 (defun find-previous-defined-code-point (ccs code)
336 (let ((i (get-previous-code-point ccs code))
;; The unversioned JIS names are replaced by a specific edition before
;; decoding.
339 ((eq ccs '=jis-x0208)
340 (setq ccs '=jis-x0208@1990))
341 ((eq ccs '=jis-x0213-1)
342 (setq ccs '=jis-x0213-1@2004)))
;; An extra argument is passed to `decode-char' unless CCS is `=ucs' (the
;; argument itself is not visible here).
345 (null (setq char (decode-char ccs i
346 (unless (eq ccs '=ucs)
348 (setq i (get-previous-code-point ccs i)))
;; Starting just above CODE, step forwards through CCS with
;; `get-next-code-point' for as long as `decode-char' yields nil.
;; NOTE(review): the loop head and the return value are on lines missing
;; from this listing.
351 (defun find-next-defined-code-point (ccs code)
352 (let ((i (get-next-code-point ccs code))
;; max is CODE + 1000; presumably an upper bound for the search -- its use
;; is not visible here, confirm against the full source.
354 (setq max (+ code 1000))
;; The unversioned JIS names are replaced by a specific edition before
;; decoding.
356 ((eq ccs '=jis-x0208)
357 (setq ccs '=jis-x0208@1990))
358 ((eq ccs '=jis-x0213-1)
359 (setq ccs '=jis-x0213-1@2004)))
;; An extra argument is passed to `decode-char' unless CCS is `=ucs' (the
;; argument itself is not visible here).
362 (null (setq char (decode-char ccs i
363 (unless (eq ccs '=ucs)
365 (setq i (get-next-code-point ccs i)))
369 ;;; @ URI representation
;; Decode the body of a feature name as written in a URI.
;; The visible code scans URI-FEATURE character by character and gives
;; special treatment to three-character sequences of the form ".c." (a dot,
;; one character, a dot); all other characters are copied through.
;; NOTE(review): the loop head and the replacement chosen for each ".c."
;; sequence are on lines missing from this listing.
372 (defun est-uri-decode-feature-name-body (uri-feature)
373 (let ((len (length uri-feature))
380 (if (eq (aref uri-feature i) ?\.)
;; A dot counts as an escape only if another dot follows two positions on.
381 (if (and (< (+ i 2) len)
382 (eq (aref uri-feature (+ i 2)) ?\.))
;; ch is the character between the two dots; "..." is tested first.
385 ((eq (setq ch (aref uri-feature (1+ i))) ?\.)
390 (substring uri-feature i (+ i 3))
396 (char-to-string (aref uri-feature i))
;; Encode the body of a feature name for use in a URI by mapping over its
;; characters with `mapconcat'.  Characters not handled by an earlier
;; clause are emitted unchanged.
;; NOTE(review): the clauses for the escaped characters are on lines
;; missing from this listing.
400 (defun est-uri-encode-feature-name-body (feature)
401 (mapconcat (lambda (c)
406 (t (char-to-string c))))
;; Convert the URI spelling of a feature name (URI-FEATURE, a string) back
;; into the feature-name symbol.  After percent-decoding, a leading keyword
;; such as "from." or "rep." is replaced by the matching feature-name
;; prefix and the rest is decoded by `est-uri-decode-feature-name-body'.
;; NOTE(review): some lines (the `let'/`cond' heads, the fill characters
;; passed to `make-string', and the results of the charset-probing clauses)
;; are missing from this listing.
409 (defun www-uri-decode-feature-name (uri-feature)
411 (setq uri-feature (decode-uri-string uri-feature 'utf-8-mcs-er))
;; "from." -> "<-"
413 ((string-match "^from\\." uri-feature)
414 (intern (format "<-%s"
415 (est-uri-decode-feature-name-body
416 (substring uri-feature (match-end 0)))))
;; "to." -> "->"
418 ((string-match "^to\\." uri-feature)
419 (intern (format "->%s"
420 (est-uri-decode-feature-name-body
421 (substring uri-feature (match-end 0)))))
;; "rep." -> "="
423 ((string-match "^rep\\." uri-feature)
424 (intern (format "=%s"
425 (est-uri-decode-feature-name-body
426 (substring uri-feature (match-end 0)))))
;; "rep2." or "repi." -> "==="
428 ((string-match "^rep[2i]\\." uri-feature)
429 (intern (format "===%s"
430 (est-uri-decode-feature-name-body
431 (substring uri-feature (match-end 0)))))
;; "g." -> "=>>"
433 ((string-match "^g\\." uri-feature)
434 (intern (format "=>>%s"
435 (est-uri-decode-feature-name-body
436 (substring uri-feature (match-end 0)))))
;; "gi." or "g2." -> "=="
438 ((string-match "^g[i2]\\." uri-feature)
439 (intern (format "==%s"
440 (est-uri-decode-feature-name-body
441 (substring uri-feature (match-end 0)))))
;; "giN." -> "=>>" followed by a run of N fill characters.
443 ((string-match "^gi\\([0-9]+\\)\\." uri-feature)
444 (intern (format "=>>%s%s"
445 (make-string (string-to-int
446 (match-string 1 uri-feature))
448 (est-uri-decode-feature-name-body
449 (substring uri-feature (match-end 0)))))
;; "o." -> "=+>"
451 ((string-match "^o\\." uri-feature)
452 (intern (format "=+>%s"
453 (est-uri-decode-feature-name-body
454 (substring uri-feature (match-end 0)))))
;; "a." -> "=>"
456 ((string-match "^a\\." uri-feature)
457 (intern (format "=>%s"
458 (est-uri-decode-feature-name-body
459 (substring uri-feature (match-end 0)))))
;; "aN." -> a run of N fill characters followed by ">".
461 ((string-match "^a\\([0-9]+\\)\\." uri-feature)
462 (intern (format "%s>%s"
463 (make-string (string-to-int
464 (match-string 1 uri-feature))
466 (est-uri-decode-feature-name-body
467 (substring uri-feature (match-end 0)))))
;; No keyword prefix: decode the whole name, then probe whether the name
;; prefixed with "=>", "=>>", "=>>>" or "=" is a known charset.
469 ((and (setq uri-feature (est-uri-decode-feature-name-body uri-feature))
470 (setq feature (intern (format "=>%s" uri-feature)))
471 (find-charset feature))
473 ((and (setq feature (intern (format "=>>%s" uri-feature)))
474 (find-charset feature))
476 ((and (setq feature (intern (format "=>>>%s" uri-feature)))
477 (find-charset feature))
479 ((and (setq feature (intern (format "=%s" uri-feature)))
480 (find-charset feature))
;; Fallback: the decoded name itself.
482 (t (intern uri-feature)))))
;; Convert the symbol FEATURE-NAME into its URI spelling.  Each clause
;; recognises one feature-name prefix ("=+>", "=", "==", "===", "=>>",
;; "=>>>", longer ">" runs, "=>", "=...=>", "->", "<-") and encodes the
;; remainder with `est-uri-encode-feature-name-body'.
;; NOTE(review): the `cond' head and the format strings that supply the URI
;; keyword of each clause are on lines missing from this listing.
484 (defun www-uri-encode-feature-name (feature-name)
485 (setq feature-name (symbol-name feature-name))
487 ((string-match "^=\\+>\\([^=>]+\\)" feature-name)
489 (est-uri-encode-feature-name-body
490 (substring feature-name (match-beginning 1))))
492 ((string-match "^=\\([^=>]+\\)" feature-name)
494 (est-uri-encode-feature-name-body
495 (substring feature-name (match-beginning 1))))
497 ((string-match "^==\\([^=>]+\\)" feature-name)
499 (est-uri-encode-feature-name-body
500 (substring feature-name (match-beginning 1))))
502 ((string-match "^===\\([^=>]+\\)" feature-name)
504 (est-uri-encode-feature-name-body
505 (substring feature-name (match-beginning 1))))
507 ((string-match "^=>>\\([^=>]+\\)" feature-name)
509 (est-uri-encode-feature-name-body
510 (substring feature-name (match-beginning 1))))
512 ((string-match "^=>>>\\([^=>]+\\)" feature-name)
514 (est-uri-encode-feature-name-body
515 (substring feature-name (match-beginning 1))))
;; "=>>" followed by further ">" characters: the number of extra ">" is
;; passed to the (elided) format string.
517 ((string-match "^=>>\\(>+\\)" feature-name)
519 (length (match-string 1 feature-name))
520 (est-uri-encode-feature-name-body
521 (substring feature-name (match-end 1))))
523 ((string-match "^=>\\([^=>]+\\)" feature-name)
525 (est-uri-encode-feature-name-body
526 (substring feature-name (match-beginning 1))))
;; A run of "=" followed by ">": the length of the "=" run is passed to the
;; (elided) format string.
528 ((string-match "^\\(=+\\)>" feature-name)
530 (length (match-string 1 feature-name))
531 (est-uri-encode-feature-name-body
532 (substring feature-name (match-end 0))))
534 ((string-match "^->" feature-name)
536 (est-uri-encode-feature-name-body
537 (substring feature-name (match-end 0))))
539 ((string-match "^<-" feature-name)
541 (est-uri-encode-feature-name-body
542 (substring feature-name (match-end 0))))
;; No recognised prefix: encode the whole name.
544 (t (est-uri-encode-feature-name-body feature-name))))
(defun www-uri-make-feature-name-url (uri-genre uri-feature-name uri-object)
  "Return the URL of the page for URI-FEATURE-NAME of URI-OBJECT.
URI-GENRE, URI-FEATURE-NAME and URI-OBJECT are inserted as given.
When `est-hide-cgi-mode' is non-nil the result is a relative path below
\"../feature/\"; otherwise it is a query on `chise-wiki-view-url'."
  (cond
   (est-hide-cgi-mode
    ;; Path form: ../feature/FEATURE&GENRE/OBJECT
    (format "../feature/%s&%s/%s"
	    uri-feature-name uri-genre uri-object))
   (t
    ;; Query form: VIEW?feature=FEATURE&GENRE=OBJECT
    (format "%s?feature=%s&%s=%s"
	    chise-wiki-view-url uri-feature-name uri-genre uri-object))))
;; Decode CHAR-REP, the URI spelling of an object of GENRE, into the object.
;; Two spellings are visible: "CCS<sep>CODE" (a coded-charset name plus a
;; code point or id) and a bare representation without a separator.
;; NOTE(review): the `let'/`cond' heads and several clause tests are on
;; lines missing from this listing.
553 (defun www-uri-decode-object (genre char-rep)
;; Separator: ":" or "%3A"; in hide-cgi mode "=" and "%3D" are accepted too.
556 ((string-match (if est-hide-cgi-mode
557 "\\(%3D\\|=\\|%3A\\|:\\)"
558 "\\(%3A\\|:\\)") char-rep)
559 (setq ccs (substring char-rep 0 (match-beginning 0))
560 cpos (substring char-rep (match-end 0)))
561 (setq ccs (www-uri-decode-feature-name ccs))
562 (setq cpos (est-uri-decode-feature-name-body cpos))
;; A "0x" prefix marks a hexadecimal code point.
564 ((string-match "^0x" cpos)
566 (string-to-number (substring cpos (match-end 0)) 16))
;; Otherwise the position is read as a Lisp object.
569 (setq cpos (car (read-from-string
571 cpos file-name-coding-system))))
;; Characters are resolved with `decode-char'; other genres go through
;; `concord-decode-object'.
573 (if (and (eq genre 'character)
575 (decode-char ccs cpos)
576 (concord-decode-object ccs cpos genre))
;; No separator: percent-decode the whole representation first.
579 (setq char-rep (decode-uri-string char-rep 'utf-8-mcs-er))
581 ((eq genre 'character)
582 (when (= (length char-rep) 1)
;; Objects looked up by `=id': feature names are decoded first, everything
;; else is read as a Lisp object.
586 (concord-decode-object
587 '=id (www-uri-decode-feature-name char-rep) 'feature)
590 (concord-decode-object
591 '=id (car (read-from-string char-rep)) genre)
;; Return the URI spelling of OBJECT.
;; For characters the visible strategies are, in order: percent-encoded
;; bytes of the character when it has a `=ucs' code; the first CCS of
;; `est-coded-charset-priority-list' that defines it; the charset reported
;; by `split-char'; and finally its `system-char-id'.  Non-character
;; objects are spelled from `concord-object-id'.
;; NOTE(review): several lines (loop heads and most format strings) are
;; missing from this listing.
594 (defun www-uri-encode-object (object)
595 (if (characterp object)
596 (if (encode-char object '=ucs)
;; Each byte of the encoded character is written as %XX.
599 (format "%%%02X" byte))
600 (encode-coding-string (char-to-string object) 'utf-8-mcs-er)
602 (let ((ccs-list est-coded-charset-priority-list)
;; Walk the priority list until a CCS yields a defined code point.
605 (setq ccs (pop ccs-list))
606 (not (setq ret (encode-char object ccs 'defined-only)))))
608 (format (if est-hide-cgi-mode
611 (www-uri-encode-feature-name ccs)
613 ((and (setq ccs (car (split-char object)))
614 (setq ret (encode-char object ccs)))
615 (format (if est-hide-cgi-mode
618 (www-uri-encode-feature-name ccs)
;; Last resort for characters: the system character id, with "=" as the
;; separator in hide-cgi mode and ":" otherwise.
621 (format (if est-hide-cgi-mode
622 "system-char-id=0x%X"
623 "system-char-id:0x%X")
624 (encode-char object 'system-char-id))
;; Non-character objects.
626 (format (if est-hide-cgi-mode
629 (est-uri-encode-feature-name-body
630 (format "%s" (concord-object-id object))))))
;; Return a display form of OBJECT.  A character is returned as a
;; one-character string.  For other objects, when READABLE is non-nil the
;; first non-nil of the `name', `=name' and `title' values is looked up,
;; with `concord-object-id' as the fallback.
;; NOTE(review): the body of the `let' (how `ret' is turned into the
;; result) is on lines missing from this listing.
632 (defun est-format-object (object &optional readable)
633 (if (characterp object)
634 (char-to-string object)
635 (let ((ret (or (if readable
636 (or (concord-object-get object 'name)
637 (concord-object-get object '=name)
638 (concord-object-get object 'title)))
639 (concord-object-id object))))
;; Build the URL of the page for OBJECT from its genre
;; (`est-object-genre') and its URI spelling (`www-uri-encode-object'),
;; with one variant for hide-cgi mode and one for CGI mode.
;; NOTE(review): the format strings and the handling of URI-OBJECT are on
;; lines missing from this listing.
642 (defun www-uri-make-object-url (object &optional uri-object)
643 (if est-hide-cgi-mode
646 (est-object-genre object)
648 (www-uri-encode-object object)))
651 (est-object-genre object)
653 (www-uri-encode-object object)))))
656 ;;; @ Feature name presentation
;; Default presentation of FEATURE-NAME, derived from its symbol name.
;; NOTE(review): the processing applied to the name is on lines missing
;; from this listing.
659 (defun www-format-feature-name-default (feature-name)
663 (symbol-name feature-name)
;; Present a metadata feature name.  A name of the form "BASE*META" is
;; split at its last "*": BASE is formatted with
;; `www-format-feature-name*' (passing LANG) and combined with the META
;; part; names without "*" fall back to `www-format-feature-name-default'.
;; NOTE(review): the `cond' head and how META is rendered are on lines
;; missing from this listing.
667 (defun www-format-feature-name-as-metadata (feature-name &optional lang)
668 (let ((str (symbol-name feature-name))
671 ((string-match "\\*[^*]+$" str)
;; meta keeps its leading "*".
672 (setq base (substring str 0 (match-beginning 0))
673 meta (substring str (match-beginning 0)))
674 (concat (www-format-feature-name* (intern base) lang)
677 (www-format-feature-name-default feature-name)
(defun www-format-feature-name-as-rel-to (feature-name)
  "Return the name of FEATURE-NAME with its first two characters replaced
by a rightwards arrow.  Callers pass names that start with \"->\"."
  (let ((body (substring (symbol-name feature-name) 2)))
    (concat "\u2192" body)))
(defun www-format-feature-name-as-rel-from (feature-name)
  "Return the name of FEATURE-NAME with its first two characters replaced
by a leftwards arrow.  Callers pass names that start with \"<-\"."
  (let ((body (substring (symbol-name feature-name) 2)))
    (concat "\u2190" body)))
;; Present a coded-charset feature name in upper case.  The name is broken
;; into parts (`rest'); the first part is upcased, and a leading run of "="
;; and ">" characters is handled separately from the rest of that part.
;; A purely numeric last part is joined with "-", any other part with a
;; space.
;; NOTE(review): how the name is split, what is inserted after the "=>"
;; run, and the loop head are on lines missing from this listing.
686 (defun www-format-feature-name-as-CCS (feature-name)
689 (symbol-name feature-name)
691 (dest (upcase (pop rest))))
692 (when (string-match "^=+>*" dest)
693 (setq dest (concat (substring dest 0 (match-end 0))
695 (substring dest (match-end 0)))))
699 (setq dest (concat dest " " (upcase (pop rest)))))
700 (if (string-match "^[0-9]+$" (car rest))
701 (concat dest "-" (car rest))
702 (concat dest " " (upcase (car rest))))
;; Return the human-readable name of FEATURE-NAME, without HTML encoding.
;; Sources tried, in the order visible here: the feature's own "name@LANG"
;; or `name' property; metadata formatting for names containing "*"; a
;; name property inherited from a parent (via `char-feature-name-parent')
;; with the remaining suffix of the feature name appended; charset
;; formatting; "->" / "<-" relation formatting; and the default formatting.
;; NOTE(review): the `cond' head and parts of several clauses are on lines
;; missing from this listing.
706 (defun www-format-feature-name* (feature-name &optional lang)
707 (let (name fn parent ret)
710 (char-feature-property
712 (intern (format "name@%s" lang))))
713 (char-feature-property
714 feature-name 'name)))
715 ((and (setq name (symbol-name feature-name))
716 (string-match "\\*" name))
717 (www-format-feature-name-as-metadata feature-name lang))
;; Climb the parent chain looking for a name property.
719 (setq fn feature-name)
720 (while (and (setq parent (char-feature-name-parent fn))
723 (char-feature-property
725 (intern (format "name@%s" lang))))
726 (char-feature-property
;; Append the part of the feature name that extends beyond the parent.
731 (concat ret (substring (symbol-name feature-name)
732 (length (symbol-name parent)))))
733 ((find-charset feature-name)
734 (www-format-feature-name-as-CCS feature-name))
735 ((string-match "^\\(->\\)" name)
736 (www-format-feature-name-as-rel-to feature-name))
737 ((string-match "^\\(<-\\)" name)
738 (www-format-feature-name-as-rel-from feature-name))
740 (www-format-feature-name-default feature-name)
(defun www-format-feature-name (feature-name &optional lang)
  "Return the display name of FEATURE-NAME encoded for output.
The name is produced by `www-format-feature-name*' (LANG is passed
through to it) and then processed by `www-format-encode-string'."
  (let ((label (www-format-feature-name* feature-name lang)))
    (www-format-encode-string label)))
(defvar www-format-char-img-style "vertical-align:bottom;"
  "Inline CSS string passed to the <img> templates that
`www-format-encode-string' builds for glyph images.")
754 (defun www-format-encode-string (string &optional without-tags as-body)
757 (let (plane code subcode start end char variants ret rret)
759 (goto-char (point-min))
760 (while (search-forward "&" nil t)
761 (replace-match "&" nil t)))
762 (goto-char (point-min))
763 (while (search-forward "<" nil t)
764 (replace-match "<" nil t))
765 (goto-char (point-min))
766 (while (search-forward ">" nil t)
767 (replace-match ">" nil t))
769 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
770 (let ((coded-charset-entity-reference-alist
774 '(=hanyo-denshi/ja "HD-JA-" 4 X)
775 '(=hanyo-denshi/jb "HD-JB-" 4 X)
776 '(=hanyo-denshi/jc "HD-JC-" 4 X)
777 '(=hanyo-denshi/jd "HD-JD-" 4 X)
778 '(=hanyo-denshi/ft "HD-FT-" 4 X)
779 '(=hanyo-denshi/ia "HD-IA-" 4 X)
780 '(=hanyo-denshi/ib "HD-IB-" 4 X)
781 '(=hanyo-denshi/hg "HD-HG-" 4 X)
782 '(=hanyo-denshi/ip "HD-IP-" 4 X)
783 '(=hanyo-denshi/jt "HD-JT-" 4 X)
784 '(=hanyo-denshi/ks "HD-KS-" 6 d)
785 '(=>>hanyo-denshi/ja "G-HD-JA-" 4 X)
786 '(=>>hanyo-denshi/jb "G-HD-JB-" 4 X)
787 '(=>>hanyo-denshi/jc "G-HD-JC-" 4 X)
788 '(=>>hanyo-denshi/jd "G-HD-JD-" 4 X)
789 '(=>>hanyo-denshi/ft "G-HD-FT-" 4 X)
790 '(=>>hanyo-denshi/ia "G-HD-IA-" 4 X)
791 '(=>>hanyo-denshi/ib "G-HD-IB-" 4 X)
792 '(=>>hanyo-denshi/hg "G-HD-HG-" 4 X)
793 '(=>>hanyo-denshi/ip "G-HD-IP-" 4 X)
794 '(=>>hanyo-denshi/jt "G-HD-JT-" 4 X)
795 '(=>>hanyo-denshi/ks "G-HD-KS-" 6 d)
797 '(==hanyo-denshi/ja "g2-HD-JA-" 4 X)
798 '(==hanyo-denshi/jb "g2-HD-JB-" 4 X)
799 '(==hanyo-denshi/jc "g2-HD-JC-" 4 X)
800 '(==hanyo-denshi/jd "g2-HD-JD-" 4 X)
801 '(==hanyo-denshi/ft "g2-HD-FT-" 4 X)
802 '(==hanyo-denshi/ia "g2-HD-IA-" 4 X)
803 '(==hanyo-denshi/ib "g2-HD-IB-" 4 X)
804 '(==hanyo-denshi/hg "g2-HD-HG-" 4 X)
805 '(==hanyo-denshi/ip "g2-HD-IP-" 4 X)
806 '(==hanyo-denshi/jt "g2-HD-JT-" 4 X)
807 '(==hanyo-denshi/ks "g2-HD-KS-" 6 d)
808 '(=cns11643-1 "C1-" 4 X)
809 '(=cns11643-2 "C2-" 4 X)
810 '(=cns11643-3 "C3-" 4 X)
811 '(=cns11643-4 "C4-" 4 X)
812 '(=cns11643-5 "C5-" 4 X)
813 '(=cns11643-6 "C6-" 4 X)
814 '(=cns11643-7 "C7-" 4 X)
815 '(=adobe-japan1-6 "AJ1-" 5 d)
816 '(=big5-cdp "CDP-" 4 X)
818 '(=gb12345 "G1-" 4 X)
819 '(=jis-x0208@1990 "J90-" 4 X)
820 '(=jis-x0212 "JSP-" 4 X)
822 '(=jis-x0208@1997 "J97-" 4 X)
823 '(=jis-x0208@1978 "J78-" 4 X)
824 '(=jis-x0208@1983 "J83-" 4 X)
825 '(=ruimoku-v6 "RUI6-" 4 X)
826 '(=zinbun-oracle "ZOB-" 4 d)
827 '(=jef-china3 "JC3-" 4 X)
828 '(=ucs@unicode "UU+" 4 X)
829 '(=ucs@JP/hanazono "hanaJU+" 4 X)
830 '(==cns11643-1 "R-C1-" 4 X)
831 '(==cns11643-2 "R-C2-" 4 X)
832 '(==cns11643-3 "R-C3-" 4 X)
833 '(==cns11643-4 "R-C4-" 4 X)
834 '(==cns11643-5 "R-C5-" 4 X)
835 '(==cns11643-6 "R-C6-" 4 X)
836 '(==cns11643-7 "R-C7-" 4 X)
837 '(=hanziku-1 "HZK01-" 4 X)
838 '(=hanziku-2 "HZK02-" 4 X)
839 '(=hanziku-3 "HZK03-" 4 X)
840 '(=hanziku-4 "HZK04-" 4 X)
841 '(=hanziku-5 "HZK05-" 4 X)
842 '(=hanziku-6 "HZK06-" 4 X)
843 '(=hanziku-7 "HZK07-" 4 X)
844 '(=hanziku-8 "HZK08-" 4 X)
845 '(=hanziku-9 "HZK09-" 4 X)
846 '(=hanziku-10 "HZK10-" 4 X)
847 '(=hanziku-11 "HZK11-" 4 X)
848 '(=hanziku-12 "HZK12-" 4 X)
850 '(=daikanwa "M-" 5 d)
851 coded-charset-entity-reference-alist)))
852 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
854 (goto-char (point-min))
855 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\)?CB\\([0-9]+\\);" nil t)
856 (setq code (string-to-int (match-string 2)))
858 (format "<img alt=\"CB%05d\" src=\"%s/cb-gaiji/%02d/CB%05d.gif\"
861 chise-wiki-bitmap-glyphs-url
863 www-format-char-img-style)
866 (goto-char (point-min))
867 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?J\\(78\\|83\\|90\\|97\\|SP\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
868 (setq plane (match-string 2)
869 code (string-to-int (match-string 3) 16))
871 (format "<img alt=\"J%s-%04X\" src=\"%s/JIS-%s/%02d-%02d.gif\"
874 chise-wiki-bitmap-glyphs-url
877 (- (logand code 255) 32)
878 www-format-char-img-style)
881 (goto-char (point-min))
882 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?J0-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
883 (setq code (string-to-int (match-string 2) 16))
885 (format "<img alt=\"J0-%04X\" src=\"%s/JIS-90/%02d-%02d.gif\"
888 chise-wiki-bitmap-glyphs-url
890 (- (logand code 255) 32)
891 www-format-char-img-style)
894 (goto-char (point-min))
895 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-\\(JA\\|JB\\|JC\\|JD\\|FT\\|IA\\|IB\\|HG\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
896 (setq plane (match-string 2)
897 code (string-to-int (match-string 3) 16))
899 (format "<img alt=\"HD-%s-%04X\" src=\"%s/IVD/HanyoDenshi/%s%02d%02d.png\"
902 chise-wiki-bitmap-glyphs-url
905 (- (logand code 255) 32)
906 www-format-char-img-style)
909 (goto-char (point-min))
910 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-\\(IP\\|JT\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
911 (setq plane (match-string 2)
912 code (string-to-int (match-string 3) 16))
914 (format "<img alt=\"HD-%s-%04X\" src=\"%s/IVD/HanyoDenshi/%s%04X.png\"
917 chise-wiki-bitmap-glyphs-url
919 www-format-char-img-style)
922 (goto-char (point-min))
923 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-KS-\\([0-9]+\\);" nil t)
924 (setq code (string-to-int (match-string 2)))
926 (format "<img alt=\"HD-KS%06d\" src=\"%s/IVD/HanyoDenshi/KS%06d.png\"
927 style=\"vertical-align:middle\">"
929 chise-wiki-bitmap-glyphs-url
931 www-format-char-img-style)
934 (goto-char (point-min))
935 (while (re-search-forward "&G\\([01]\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
936 (setq plane (string-to-int (match-string 1))
937 code (string-to-int (match-string 2) 16))
939 (format "<img alt=\"GB%d-%04X\" src=\"%s/GB%d/%02d-%02d.gif\"
942 chise-wiki-bitmap-glyphs-url
945 (- (logand code 255) 32)
946 www-format-char-img-style)
949 (goto-char (point-min))
950 (while (re-search-forward "&\\(R-\\)?C\\([1-7]\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
951 (setq plane (string-to-int (match-string 2))
952 code (string-to-int (match-string 3) 16))
954 (format "<img alt=\"CNS%d-%04X\" src=\"%s/CNS%d/%04X.gif\"
957 chise-wiki-bitmap-glyphs-url
959 www-format-char-img-style)
962 (goto-char (point-min))
963 (while (re-search-forward "&\\(R-\\)?JC3-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
964 (setq code (string-to-int (match-string 2) 16))
966 (format "<img alt=\"JC3-%04X\" src=\"http://kanji.zinbun.kyoto-u.ac.jp/db/CHINA3/Gaiji/%04x.gif\">"
970 (goto-char (point-min))
971 (while (re-search-forward "&\\(A-\\)?ZOB-\\([0-9]+\\);" nil t)
972 (setq code (string-to-int (match-string 2)))
974 (format "<img alt=\"ZOB-%04d\" src=\"%s/ZOB-1968/%04d.png\"
975 style=\"vertical-align:middle\">"
977 chise-wiki-bitmap-glyphs-url
979 www-format-char-img-style)
982 (goto-char (point-min))
983 (while (re-search-forward "&HNG\\([0-9]+\\)-\\([0-9][0-9][0-9][0-9]\\)\\([0-9]\\);" nil t)
984 (setq plane (match-string 1)
985 code (string-to-int (match-string 2))
986 subcode (string-to-int (match-string 3)))
990 (char-to-string (decode-char 'ascii (+ 96 subcode)))))
993 "<div class=\"tooltip\"><img alt=\"HNG%s-%04d%s\" src=\"%s/%s/%04d%s.png\" style=\"
994 vertical-align:middle; width: 48px; height: 48px\"><span
995 class=\"tooltiptext\">%s</span></div>"
997 chise-wiki-hng-bitmap-glyphs-url
1000 (car (find (format "HNG%s-" plane)
1001 coded-charset-entity-reference-alist
1002 :test (lambda (key cell)
1003 (string= key (nth 1 cell))))))
1007 (goto-char (point-min))
1008 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?AJ1-\\([0-9]+\\);" nil t)
1009 (setq code (string-to-int (match-string 2)))
1011 (format "<img alt=\"AJ1-%05d\" src=\"%s/IVD/AdobeJapan1/CID+%d.png\"
1012 style=\"vertical-align:middle\">"
1014 chise-wiki-bitmap-glyphs-url
1016 www-format-char-img-style)
1019 (goto-char (point-min))
1020 (while (re-search-forward "&\\(A-\\|o-\\|G-\\|g2-\\|R-\\)?MJ\\([0-9]+\\);" nil t)
1021 (setq code (string-to-int (match-string 2)))
1023 (format "<img alt=\"MJ%06d\" src=\"http://mojikiban.ipa.go.jp/search/MJ%06d\"
1024 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1027 www-format-char-img-style)
1030 (goto-char (point-min))
1031 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\)?IU[+-]\\([0-9A-F]+\\);" nil t)
1032 (setq code (string-to-int (match-string 2) 16))
1034 (format "<img alt=\"u%04x\" src=\"http://glyphwiki.org/glyph/u%04x.100px.png\"
1035 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1038 www-format-char-img-style)
1041 (goto-char (point-min))
1042 (while (re-search-forward "&A-compU[+-]\\([0-9A-F]+\\);" nil t)
1043 (setq code (string-to-int (match-string 1) 16))
1045 (format "<img alt=\"u%04x\" src=\"http://glyphwiki.org/glyph/u%04x.100px.png\"
1046 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1049 www-format-char-img-style)
1052 (goto-char (point-min))
1053 (while (re-search-forward
1054 "&\\(A-\\)?U-i\\([0-9]+\\)\\+\\([0-9A-F]+\\);"
1056 (setq plane (string-to-int (match-string 2))
1057 code (string-to-int (match-string 3) 16))
1059 (format "<img alt=\"u%04x-itaiji-%03d\" src=\"http://glyphwiki.org/glyph/u%04x-itaiji-%03d.100px.png\"
1060 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1065 www-format-char-img-style)
1068 (goto-char (point-min))
1069 (while (re-search-forward "&A-IWDSU\\+\\([0-9A-F]+\\);" nil t)
1070 (setq code (string-to-int (match-string 1) 16))
1072 (format "<img alt=\"A-IWDSU+%04x\" src=\"http://glyphwiki.org/glyph/u%04x.100px.png\"
1073 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1076 www-format-char-img-style)
1079 (goto-char (point-min))
1080 (while (re-search-forward "&U-v\\([0-9]+\\)\\+\\([0-9A-F]+\\);" nil t)
1081 (setq plane (string-to-int (match-string 1))
1082 code (string-to-int (match-string 2) 16))
1084 (format "<img alt=\"u%04x-itaiji-%03d\" src=\"http://glyphwiki.org/glyph/u%04x-var-%03d.100px.png\"
1085 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1090 www-format-char-img-style)
1093 (goto-char (point-min))
1094 (while (re-search-forward "&\\(A-\\|G-\\|R-\\|g2-\\)?GT-\\([0-9]+\\);" nil t)
1095 (setq code (string-to-int (match-string 2)))
1097 (format "<img alt=\"GT-%05d\" src=\"%s?char=GT-%05d\"
1100 chise-wiki-glyph-cgi-url
1102 www-format-char-img-style)
1105 (goto-char (point-min))
1106 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\)?GT-K\\([0-9]+\\);" nil t)
1107 (setq code (string-to-int (match-string 2)))
1109 (format "<img alt=\"GT-K%05d\" src=\"%s?char=GT-K%05d\"
1112 chise-wiki-glyph-cgi-url
1114 www-format-char-img-style)
1117 (goto-char (point-min))
1118 (while (re-search-forward "&B-\\([0-9A-F]+\\);" nil t)
1119 (setq code (string-to-int (match-string 1) 16))
1121 (format "<img alt=\"B-%04X\" src=\"%s?char=B-%04X\"
1124 chise-wiki-glyph-cgi-url
1126 www-format-char-img-style)
1129 (goto-char (point-min))
1130 (while (re-search-forward
1131 "&\\(A-\\|G-\\|g2-\\|R-\\)?CDP-\\([0-9A-F]+\\);" nil t)
1132 (setq code (string-to-int (match-string 2) 16))
1134 (format "<img alt=\"CDP-%04X\" src=\"%s?char=CDP-%04X\"
1137 chise-wiki-glyph-cgi-url
1139 www-format-char-img-style)
1142 (goto-char (point-min))
1143 (while (re-search-forward
1144 "&\\(I-\\)?HZK\\(0[1-9]\\|1[0-2]\\)-\\([0-9A-F]+\\);" nil t)
1145 (setq plane (match-string 2)
1146 code (string-to-int (match-string 3) 16))
1148 (format "<img alt=\"HZK%s-%04X\" src=\"%s?char=HZK%s-%04X\"
1152 chise-wiki-glyph-cgi-url
1155 www-format-char-img-style)
1158 (goto-char (point-min))
1159 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\|R-\\)?RUI6-\\([0-9A-F]+\\);" nil t)
1160 (setq code (string-to-int (match-string 2) 16))
1162 (format "<img alt=\"RUI6-%04X\" src=\"%s?char=RUI6-%04X\"
1163 style=\"vertical-align:middle\">"
1165 chise-wiki-glyph-cgi-url
1167 www-format-char-img-style)
1170 (goto-char (point-min))
1171 (while (re-search-forward "&hanaJU\\+\\([0-9A-F]+\\);" nil t)
1172 (setq code (string-to-int (match-string 1) 16))
1174 (format "<img alt=\"hanaJU+%04X\" src=\"%s?char=hana-JU+%04X\"
1175 style=\"vertical-align:middle\">"
1177 chise-wiki-glyph-cgi-url
1179 www-format-char-img-style)
1182 (goto-char (point-min))
1183 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\|R-\\)?\\(UU\\+\\|U-\\)\\([0-9A-F]+\\);" nil t)
1184 (setq code (string-to-int (match-string 3) 16))
1186 (format "<img alt=\"UU+%04X\" src=\"http://www.unicode.org/cgi-bin/refglyph?24-%04X\"
1187 style=\"vertical-align:middle\">"
1190 www-format-char-img-style)
1193 (goto-char (point-min))
1194 (while (re-search-forward "&MCS-\\([0-9A-F]+\\);" nil t)
1195 (setq code (string-to-int (match-string 1) 16))
1196 (setq start (match-beginning 0)
1198 (setq char (decode-char 'system-char-id code))
1200 ((and (setq variants
1201 (or (www-get-feature-value char '->subsumptive)
1202 (www-get-feature-value char '->denotational)))
1204 (if (characterp variants)
1205 (setq variants (list variants)))
1206 (while (and variants
1207 (setq ret (www-format-encode-string
1208 (char-to-string (car variants))))
1209 (string-match "&MCS-\\([0-9A-F]+\\);" ret))
1210 (setq variants (cdr variants)))
1212 (unless (string-match "&MCS-\\([0-9A-F]+\\);" ret)
1214 (delete-region start end)
1217 ((setq ret (or (www-get-feature-value char 'ideographic-combination)
1218 (www-get-feature-value char 'ideographic-structure)))
1223 (if (characterp (setq rret (find-char ch)))
1226 (www-format-encode-string
1227 (char-to-string ch) without-tags)
1228 (www-format-encode-string
1229 (format "%S" ch) without-tags)))
1233 (delete-region start end)
1237 ;; (goto-char (point-min))
1238 ;; (while (search-forward ">-" nil t)
1239 ;; (replace-match "&GT-" t 'literal))
;; Prepare TEXT for display as HTML: process "<" and ">", turn wiki links
;; of the form [[LABEL|TARGET]] into <a href=...> elements, encode the
;; buffer with `utf-8-mcs-er', and finally rewrite ">-" as "&GT-".
;; NOTE(review): several lines (buffer setup, the link replacement
;; arguments, and the output step) are missing from this listing.
;; NOTE(review): as shown, the "<" and ">" replacements substitute each
;; character with itself, and the last loop searches for ">-"; this looks
;; like HTML entities (&lt; / &gt; / &gt;-) lost in extraction -- verify
;; against the upstream source before relying on this text.
1242 (defun www-html-display-text (text)
1246 (goto-char (point-min))
1247 (while (search-forward "<" nil t)
1248 (replace-match "<" nil t))
1249 (goto-char (point-min))
1250 (while (search-forward ">" nil t)
1251 (replace-match ">" nil t))
1252 (goto-char (point-min))
;; Group 1 is the text before "|", group 2 the text after it.
1253 (while (re-search-forward "\\[\\[\\([^]|[]+\\)|\\([^][]+\\)\\]\\]" nil t)
1255 (format "<a href=\"%s\">%s</a>"
1259 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
1260 (goto-char (point-min))
1261 (while (search-forward ">-" nil t)
1262 (replace-match "&GT-" nil t))
;; Display TEXT as a paragraph; the text itself is emitted through
;; `www-html-display-text'.
;; NOTE(review): the surrounding output (presumably the paragraph markup)
;; is on lines missing from this listing.
1265 (defun www-html-display-paragraph (text)
1267 (www-html-display-text text)
;; Table consulted by `char-GlyphWiki-id'.
;;
;; Each entry starts with a character-feature name.  `char-GlyphWiki-id'
;; pops entries from the front of this list and looks the feature up on
;; the character with `char-feature', so entries are tried in the order
;; written here.
;; NOTE(review): the loop header of that function is not visible in this
;; listing; presumably the first feature with a non-nil value wins.
;;
;; Most entries carry four further fields.  `char-GlyphWiki-id' reads
;; the fifth element as (or (nth 4 spec) ""), i.e. nil stands for the
;; empty string, and uses it as the last argument of the template
;; "%s%%0%d%s%s".  Presumably the layout is
;;   (FEATURE PREFIX WIDTH CONVERSION SUFFIX)
;; with CONVERSION being `d' (decimal) or `x' (hexadecimal) -- TODO
;; confirm against the argument lines that this listing omits.
;;
;; The two =decomposition@... entries consist of a feature name only.
;;
;; NOTE(review): the embedded line numbers skip 1354, 1357 and 1371, so
;; some entries and the closing parentheses are missing from this view.
1274 (defvar coded-charset-GlyphWiki-id-alist
1275 '((===adobe-japan1-0 "aj1-" 5 d nil)
1276 (===adobe-japan1-1 "aj1-" 5 d nil)
1277 (===adobe-japan1-2 "aj1-" 5 d nil)
1278 (===adobe-japan1-3 "aj1-" 5 d nil)
1279 (===adobe-japan1-4 "aj1-" 5 d nil)
1280 (===adobe-japan1-5 "aj1-" 5 d nil)
1281 (===adobe-japan1-6 "aj1-" 5 d nil)
1282 (===ucs@jis "u" 4 x nil)
1283 (===daikanwa "dkw-" 5 d nil)
1284 (===ucs@ks "u" 4 x "-k")
1285 (=ucs-var-001 "u" 4 x "-var-001")
1286 (=ucs-var-002 "u" 4 x "-var-002")
1287 (=ucs-var-003 "u" 4 x "-var-003")
1288 (=ucs-itaiji-001 "u" 4 x "-itaiji-001")
1289 (=ucs-itaiji-002 "u" 4 x "-itaiji-002")
1290 (=ucs-itaiji-003 "u" 4 x "-itaiji-003")
1291 (=ucs-itaiji-084 "u" 4 x "-itaiji-084")
1292 (=>ucs-itaiji-001 "u" 4 x "-itaiji-001")
1293 (==adobe-japan1-0 "aj1-" 5 d nil)
1294 (==adobe-japan1-1 "aj1-" 5 d nil)
1295 (==adobe-japan1-2 "aj1-" 5 d nil)
1296 (==adobe-japan1-3 "aj1-" 5 d nil)
1297 (==adobe-japan1-4 "aj1-" 5 d nil)
1298 (==adobe-japan1-5 "aj1-" 5 d nil)
1299 (==adobe-japan1-6 "aj1-" 5 d nil)
1300 (==ucs@jis "u" 4 x nil)
1301 (==ucs@iso "u" 4 x nil)
1302 (==ucs@cns "u" 4 x "-t")
1303 (==ucs@unicode "u" 4 x "-us")
1304 (==daikanwa "dkw-" 5 d nil)
1305 (==ucs@ks "u" 4 x "-k")
1306 (==jis-x0208@1978 "j78-" 4 x nil)
1307 (==jis-x0208 "j90-" 4 x nil)
1308 (==jis-x0208@1990 "j90-" 4 x nil)
1309 (==jis-x0208@1983 "j83-" 4 x nil)
1310 (==cbeta "cbeta-" 5 d nil)
1311 (=>>hanyo-denshi/ks "koseki-" 6 d nil)
1312 (=>>jis-x0208@1978 "j78-" 4 x nil)
1313 (=>>big5-cdp "cdp-" 4 x nil)
1314 (=>>jis-x0208 "j90-" 4 x nil)
1315 (=>>jis-x0208@1990 "j90-" 4 x nil)
1316 (=>>jis-x0208@1983 "j83-" 4 x nil)
1317 (=>>daikanwa "dkw-" 5 d nil)
1318 (=adobe-japan1-0 "aj1-" 5 d nil)
1319 (=adobe-japan1-1 "aj1-" 5 d nil)
1320 (=adobe-japan1-2 "aj1-" 5 d nil)
1321 (=adobe-japan1-3 "aj1-" 5 d nil)
1322 (=adobe-japan1-4 "aj1-" 5 d nil)
1323 (=adobe-japan1-5 "aj1-" 5 d nil)
1324 (=adobe-japan1-6 "aj1-" 5 d nil)
1325 (=decomposition@cid)
1326 (=decomposition@hanyo-denshi)
1327 (=hanyo-denshi/ks "koseki-" 6 d nil)
1328 (=koseki "koseki-" 6 d nil)
1329 (=ucs@jis "u" 4 x nil)
1330 (=ucs@cns "u" 4 x "-t")
1331 (=ucs@ks "u" 4 x "-k")
1332 (=ucs@JP "u" 4 x nil)
1333 (=ucs@gb "u" 4 x "-g")
1334 (=ucs@iso "u" 4 x "-u")
1335 (=ucs@unicode "u" 4 x "-us")
1336 (=big5-cdp "cdp-" 4 x nil)
1337 (=>big5-cdp "cdp-" 4 x nil)
1338 (=cbeta "cbeta-" 5 d nil)
1339 (=big5-cdp-var-3 "cdp-" 4 x "-var-3")
1340 (=big5-cdp-var-5 "cdp-" 4 x "-var-5")
1341 (=jef-china3 "jc3-" 4 x nil)
1342 (=jis-x0212 "jsp-" 4 x nil)
1343 (=jis-x0213-1@2000 "jx1-2000-" 4 x nil)
1344 (=jis-x0213-1@2004 "jx1-2004-" 4 x nil)
1345 (=jis-x0213-2 "jx2-" 4 x nil)
1346 (=gt-k "gt-k" 5 d nil)
1347 (=jis-x0208@1978/1pr "j78-" 4 x nil)
1348 (=jis-x0208@1978/-4pr "j78-" 4 x nil)
1349 (=jis-x0208@1978 "j78-" 4 x nil)
1350 (=+>jis-x0208@1978 "j78-" 4 x nil)
1351 (=+>jis-x0208 "j90-" 4 x nil)
1352 (=+>jis-x0208@1990 "j90-" 4 x nil)
1353 (=+>jis-x0208@1983 "j83-" 4 x nil)
1355 (=big5 "b-" 4 x nil)
1356 (=daikanwa "dkw-" 5 d nil)
1358 (=ruimoku-v6 "rui6-" 4 x nil)
1359 (=>ruimoku-v6 "rui6-" 4 x nil)
1360 (=ks-x1001 "k0-" 4 x nil)
1361 (=cns11643-1 "c1-" 4 x nil)
1362 (=cns11643-2 "c2-" 4 x nil)
1363 (=cns11643-3 "c3-" 4 x nil)
1364 (=cns11643-4 "c4-" 4 x nil)
1365 (=cns11643-5 "c5-" 4 x nil)
1366 (=cns11643-6 "c6-" 4 x nil)
1367 (=cns11643-7 "c7-" 4 x nil)
1368 (=jis-x0208 "j90-" 4 x nil)
1369 (=jis-x0208@1990 "j90-" 4 x nil)
1370 (=jis-x0208@1983 "j83-" 4 x nil)
;; char-GlyphWiki-id CHAR
;;
;; Derives an identifier string for CHAR from the entries of
;; `coded-charset-GlyphWiki-id-alist'.  Steps visible in this listing:
;;   - `rest' is a local cursor over the table; `pop' advances only that
;;     local binding while each entry's feature (its car) is looked up
;;     on CHAR with `char-feature' and stored in `ret';
;;   - one branch maps this same function over `ret' and joins the
;;     results with "-";
;;   - one branch, guarded by a `memq' on the entry's feature name,
;;     probes legacy charsets with `encode-char' and picks a "uXXXX"
;;     form with a charset-specific suffix;
;;   - otherwise the identifier comes from a template assembled out of
;;     the entry itself.
;;
;; NOTE(review): the embedded line numbers skip 1375-1376, 1379-1381,
;; 1384, 1391, 1396, 1406, 1410, 1412-1414 and 1416-1421.  The local
;; variable list, the loop and conditional heads, and most `format'
;; arguments are therefore not visible; confirm the exact nesting
;; against the full file before changing anything here.
1373 (defun char-GlyphWiki-id (char)
1374 (let ((rest coded-charset-GlyphWiki-id-alist)
;; Take the next table entry and fetch its feature value for CHAR; the
;; `null' test is true while the feature is absent.
1377 (setq spec (pop rest))
1378 (null (setq ret (char-feature char (car spec))))))
;; Recursive case: every element of `ret' is converted by this function
;; and the pieces are joined with "-".  The guard for this branch is on
;; a line this listing omits.
1382 (mapconcat #'char-GlyphWiki-id ret "-"))
;; NOTE(review): the inner quote is read as part of the data, so the
;; list is (=ucs@unicode (quote =ucs@iso)).  `memq' therefore matches
;; only =ucs@unicode here; if =ucs@iso was meant to match as well, the
;; second quote should be dropped.
1383 (and (memq (car spec) '(=ucs@unicode '=ucs@iso))
;; CHAR is encodable in at least one of the listed JIS charsets and
;; has a code in =ucs@jis: "u" + hex code, no suffix.
1385 ((and (or (encode-char char '=jis-x0208@1990)
1386 (encode-char char '=jis-x0212)
1387 (encode-char char '=jis-x0213-1)
1388 (encode-char char '=jis-x0213-2))
1389 (setq code (encode-char char '=ucs@jis)))
1390 (format "u%04x" code)
;; Same test for the GB charsets with =ucs@gb: suffix "-g".
1392 ((and (or (encode-char char '=gb2312)
1393 (encode-char char '=gb12345))
1394 (setq code (encode-char char '=ucs@gb)))
1395 (format "u%04x-g" code)
;; Same test for CNS 11643 planes 1-7 with =ucs@cns: suffix "-t".
1397 ((and (or (encode-char char '=cns11643-1)
1398 (encode-char char '=cns11643-2)
1399 (encode-char char '=cns11643-3)
1400 (encode-char char '=cns11643-4)
1401 (encode-char char '=cns11643-5)
1402 (encode-char char '=cns11643-6)
1403 (encode-char char '=cns11643-7))
1404 (setq code (encode-char char '=ucs@cns)))
1405 (format "u%04x-t" code)
;; Same test for KS X 1001 with =ucs@ks: suffix "-k".
1407 ((and (encode-char char '=ks-x1001)
1408 (setq code (encode-char char '=ucs@ks)))
1409 (format "u%04x-k" code)
;; Two-stage formatting: the inner `format' produces a format string
;; in which "%%" becomes a literal "%", giving one zero-padded numeric
;; directive between two strings; the outer `format' then applies it.
;; The first three inner arguments and the value being formatted are on
;; lines this listing omits (presumably further fields of `spec' and
;; `ret' -- TODO confirm).
1411 (format (format "%s%%0%d%s%s"
;; Fifth field of the entry; nil is treated as an empty string.
1415 (or (nth 4 spec) ""))
1422 (provide 'cwiki-common)
1424 ;;; cwiki-common.el ends here