1 ;; -*- coding: utf-8-mcs-er -*-
2 (require 'char-db-util)
3 ;; (require 'concord-images)
;; Use the coding system named on this file's first line for file names.
(setq file-name-coding-system 'utf-8-mcs-er)

;; Attach each Concord genre to the database directory that holds it.
;; The calls are issued in the same order as before; genres that share a
;; directory are simply listed together.
(concord-assign-genre 'image-resource "/usr/local/var/photo/db")

(dolist (genre '(creator@ruimoku
		 person-name@ruimoku
		 journal-volume@ruimoku
		 article@ruimoku
		 book@ruimoku
		 classification@ruimoku
		 region@ruimoku
		 era@ruimoku
		 period@ruimoku
		 journal@ruimoku
		 journal-name@ruimoku
		 publisher@ruimoku
		 publisher-name@ruimoku))
  (concord-assign-genre genre "/usr/local/var/ruimoku/db"))

(mount-char-attribute-table '*instance@ruimoku/bibliography/title)
;; (mount-char-attribute-table '*instance@ruimoku/bibliography/content*note)

(dolist (genre '(entry@zh-classical
		 ;; morpheme-entry@zh-classical   (disabled)
		 word-class@zh-classical
		 morpheme@zh-classical
		 sentence@zh-classical
		 ;; sentence-entry@zh-classical   (disabled)
		 ))
  (concord-assign-genre genre "/usr/local/var/kanbun/db"))

;; Character attribute tables that must be mounted before use.
(dolist (feature '(*instance@morpheme-entry/zh-classical
		   ->HNG
		   <-HNG))
  (mount-char-attribute-table feature))
(defvar est-hide-cgi-mode nil
  "Non-nil selects path-style URLs instead of CGI query-string URLs.
The URL builders and the object encoder/decoder in this file branch on
this flag.")

(defvar est-view-url-prefix ".."
  "Prefix string for view URLs; the default is the parent directory.
NOTE(review): no use of this variable is visible in this part of the
file -- confirm its callers.")

(defvar chise-wiki-view-url "view.cgi"
  "Name of the view CGI.
`www-uri-make-feature-name-url' puts it in front of the query string
when `est-hide-cgi-mode' is nil.")

(defvar chise-wiki-edit-url "edit.cgi"
  "Name of the edit CGI.
NOTE(review): no use of this variable is visible in this part of the
file -- confirm its callers.")

(defvar chise-wiki-bitmap-glyphs-url
  "http://www.chise.org/glyphs"
  "Base URL of the bitmap glyph images.
`www-format-encode-string' passes it to the <img> templates it fills.")

(defvar chise-wiki-hng-bitmap-glyphs-url
  "http://hng.chise.org/glyphs/HNG"
  "Base URL of the HNG glyph images.
`www-format-encode-string' passes it to the HNG <img> template.")

(defvar chise-wiki-glyph-cgi-url
  "http://www.chise.org/chisewiki/glyph.cgi"
  "URL of the glyph CGI.
`www-format-encode-string' uses it as an image source followed by a
`?char=' query.")

(defvar chise-wiki-displayed-features nil
  "Initially nil.
NOTE(review): the purpose of this variable is not visible in this part
of the file -- confirm against its users.")
;; Coded character sets in order of preference.  `www-uri-encode-object'
;; copies this list, takes entries off the front with `pop', and asks
;; `encode-char' (with `defined-only') for the object's code point in
;; each of them.
;; NOTE(review): the embedded listing numbers are non-contiguous inside
;; this form (e.g. 59 -> 61, 64 -> 69), so the opening of the list, some
;; entries and the closing parentheses are not present in this copy --
;; verify against the upstream file.
59 (defvar est-coded-charset-priority-list
61 =cns11643-1 =cns11643-2 =cns11643-3
62 =cns11643-4 =cns11643-5 =cns11643-6 =cns11643-7
64 =jis-x0208 =jis-x0208@1990
69 =jis-x0213-1@2000 =jis-x0213-1@2004
70 =jis-x0208@1983 =jis-x0208@1978
71 =zinbun-oracle =>zinbun-oracle
75 =>>>jis-x0208 =>>>jis-x0213-1 =>>>jis-x0213-2
76 =>>jis-x0208 =>>jis-x0213-1 =>>jis-x0213-2
78 =+>jis-x0208 =+>jis-x0213-1 =+>jis-x0213-2
81 =>jis-x0208 =>jis-x0213-1
83 =>ucs@iso =>ucs@unicode
84 =>ucs@jis =>ucs@cns =>ucs@ks
85 =>>ucs@iso =>>ucs@unicode
86 =>>ucs@jis =>>ucs@cns =>>ucs@ks
87 =>>>ucs@iso =>>>ucs@unicode
88 =>>>ucs@jis =>>>ucs@cns =>>>ucs@ks
;; Decode the %XX escapes of STRING and return the result of
;; `decode-coding-string' on the rebuilt text.  The work is done only
;; when STRING is non-empty.
;; CODING-SYSTEM is optional; presumably it is the coding system handed
;; to `decode-coding-string' -- TODO confirm, the argument lines are not
;; present in this copy (the embedded listing numbers skip).
107 (defun decode-uri-string (string &optional coding-system)
108 (if (> (length string) 0)
112 (mapconcat (lambda (char)
115 (char-to-string char)))
;; Each %XX is located starting at index i.  The pattern lists only
;; upper-case hex digits, so lower-case escapes match only while
;; `case-fold-search' is non-nil.
117 (while (string-match "%\\([0-9A-F][0-9A-F]\\)" string i)
;; Append the literal text that precedes the escape ...
118 (setq dest (concat dest
119 (substring string i (match-beginning 0))
;; ... and the two hex digits read as a base-16 number.
122 (string-to-int (match-string 1 string) 16))))
;; Whatever follows the last escape is appended before decoding.
124 (decode-coding-string
125 (concat dest (substring string i))
;; Return the type of FEATURE-NAME: its `type' feature property when one
;; is set, otherwise a value chosen from the spelling of its name.
;; NOTE(review): the value returned by each `string-match' clause is on
;; lines missing from this copy (the embedded listing numbers skip);
;; only the patterns are visible.
128 (defun www-feature-type (feature-name)
129 (or (char-feature-property feature-name 'type)
130 (let ((str (symbol-name feature-name)))
;; Name ends in "*note", optionally followed by an "@..." part.
132 ((string-match "\\*note\\(@[^*]+\\)?$" str)
;; Name ends in "*sources", optionally followed by an "@..." part.
134 ((string-match "\\*sources\\(@[^*]+\\)?$" str)
;; Any other name that contains "*".
136 ((string-match "\\*" str)
;; Name starts with "->" or "<-".
138 ((string-match "^\\(->\\|<-\\)" str)
;; Name is "ideographic-structure", bare or followed by "@".
140 ((string-match "^ideographic-structure\\(@\\|$\\)" str)
;; Return the presentation format for FEATURE-NAME.  Tried in order: the
;; feature's own `presentation-format' property, its `format' property,
;; then a walk up the chain given by `char-feature-name-parent', and
;; finally the default ((name) " : " (value)).
;; NOTE(review): parts of the parent walk are on lines missing from this
;; copy (the embedded listing numbers skip).
144 (defun www-feature-format (feature-name)
145 (or (char-feature-property feature-name 'presentation-format)
146 (char-feature-property feature-name 'format)
148 (setq fn feature-name)
149 (while (and (setq parent (char-feature-name-parent fn))
151 (char-feature-property
155 '((name) " : " (value))))
;; Return the value presentation format for FEATURE-NAME.  Tried in
;; order: the feature's own `value-presentation-format' and
;; `value-format' properties, the same two properties on the parents
;; given by `char-feature-name-parent', a choice based on
;; `www-feature-type', and a code-point layout when FEATURE-NAME names a
;; charset.
;; NOTE(review): several lines of this form are missing from this copy
;; (the embedded listing numbers skip), including the value used for the
;; `relation' type and the start of the 94x94 layout.
157 (defun www-feature-value-format (feature-name)
158 (or (char-feature-property feature-name 'value-presentation-format)
159 (char-feature-property feature-name 'value-format)
161 (setq fn feature-name)
162 (while (and (setq parent (char-feature-name-parent fn))
164 (or (char-feature-property
165 parent 'value-presentation-format)
166 (char-feature-property
167 parent 'value-format)))))
170 (let ((type (www-feature-type feature-name)))
171 (cond ((eq type 'relation)
173 ((eq type 'structure)
174 'space-separated-ids)
;; Charset features: a two-dimensional charset with 94 characters per
;; dimension gets a layout that also includes (ku-ten); every other
;; charset gets hexadecimal and decimal only.
178 (if (find-charset feature-name)
179 (if (and (= (charset-dimension feature-name) 2)
180 (= (charset-chars feature-name) 94))
182 " (" (decimal) ") <" (ku-ten) "> " (prev-char) (next-char))
183 '("0x" (HEX) " (" (decimal) ") " (prev-char) (next-char))))
;; Return the symbol naming FEATURE-NAME within DOMAIN.
;; When the name already ends in an "@..." part that contains no "*",
;; DOMAIN is appended after "/"; another branch joins the name and
;; DOMAIN with "@".
;; NOTE(review): the condition guarding the "@" branch and the rest of
;; the `cond' are on lines missing from this copy (the embedded listing
;; numbers skip).
186 (defun char-feature-name-at-domain (feature-name domain)
188 (let ((name (symbol-name feature-name)))
190 ((string-match "@[^*]+$" name)
191 (intern (format "%s/%s" name domain))
194 (intern (format "%s@%s" name domain))
(defun char-feature-name-parent (feature-name)
  "Return the feature one domain level above FEATURE-NAME, or nil.
The trailing domain of a feature name has the shape \"@A/B/C\".  The
parent drops the last \"/\" component, or the whole \"@A\" part when it
has a single component.  Names without a trailing domain give nil."
  (let* ((full-name (symbol-name feature-name))
	 (domain-start
	  (string-match "@[^@/*]+\\(/[^@/*]+\\)*$" full-name)))
    (when domain-start
      ;; Group 1 records the last "/component" when there is one;
      ;; otherwise cut at the "@" itself.
      (intern (substring full-name 0
			 (or (match-beginning 1) domain-start))))))
(defun char-feature-name-domain (feature-name)
  "Return the trailing domain of FEATURE-NAME as a symbol, or nil.
The domain is everything after the \"@\" that starts the trailing
\"@A/B/...\" part of the name.  Names without such a part give nil."
  (let* ((full-name (symbol-name feature-name))
	 (at-pos (string-match "@[^@/*]+\\(/[^@/*]+\\)*$" full-name)))
    (and at-pos
	 ;; Skip the "@" itself.
	 (intern (substring full-name (1+ at-pos))))))
;; When the name of FEATURE ends in "@$rev=latest" or "/$rev=latest",
;; return the symbol for the name without that suffix.
;; NOTE(review): the else branch and the closing parentheses are not
;; present in this copy (the embedded listing numbers jump from 211 to
;; 214); presumably FEATURE is returned unchanged -- confirm upstream.
208 (defun char-feature-name-sans-versions (feature)
209 (let ((feature-name (symbol-name feature)))
210 (if (string-match "[@/]\\$rev=latest$" feature-name)
211 (intern (substring feature-name 0 (match-beginning 0)))
(defun est-object-genre (object)
  "Return the genre symbol of OBJECT.
A character is reported as `character', the genre name that
`www-uri-decode-object' tests for.  Any other OBJECT is handed to
`concord-object-genre'."
  (if (characterp object)
      ;; Characters are not Concord objects, so answer directly instead
      ;; of passing them to `concord-object-genre'.
      'character
    (concord-object-genre object)))
;; Return the value of FEATURE for OBJECT, preferring the value stored
;; under the "$rev=latest" variant of the feature name (built with
;; `char-feature-name-at-domain').
;; Two access paths are visible: `char-feature' after mounting the
;; latest-revision table, and `concord-object-get', whose
;; latest-revision lookup is wrapped in `condition-case'.
;; NOTE(review): the test that chooses between the two paths and the
;; `condition-case' handler are on lines missing from this copy (the
;; embedded listing numbers skip).
219 (defun www-get-feature-value (object feature)
220 (let ((latest-feature (char-feature-name-at-domain feature '$rev=latest)))
223 (mount-char-attribute-table latest-feature)
224 (or (char-feature object latest-feature)
225 (char-feature object feature))
228 (or (condition-case nil
229 (concord-object-get object latest-feature)
232 (concord-object-get object feature)
;; Compute the code point that precedes CODE in coded charset CCS,
;; working on the individual bytes of CODE.
;; NOTE(review): the lines that derive mask, byte-min and byte-max from
;; the charset, the loop headers and the return value are missing from
;; this copy (the embedded listing numbers jump from 240 to 263).
236 (defun get-previous-code-point (ccs code)
237 (let ((chars (charset-chars ccs))
238 (dim (charset-dimension ccs))
240 mask byte-min byte-max
;; One vector slot per charset dimension; slot i receives bits 8*i and
;; up of CODE after masking, so slot 0 is the lowest byte.
263 (setq bytes (make-vector dim 0))
265 (aset bytes i (logand (lsh code (* i -8)) mask))
;; Decrement a byte; when it drops below byte-min it is reset to
;; byte-max.
268 (while (and (< i dim)
270 (aset bytes i (1- (aref bytes i)))
271 (< (aref bytes i) byte-min)))
272 (aset bytes i byte-max)
;; Reassemble the bytes into one integer, slot i shifted left by 8*i.
275 (setq dest (aref bytes 0)
278 (setq dest (logior dest (lsh (aref bytes i) (* i 8)))
;; Compute the code point that follows CODE in coded charset CCS,
;; working on the individual bytes of CODE.
;; NOTE(review): the lines that derive mask, byte-min and byte-max from
;; the charset, the loop headers and the return value are missing from
;; this copy (the embedded listing numbers jump from 286 to 309).
282 (defun get-next-code-point (ccs code)
283 (let ((chars (charset-chars ccs))
284 (dim (charset-dimension ccs))
286 mask byte-min byte-max
;; One vector slot per charset dimension; slot i receives bits 8*i and
;; up of CODE after masking, so slot 0 is the lowest byte.
309 (setq bytes (make-vector dim 0))
311 (aset bytes i (logand (lsh code (* i -8)) mask))
;; Increment a byte; when it exceeds byte-max it is reset to byte-min.
314 (while (and (< i dim)
316 (aset bytes i (1+ (aref bytes i)))
317 (> (aref bytes i) byte-max)))
318 (aset bytes i byte-min)
;; Reassemble the bytes into one integer, slot i shifted left by 8*i.
321 (setq dest (aref bytes 0)
324 (setq dest (logior dest (lsh (aref bytes i) (* i 8)))
;; Search backwards from CODE in CCS, one `get-previous-code-point' step
;; at a time, for a code point that `decode-char' can decode.
;; =jis-x0208 is searched as =jis-x0208@1990 and =jis-x0213-1 as
;; =jis-x0213-1@2004.
;; NOTE(review): the loop bounds, the extra argument passed to
;; `decode-char' for charsets other than =ucs, and the return value are
;; on lines missing from this copy (the embedded listing numbers skip).
328 (defun find-previous-defined-code-point (ccs code)
329 (let ((i (get-previous-code-point ccs code))
332 ((eq ccs '=jis-x0208)
333 (setq ccs '=jis-x0208@1990))
334 ((eq ccs '=jis-x0213-1)
335 (setq ccs '=jis-x0213-1@2004)))
338 (null (setq char (decode-char ccs i
339 (unless (eq ccs '=ucs)
341 (setq i (get-previous-code-point ccs i)))
;; Search forwards from CODE in CCS, one `get-next-code-point' step at a
;; time, for a code point that `decode-char' can decode.
;; =jis-x0208 is searched as =jis-x0208@1990 and =jis-x0213-1 as
;; =jis-x0213-1@2004.
;; NOTE(review): the loop condition (including how `max' is used), the
;; extra argument passed to `decode-char' for charsets other than =ucs,
;; and the return value are on lines missing from this copy (the
;; embedded listing numbers skip).
344 (defun find-next-defined-code-point (ccs code)
345 (let ((i (get-next-code-point ccs code))
;; `max' is set 1000 code values above the starting CODE.
347 (setq max (+ code 1000))
349 ((eq ccs '=jis-x0208)
350 (setq ccs '=jis-x0208@1990))
351 ((eq ccs '=jis-x0213-1)
352 (setq ccs '=jis-x0213-1@2004)))
355 (null (setq char (decode-char ccs i
356 (unless (eq ccs '=ucs)
358 (setq i (get-next-code-point ccs i)))
362 ;;; @ URI representation
;; Decode the "." escapes of URI-FEATURE, scanning it by index.
;; A "." that has another "." two positions later starts a
;; three-character escape; a character that needs no decoding is copied
;; through `char-to-string'.
;; NOTE(review): the mapping from escape letters to characters and the
;; loop itself are on lines missing from this copy (the embedded listing
;; numbers skip), so the exact escape alphabet cannot be stated here.
365 (defun est-uri-decode-feature-name-body (uri-feature)
366 (let ((len (length uri-feature))
373 (if (eq (aref uri-feature i) ?\.)
;; Bounds check before looking at the character two positions on.
374 (if (and (< (+ i 2) len)
375 (eq (aref uri-feature (+ i 2)) ?\.))
378 ((eq (setq ch (aref uri-feature (1+ i))) ?\.)
383 (substring uri-feature i (+ i 3))
389 (char-to-string (aref uri-feature i))
;; Encode FEATURE character by character with `mapconcat'; characters
;; that reach the default clause are emitted unchanged.
;; NOTE(review): the clauses that escape special characters and the
;; remaining `mapconcat' arguments are on lines missing from this copy
;; (the embedded listing numbers skip).
393 (defun est-uri-encode-feature-name-body (feature)
394 (mapconcat (lambda (c)
399 (t (char-to-string c))))
;; Turn the URI spelling URI-FEATURE into a feature-name symbol.
;; URI-FEATURE is first passed through `decode-uri-string' with
;; utf-8-mcs-er.  A leading keyword is then replaced by the matching
;; feature-name prefix and the remainder is decoded with
;; `est-uri-decode-feature-name-body':
;;   from.   gives  <-        to.            gives  ->
;;   rep.    gives  =         rep2. / repi.  gives  ===
;;   g.      gives  =>>       g2. / gi.      gives  ==
;;   o.      gives  =+>       a.             gives  =>
;;   giN. and aN. build the prefix with `make-string' from the number N.
;; Without a keyword, the decoded name is tried with the prefixes "=>",
;; "=>>", "=>>>" and "=" in that order, testing each with
;; `find-charset'; the final fallback interns the decoded name as is.
;; NOTE(review): the character given to `make-string' and the values
;; returned by the `find-charset' clauses are on lines missing from this
;; copy (the embedded listing numbers skip).
402 (defun www-uri-decode-feature-name (uri-feature)
404 (setq uri-feature (decode-uri-string uri-feature 'utf-8-mcs-er))
406 ((string-match "^from\\." uri-feature)
407 (intern (format "<-%s"
408 (est-uri-decode-feature-name-body
409 (substring uri-feature (match-end 0)))))
411 ((string-match "^to\\." uri-feature)
412 (intern (format "->%s"
413 (est-uri-decode-feature-name-body
414 (substring uri-feature (match-end 0)))))
416 ((string-match "^rep\\." uri-feature)
417 (intern (format "=%s"
418 (est-uri-decode-feature-name-body
419 (substring uri-feature (match-end 0)))))
421 ((string-match "^rep[2i]\\." uri-feature)
422 (intern (format "===%s"
423 (est-uri-decode-feature-name-body
424 (substring uri-feature (match-end 0)))))
426 ((string-match "^g\\." uri-feature)
427 (intern (format "=>>%s"
428 (est-uri-decode-feature-name-body
429 (substring uri-feature (match-end 0)))))
431 ((string-match "^g[i2]\\." uri-feature)
432 (intern (format "==%s"
433 (est-uri-decode-feature-name-body
434 (substring uri-feature (match-end 0)))))
436 ((string-match "^gi\\([0-9]+\\)\\." uri-feature)
437 (intern (format "=>>%s%s"
438 (make-string (string-to-int
439 (match-string 1 uri-feature))
441 (est-uri-decode-feature-name-body
442 (substring uri-feature (match-end 0)))))
444 ((string-match "^o\\." uri-feature)
445 (intern (format "=+>%s"
446 (est-uri-decode-feature-name-body
447 (substring uri-feature (match-end 0)))))
449 ((string-match "^a\\." uri-feature)
450 (intern (format "=>%s"
451 (est-uri-decode-feature-name-body
452 (substring uri-feature (match-end 0)))))
454 ((string-match "^a\\([0-9]+\\)\\." uri-feature)
455 (intern (format "%s>%s"
456 (make-string (string-to-int
457 (match-string 1 uri-feature))
459 (est-uri-decode-feature-name-body
460 (substring uri-feature (match-end 0)))))
;; No keyword: from here on uri-feature holds the decoded body.
462 ((and (setq uri-feature (est-uri-decode-feature-name-body uri-feature))
463 (setq feature (intern (format "=>%s" uri-feature)))
464 (find-charset feature))
466 ((and (setq feature (intern (format "=>>%s" uri-feature)))
467 (find-charset feature))
469 ((and (setq feature (intern (format "=>>>%s" uri-feature)))
470 (find-charset feature))
472 ((and (setq feature (intern (format "=%s" uri-feature)))
473 (find-charset feature))
475 (t (intern uri-feature)))))
;; Turn the feature-name symbol FEATURE-NAME into its URI spelling.
;; The name is matched against its leading prefix ("=+>", "=", "==",
;; "===", "=>>", "=>>>", "=>>" followed by more ">", "=>", one or more
;; "=" followed by ">", "->" and "<-"); the part after the prefix is
;; encoded with `est-uri-encode-feature-name-body'.  A name with none of
;; these prefixes is encoded whole.
;; NOTE(review): the output template of every clause is on lines missing
;; from this copy (the embedded listing numbers skip), so the keyword
;; emitted for each prefix is not visible here; presumably it mirrors
;; `www-uri-decode-feature-name' -- confirm upstream.
477 (defun www-uri-encode-feature-name (feature-name)
478 (setq feature-name (symbol-name feature-name))
480 ((string-match "^=\\+>\\([^=>]+\\)" feature-name)
482 (est-uri-encode-feature-name-body
483 (substring feature-name (match-beginning 1))))
485 ((string-match "^=\\([^=>]+\\)" feature-name)
487 (est-uri-encode-feature-name-body
488 (substring feature-name (match-beginning 1))))
490 ((string-match "^==\\([^=>]+\\)" feature-name)
492 (est-uri-encode-feature-name-body
493 (substring feature-name (match-beginning 1))))
495 ((string-match "^===\\([^=>]+\\)" feature-name)
497 (est-uri-encode-feature-name-body
498 (substring feature-name (match-beginning 1))))
500 ((string-match "^=>>\\([^=>]+\\)" feature-name)
502 (est-uri-encode-feature-name-body
503 (substring feature-name (match-beginning 1))))
505 ((string-match "^=>>>\\([^=>]+\\)" feature-name)
507 (est-uri-encode-feature-name-body
508 (substring feature-name (match-beginning 1))))
;; "=>>" followed by further ">" characters: the number of extra ">" is
;; passed to the template.
510 ((string-match "^=>>\\(>+\\)" feature-name)
512 (length (match-string 1 feature-name))
513 (est-uri-encode-feature-name-body
514 (substring feature-name (match-end 1))))
516 ((string-match "^=>\\([^=>]+\\)" feature-name)
518 (est-uri-encode-feature-name-body
519 (substring feature-name (match-beginning 1))))
;; One or more "=" followed by ">": the number of "=" is passed to the
;; template.
521 ((string-match "^\\(=+\\)>" feature-name)
523 (length (match-string 1 feature-name))
524 (est-uri-encode-feature-name-body
525 (substring feature-name (match-end 0))))
527 ((string-match "^->" feature-name)
529 (est-uri-encode-feature-name-body
530 (substring feature-name (match-end 0))))
532 ((string-match "^<-" feature-name)
534 (est-uri-encode-feature-name-body
535 (substring feature-name (match-end 0))))
537 (t (est-uri-encode-feature-name-body feature-name))))
(defun www-uri-make-feature-name-url (uri-genre uri-feature-name uri-object)
  "Return the URL of the page for one feature of one object.
URI-GENRE, URI-FEATURE-NAME and URI-OBJECT are inserted as given, so
they are expected to be URI-encoded already.  With `est-hide-cgi-mode'
non-nil the result is a relative path below \"../feature/\"; otherwise
it is a query string appended to `chise-wiki-view-url'."
  (cond
   (est-hide-cgi-mode
    (format "../feature/%s&%s/%s"
	    uri-feature-name uri-genre uri-object))
   (t
    (format "%s?feature=%s&%s=%s"
	    chise-wiki-view-url uri-feature-name uri-genre uri-object))))
;; Decode the URI text CHAR-REP into an object of genre GENRE.
;; Form 1, "CCS<sep>CODE": the separator is ":" (or its escape %3A), and
;; in `est-hide-cgi-mode' also "=" (or %3D).  CCS is decoded with
;; `www-uri-decode-feature-name'; CODE is read as hexadecimal when it
;; starts with "0x" and otherwise through `read-from-string'.  The pair
;; is then resolved with `decode-char' or `concord-decode-object'.
;; Form 2, no separator: CHAR-REP is passed through `decode-uri-string'
;; and resolved by genre; the visible clauses use `concord-decode-object'
;; with the `=id' feature.
;; NOTE(review): parts of the conditions (for example the second test
;; next to `(eq genre 'character)') and the value returned for a
;; one-character CHAR-REP are on lines missing from this copy (the
;; embedded listing numbers skip).
546 (defun www-uri-decode-object (genre char-rep)
549 ((string-match (if est-hide-cgi-mode
550 "\\(%3D\\|=\\|%3A\\|:\\)"
551 "\\(%3A\\|:\\)") char-rep)
;; Text before the separator names the charset, text after it the code.
552 (setq ccs (substring char-rep 0 (match-beginning 0))
553 cpos (substring char-rep (match-end 0)))
554 (setq ccs (www-uri-decode-feature-name ccs))
555 (setq cpos (est-uri-decode-feature-name-body cpos))
557 ((string-match "^0x" cpos)
559 (string-to-number (substring cpos (match-end 0)) 16))
562 (setq cpos (car (read-from-string
564 cpos file-name-coding-system))))
566 (if (and (eq genre 'character)
568 (decode-char ccs cpos)
569 (concord-decode-object ccs cpos genre))
572 (setq char-rep (decode-uri-string char-rep 'utf-8-mcs-er))
574 ((eq genre 'character)
575 (when (= (length char-rep) 1)
579 (concord-decode-object
580 '=id (www-uri-decode-feature-name char-rep) 'feature)
583 (concord-decode-object
584 '=id (car (read-from-string char-rep)) genre)
;; Return the URI text that identifies OBJECT.
;; Characters: one that `encode-char' can encode in =ucs is written as
;; percent-escaped bytes of its utf-8-mcs-er encoding.  Otherwise the
;; charsets of `est-coded-charset-priority-list' are tried with
;; `encode-char' and `defined-only', then the charset reported by
;; `split-char', and finally `system-char-id', giving a "CCS<sep>CODE"
;; text whose template depends on `est-hide-cgi-mode'.
;; Other objects: the template is filled from `concord-object-id',
;; formatted with "%s" and passed through
;; `est-uri-encode-feature-name-body'.
;; NOTE(review): most templates and several loop/cond lines are missing
;; from this copy (the embedded listing numbers skip); only the
;; system-char-id templates are visible in full.
587 (defun www-uri-encode-object (object)
588 (if (characterp object)
589 (if (encode-char object '=ucs)
592 (format "%%%02X" byte))
593 (encode-coding-string (char-to-string object) 'utf-8-mcs-er)
595 (let ((ccs-list est-coded-charset-priority-list)
598 (setq ccs (pop ccs-list))
599 (not (setq ret (encode-char object ccs 'defined-only)))))
601 (format (if est-hide-cgi-mode
604 (www-uri-encode-feature-name ccs)
606 ((and (setq ccs (car (split-char object)))
607 (setq ret (encode-char object ccs)))
608 (format (if est-hide-cgi-mode
611 (www-uri-encode-feature-name ccs)
;; Last resort for characters: "=" separates name and code in
;; hide-cgi mode, ":" otherwise.
614 (format (if est-hide-cgi-mode
615 "system-char-id=0x%X"
616 "system-char-id:0x%X")
617 (encode-char object 'system-char-id))
619 (format (if est-hide-cgi-mode
622 (est-uri-encode-feature-name-body
623 (format "%s" (concord-object-id object))))))
;; Return a display string for OBJECT.
;; A character is returned as a one-character string.  For other
;; objects `ret' is bound to: when READABLE is non-nil, the first
;; non-nil of the object's `name', `=name' and `title' features;
;; otherwise, or when all three are nil, `concord-object-id'.
;; NOTE(review): the body of the `let' that turns `ret' into the result
;; is on lines missing from this copy (the embedded listing numbers jump
;; from 632 to 635).
625 (defun est-format-object (object &optional readable)
626 (if (characterp object)
627 (char-to-string object)
628 (let ((ret (or (if readable
629 (or (concord-object-get object 'name)
630 (concord-object-get object '=name)
631 (concord-object-get object 'title)))
632 (concord-object-id object))))
;; Return the URL of the page for OBJECT, in path style or CGI style
;; depending on `est-hide-cgi-mode'.  Both branches use
;; `est-object-genre' for the genre part and `www-uri-encode-object' for
;; the object part.
;; URI-OBJECT is optional; presumably it is an already encoded object
;; text that takes the place of `www-uri-encode-object' -- TODO confirm.
;; NOTE(review): the `format' templates and the use of URI-OBJECT are on
;; lines missing from this copy (the embedded listing numbers skip).
635 (defun www-uri-make-object-url (object &optional uri-object)
636 (if est-hide-cgi-mode
639 (est-object-genre object)
641 (www-uri-encode-object object)))
644 (est-object-genre object)
646 (www-uri-encode-object object)))))
649 ;;; @ Feature name presentation
;; Default presentation of FEATURE-NAME, derived from its symbol name.
;; NOTE(review): everything applied to the symbol name is on lines
;; missing from this copy (the embedded listing numbers jump from 652 to
;; 656 and from 656 to 660).
652 (defun www-format-feature-name-default (feature-name)
656 (symbol-name feature-name)
;; Present a metadata feature name such as BASE*META.
;; The name is split at its last "*": the part before it is formatted
;; with `www-format-feature-name*' (passing LANG) and joined to more
;; text with `concat'; a name that does not match falls back to
;; `www-format-feature-name-default'.
;; NOTE(review): what is concatenated after the formatted base, and the
;; other bindings of the `let', are on lines missing from this copy (the
;; embedded listing numbers skip).
660 (defun www-format-feature-name-as-metadata (feature-name &optional lang)
661 (let ((str (symbol-name feature-name))
664 ((string-match "\\*[^*]+$" str)
;; base is the text before the last "*"; meta starts at that "*".
665 (setq base (substring str 0 (match-beginning 0))
666 meta (substring str (match-beginning 0)))
667 (concat (www-format-feature-name* (intern base) lang)
670 (www-format-feature-name-default feature-name)
(defun www-format-feature-name-as-rel-to (feature-name)
  "Return FEATURE-NAME's name with its first two characters replaced.
The replacement is the single character U+2192 (rightwards arrow).
`www-format-feature-name*' calls this for names that start with \"->\"."
  (let ((tail (substring (symbol-name feature-name) 2)))
    (concat "\u2192" tail)))
(defun www-format-feature-name-as-rel-from (feature-name)
  "Return FEATURE-NAME's name with its first two characters replaced.
The replacement is the single character U+2190 (leftwards arrow).
`www-format-feature-name*' calls this for names that start with \"<-\"."
  (let ((tail (substring (symbol-name feature-name) 2)))
    (concat "\u2190" tail)))
;; Present the coded-charset feature FEATURE-NAME in a readable form.
;; The symbol name is broken into parts held in `rest'.  The first part
;; is upcased and text is inserted after its leading "=" / ">" prefix;
;; further parts are upcased and joined with spaces, except that a final
;; part made only of digits is joined with "-" and left as is.
;; NOTE(review): how the name is split, what is inserted after the
;; prefix and the loop condition are on lines missing from this copy
;; (the embedded listing numbers skip).
679 (defun www-format-feature-name-as-CCS (feature-name)
682 (symbol-name feature-name)
684 (dest (upcase (pop rest))))
685 (when (string-match "^=+>*" dest)
686 (setq dest (concat (substring dest 0 (match-end 0))
688 (substring dest (match-end 0)))))
692 (setq dest (concat dest " " (upcase (pop rest)))))
693 (if (string-match "^[0-9]+$" (car rest))
694 (concat dest "-" (car rest))
695 (concat dest " " (upcase (car rest))))
;; Return the display name of FEATURE-NAME, optionally for language
;; LANG, without HTML encoding.  Visible sources, in `cond' order:
;;   1. the feature's "name@LANG" property or its `name' property;
;;   2. names containing "*": `www-format-feature-name-as-metadata';
;;   3. a name property found on a parent (via
;;      `char-feature-name-parent'), followed by the part of the
;;      feature's name that extends beyond the parent's name;
;;   4. charset names: `www-format-feature-name-as-CCS';
;;   5. names starting with "->" or "<-": the rel-to / rel-from forms;
;;   6. otherwise `www-format-feature-name-default'.
;; NOTE(review): several conditions are on lines missing from this copy
;; (the embedded listing numbers skip), e.g. the test that decides
;; whether LANG is used.
699 (defun www-format-feature-name* (feature-name &optional lang)
700 (let (name fn parent ret)
703 (char-feature-property
705 (intern (format "name@%s" lang))))
706 (char-feature-property
707 feature-name 'name)))
708 ((and (setq name (symbol-name feature-name))
709 (string-match "\\*" name))
710 (www-format-feature-name-as-metadata feature-name lang))
712 (setq fn feature-name)
713 (while (and (setq parent (char-feature-name-parent fn))
716 (char-feature-property
718 (intern (format "name@%s" lang))))
719 (char-feature-property
724 (concat ret (substring (symbol-name feature-name)
725 (length (symbol-name parent)))))
726 ((find-charset feature-name)
727 (www-format-feature-name-as-CCS feature-name))
728 ((string-match "^\\(->\\)" name)
729 (www-format-feature-name-as-rel-to feature-name))
730 ((string-match "^\\(<-\\)" name)
731 (www-format-feature-name-as-rel-from feature-name))
733 (www-format-feature-name-default feature-name)
(defun www-format-feature-name (feature-name &optional lang)
  "Return the display name of FEATURE-NAME prepared for HTML output.
The name comes from `www-format-feature-name*' (which receives LANG)
and is then passed through `www-format-encode-string'."
  (let ((label (www-format-feature-name* feature-name lang)))
    (www-format-encode-string label)))
(defvar www-format-char-img-style
  "vertical-align:bottom;"
  "CSS text passed to the glyph <img> templates.
`www-format-encode-string' supplies it as an argument when it fills
those templates.")
;; Convert STRING into text for an HTML page.
;; The text is encoded with `encode-coding-region' using utf-8-mcs-er
;; while `coded-charset-entity-reference-alist' is extended with the
;; entries listed below; presumably this yields entity references of the
;; "&NAME-CODE;" forms that the later passes search for -- TODO confirm.
;; Each pass then rescans the buffer from the top for one family of
;; entity reference and fills an <img> template for it.
;; WITHOUT-TAGS and AS-BODY are optional; the lines that test them are
;; not present in this copy.
;; NOTE(review): many lines of this function are missing from this copy
;; (the embedded listing numbers skip), including the buffer setup, the
;; `replace-match' calls of the passes and the return value.
;; NOTE(review): several templates hard-code a `style=' attribute while
;; `www-format-char-img-style' is still passed as a trailing argument --
;; confirm this is intentional.
747 (defun www-format-encode-string (string &optional without-tags as-body)
750 (let (plane code subcode start end char variants ret rret)
;; NOTE(review): as written, the next three loops replace "&", "<" and
;; ">" with themselves, so nothing is escaped.  The replacement strings
;; look as if they lost their entity spelling (&amp; &lt; &gt;) --
;; confirm against the upstream file.
752 (goto-char (point-min))
753 (while (search-forward "&" nil t)
754 (replace-match "&" nil t)))
755 (goto-char (point-min))
756 (while (search-forward "<" nil t)
757 (replace-match "<" nil t))
758 (goto-char (point-min))
759 (while (search-forward ">" nil t)
760 (replace-match ">" nil t))
762 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
;; Entries have the shape (CHARSET PREFIX WIDTH RADIX-LETTER); they are
;; put in front of the existing alist for the encoding call that follows
;; the binding.
763 (let ((coded-charset-entity-reference-alist
767 '(=hanyo-denshi/ja "HD-JA-" 4 X)
768 '(=hanyo-denshi/jb "HD-JB-" 4 X)
769 '(=hanyo-denshi/jc "HD-JC-" 4 X)
770 '(=hanyo-denshi/jd "HD-JD-" 4 X)
771 '(=hanyo-denshi/ft "HD-FT-" 4 X)
772 '(=hanyo-denshi/ia "HD-IA-" 4 X)
773 '(=hanyo-denshi/ib "HD-IB-" 4 X)
774 '(=hanyo-denshi/hg "HD-HG-" 4 X)
775 '(=hanyo-denshi/ip "HD-IP-" 4 X)
776 '(=hanyo-denshi/jt "HD-JT-" 4 X)
777 '(=hanyo-denshi/ks "HD-KS-" 6 d)
778 '(=>>hanyo-denshi/ja "G-HD-JA-" 4 X)
779 '(=>>hanyo-denshi/jb "G-HD-JB-" 4 X)
780 '(=>>hanyo-denshi/jc "G-HD-JC-" 4 X)
781 '(=>>hanyo-denshi/jd "G-HD-JD-" 4 X)
782 '(=>>hanyo-denshi/ft "G-HD-FT-" 4 X)
783 '(=>>hanyo-denshi/ia "G-HD-IA-" 4 X)
784 '(=>>hanyo-denshi/ib "G-HD-IB-" 4 X)
785 '(=>>hanyo-denshi/hg "G-HD-HG-" 4 X)
786 '(=>>hanyo-denshi/ip "G-HD-IP-" 4 X)
787 '(=>>hanyo-denshi/jt "G-HD-JT-" 4 X)
788 '(=>>hanyo-denshi/ks "G-HD-KS-" 6 d)
790 '(==hanyo-denshi/ja "g2-HD-JA-" 4 X)
791 '(==hanyo-denshi/jb "g2-HD-JB-" 4 X)
792 '(==hanyo-denshi/jc "g2-HD-JC-" 4 X)
793 '(==hanyo-denshi/jd "g2-HD-JD-" 4 X)
794 '(==hanyo-denshi/ft "g2-HD-FT-" 4 X)
795 '(==hanyo-denshi/ia "g2-HD-IA-" 4 X)
796 '(==hanyo-denshi/ib "g2-HD-IB-" 4 X)
797 '(==hanyo-denshi/hg "g2-HD-HG-" 4 X)
798 '(==hanyo-denshi/ip "g2-HD-IP-" 4 X)
799 '(==hanyo-denshi/jt "g2-HD-JT-" 4 X)
800 '(==hanyo-denshi/ks "g2-HD-KS-" 6 d)
801 '(=cns11643-1 "C1-" 4 X)
802 '(=cns11643-2 "C2-" 4 X)
803 '(=cns11643-3 "C3-" 4 X)
804 '(=cns11643-4 "C4-" 4 X)
805 '(=cns11643-5 "C5-" 4 X)
806 '(=cns11643-6 "C6-" 4 X)
807 '(=cns11643-7 "C7-" 4 X)
808 '(=adobe-japan1-6 "AJ1-" 5 d)
809 '(=big5-cdp "CDP-" 4 X)
811 '(=gb12345 "G1-" 4 X)
812 '(=jis-x0208@1990 "J90-" 4 X)
813 '(=jis-x0212 "JSP-" 4 X)
815 '(=jis-x0208@1997 "J97-" 4 X)
816 '(=jis-x0208@1978 "J78-" 4 X)
817 '(=jis-x0208@1983 "J83-" 4 X)
818 '(=ruimoku-v6 "RUI6-" 4 X)
819 '(=zinbun-oracle "ZOB-" 4 d)
820 '(=jef-china3 "JC3-" 4 X)
821 '(=ucs@unicode "UU+" 4 X)
822 '(=ucs@JP/hanazono "hanaJU+" 4 X)
823 '(==cns11643-1 "R-C1-" 4 X)
824 '(==cns11643-2 "R-C2-" 4 X)
825 '(==cns11643-3 "R-C3-" 4 X)
826 '(==cns11643-4 "R-C4-" 4 X)
827 '(==cns11643-5 "R-C5-" 4 X)
828 '(==cns11643-6 "R-C6-" 4 X)
829 '(==cns11643-7 "R-C7-" 4 X)
830 '(=hanziku-1 "HZK01-" 4 X)
831 '(=hanziku-2 "HZK02-" 4 X)
832 '(=hanziku-3 "HZK03-" 4 X)
833 '(=hanziku-4 "HZK04-" 4 X)
834 '(=hanziku-5 "HZK05-" 4 X)
835 '(=hanziku-6 "HZK06-" 4 X)
836 '(=hanziku-7 "HZK07-" 4 X)
837 '(=hanziku-8 "HZK08-" 4 X)
838 '(=hanziku-9 "HZK09-" 4 X)
839 '(=hanziku-10 "HZK10-" 4 X)
840 '(=hanziku-11 "HZK11-" 4 X)
841 '(=hanziku-12 "HZK12-" 4 X)
843 '(=daikanwa "M-" 5 d)
844 coded-charset-entity-reference-alist)))
845 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
;; CB entities (decimal code, optional A-/G-/g2- prefix): GIF below
;; cb-gaiji/ on the bitmap glyph server.
847 (goto-char (point-min))
848 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\)?CB\\([0-9]+\\);" nil t)
849 (setq code (string-to-int (match-string 2)))
851 (format "<img alt=\"CB%05d\" src=\"%s/cb-gaiji/%02d/CB%05d.gif\"
854 chise-wiki-bitmap-glyphs-url
856 www-format-char-img-style)
;; J78/J83/J90/J97/JSP entities (four hex digits): GIF below
;; JIS-<edition>/; the low byte of the code minus 32 is one of the
;; file-name fields.
859 (goto-char (point-min))
860 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?J\\(78\\|83\\|90\\|97\\|SP\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
861 (setq plane (match-string 2)
862 code (string-to-int (match-string 3) 16))
864 (format "<img alt=\"J%s-%04X\" src=\"%s/JIS-%s/%02d-%02d.gif\"
867 chise-wiki-bitmap-glyphs-url
870 (- (logand code 255) 32)
871 www-format-char-img-style)
;; J0 entities: same layout, always served from JIS-90/.
874 (goto-char (point-min))
875 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?J0-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
876 (setq code (string-to-int (match-string 2) 16))
878 (format "<img alt=\"J0-%04X\" src=\"%s/JIS-90/%02d-%02d.gif\"
881 chise-wiki-bitmap-glyphs-url
883 (- (logand code 255) 32)
884 www-format-char-img-style)
;; HD-JA/JB/JC/JD/FT/IA/IB/HG entities: PNG below IVD/HanyoDenshi/ named
;; from the plane and two decimal fields.
887 (goto-char (point-min))
888 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-\\(JA\\|JB\\|JC\\|JD\\|FT\\|IA\\|IB\\|HG\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
889 (setq plane (match-string 2)
890 code (string-to-int (match-string 3) 16))
892 (format "<img alt=\"HD-%s-%04X\" src=\"%s/IVD/HanyoDenshi/%s%02d%02d.png\"
895 chise-wiki-bitmap-glyphs-url
898 (- (logand code 255) 32)
899 www-format-char-img-style)
;; HD-IP / HD-JT entities: PNG below IVD/HanyoDenshi/ named from the
;; plane and the four-digit hex code.
902 (goto-char (point-min))
903 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-\\(IP\\|JT\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
904 (setq plane (match-string 2)
905 code (string-to-int (match-string 3) 16))
907 (format "<img alt=\"HD-%s-%04X\" src=\"%s/IVD/HanyoDenshi/%s%04X.png\"
910 chise-wiki-bitmap-glyphs-url
912 www-format-char-img-style)
;; HD-KS entities (decimal code): PNG named KS plus six digits.
915 (goto-char (point-min))
916 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-KS-\\([0-9]+\\);" nil t)
917 (setq code (string-to-int (match-string 2)))
919 (format "<img alt=\"HD-KS%06d\" src=\"%s/IVD/HanyoDenshi/KS%06d.png\"
920 style=\"vertical-align:middle\">"
922 chise-wiki-bitmap-glyphs-url
924 www-format-char-img-style)
;; G0 / G1 entities: GIF below GB<plane>/.
927 (goto-char (point-min))
928 (while (re-search-forward "&G\\([01]\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
929 (setq plane (string-to-int (match-string 1))
930 code (string-to-int (match-string 2) 16))
932 (format "<img alt=\"GB%d-%04X\" src=\"%s/GB%d/%02d-%02d.gif\"
935 chise-wiki-bitmap-glyphs-url
938 (- (logand code 255) 32)
939 www-format-char-img-style)
;; C1 .. C7 entities (optional R- prefix): GIF below CNS<plane>/.
942 (goto-char (point-min))
943 (while (re-search-forward "&\\(R-\\)?C\\([1-7]\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
944 (setq plane (string-to-int (match-string 2))
945 code (string-to-int (match-string 3) 16))
947 (format "<img alt=\"CNS%d-%04X\" src=\"%s/CNS%d/%04X.gif\"
950 chise-wiki-bitmap-glyphs-url
952 www-format-char-img-style)
;; JC3 entities: GIF at a fixed kanji.zinbun.kyoto-u.ac.jp address.
955 (goto-char (point-min))
956 (while (re-search-forward "&\\(R-\\)?JC3-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
957 (setq code (string-to-int (match-string 2) 16))
959 (format "<img alt=\"JC3-%04X\" src=\"http://kanji.zinbun.kyoto-u.ac.jp/db/CHINA3/Gaiji/%04x.gif\">"
;; ZOB entities (decimal code): PNG below ZOB-1968/.
963 (goto-char (point-min))
964 (while (re-search-forward "&\\(A-\\)?ZOB-\\([0-9]+\\);" nil t)
965 (setq code (string-to-int (match-string 2)))
967 (format "<img alt=\"ZOB-%04d\" src=\"%s/ZOB-1968/%04d.png\"
968 style=\"vertical-align:middle\">"
970 chise-wiki-bitmap-glyphs-url
972 www-format-char-img-style)
;; HNG entities: plane digits, a four-digit code and one sub-code digit.
;; The sub-code is turned into a letter (96 + subcode decoded in ascii)
;; and the image is wrapped in a tooltip <div>; the charset is looked up
;; by its "HNG<plane>-" prefix in the entity-reference alist.
975 (goto-char (point-min))
976 (while (re-search-forward "&HNG\\([0-9]+\\)-\\([0-9][0-9][0-9][0-9]\\)\\([0-9]\\);" nil t)
977 (setq plane (match-string 1)
978 code (string-to-int (match-string 2))
979 subcode (string-to-int (match-string 3)))
983 (char-to-string (decode-char 'ascii (+ 96 subcode)))))
986 "<div class=\"tooltip\"><img alt=\"HNG%s-%04d%s\" src=\"%s/%s/%04d%s.png\" style=\"
987 vertical-align:middle; width: 48px; height: 48px\"><span
988 class=\"tooltiptext\">%s</span></div>"
990 chise-wiki-hng-bitmap-glyphs-url
993 (car (find (format "HNG%s-" plane)
994 coded-charset-entity-reference-alist
995 :test (lambda (key cell)
996 (string= key (nth 1 cell))))))
;; AJ1 entities (decimal code): PNG below IVD/AdobeJapan1/.
1000 (goto-char (point-min))
1001 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?AJ1-\\([0-9]+\\);" nil t)
1002 (setq code (string-to-int (match-string 2)))
1004 (format "<img alt=\"AJ1-%05d\" src=\"%s/IVD/AdobeJapan1/CID+%d.png\"
1005 style=\"vertical-align:middle\">"
1007 chise-wiki-bitmap-glyphs-url
1009 www-format-char-img-style)
;; MJ entities (decimal code): image address on mojikiban.ipa.go.jp.
1012 (goto-char (point-min))
1013 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\)?MJ\\([0-9]+\\);" nil t)
1014 (setq code (string-to-int (match-string 2)))
1016 (format "<img alt=\"MJ%06d\" src=\"http://mojikiban.ipa.go.jp/search/MJ%06d\"
1017 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1020 www-format-char-img-style)
;; IU entities ("IU+" or "IU-", hex code): glyphwiki.org image u<hex>.
1023 (goto-char (point-min))
1024 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\)?IU[+-]\\([0-9A-F]+\\);" nil t)
1025 (setq code (string-to-int (match-string 2) 16))
1027 (format "<img alt=\"u%04x\" src=\"http://glyphwiki.org/glyph/u%04x.100px.png\"
1028 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1031 www-format-char-img-style)
;; U-i<n>+<hex> entities: glyphwiki.org image u<hex>-itaiji-<n>.
1034 (goto-char (point-min))
1035 (while (re-search-forward "&U-i\\([0-9]+\\)\\+\\([0-9A-F]+\\);" nil t)
1036 (setq plane (string-to-int (match-string 1))
1037 code (string-to-int (match-string 2) 16))
1039 (format "<img alt=\"u%04x-itaiji-%03d\" src=\"http://glyphwiki.org/glyph/u%04x-itaiji-%03d.100px.png\"
1040 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1045 www-format-char-img-style)
;; A-IWDSU+<hex> entities: glyphwiki.org image u<hex>.
1048 (goto-char (point-min))
1049 (while (re-search-forward "&A-IWDSU\\+\\([0-9A-F]+\\);" nil t)
1050 (setq code (string-to-int (match-string 1) 16))
1052 (format "<img alt=\"A-IWDSU+%04x\" src=\"http://glyphwiki.org/glyph/u%04x.100px.png\"
1053 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1056 www-format-char-img-style)
;; U-v<n>+<hex> entities: glyphwiki.org image u<hex>-var-<n>.
;; NOTE(review): the alt text says "itaiji" while the image name says
;; "var" -- confirm which is intended.
1059 (goto-char (point-min))
1060 (while (re-search-forward "&U-v\\([0-9]+\\)\\+\\([0-9A-F]+\\);" nil t)
1061 (setq plane (string-to-int (match-string 1))
1062 code (string-to-int (match-string 2) 16))
1064 (format "<img alt=\"u%04x-itaiji-%03d\" src=\"http://glyphwiki.org/glyph/u%04x-var-%03d.100px.png\"
1065 style=\"vertical-align:middle; width: 48px; height: 48px\">"
1070 www-format-char-img-style)
;; GT entities (decimal code): image served by the glyph CGI.
1073 (goto-char (point-min))
1074 (while (re-search-forward "&\\(A-\\|G-\\|R-\\|g2-\\)?GT-\\([0-9]+\\);" nil t)
1075 (setq code (string-to-int (match-string 2)))
1077 (format "<img alt=\"GT-%05d\" src=\"%s?char=GT-%05d\"
1080 chise-wiki-glyph-cgi-url
1082 www-format-char-img-style)
;; GT-K entities (decimal code): image served by the glyph CGI.
1085 (goto-char (point-min))
1086 (while (re-search-forward "&\\(G-\\)?GT-K\\([0-9]+\\);" nil t)
1087 (setq code (string-to-int (match-string 2)))
1089 (format "<img alt=\"GT-K%05d\" src=\"%s?char=GT-K%05d\"
1092 chise-wiki-glyph-cgi-url
1094 www-format-char-img-style)
;; B entities (hex code): image served by the glyph CGI.
1097 (goto-char (point-min))
1098 (while (re-search-forward "&B-\\([0-9A-F]+\\);" nil t)
1099 (setq code (string-to-int (match-string 1) 16))
1101 (format "<img alt=\"B-%04X\" src=\"%s?char=B-%04X\"
1104 chise-wiki-glyph-cgi-url
1106 www-format-char-img-style)
;; CDP entities (hex code): image served by the glyph CGI.
1109 (goto-char (point-min))
1110 (while (re-search-forward "&\\(G-\\|g2-\\|R-\\)?CDP-\\([0-9A-F]+\\);" nil t)
1111 (setq code (string-to-int (match-string 2) 16))
1113 (format "<img alt=\"CDP-%04X\" src=\"%s?char=CDP-%04X\"
1116 chise-wiki-glyph-cgi-url
1118 www-format-char-img-style)
;; HZK01 .. HZK12 entities (hex code): image served by the glyph CGI.
1121 (goto-char (point-min))
1122 (while (re-search-forward
1123 "&\\(I-\\)?HZK\\(0[1-9]\\|1[0-2]\\)-\\([0-9A-F]+\\);" nil t)
1124 (setq plane (match-string 2)
1125 code (string-to-int (match-string 3) 16))
1127 (format "<img alt=\"HZK%s-%04X\" src=\"%s?char=HZK%s-%04X\"
1131 chise-wiki-glyph-cgi-url
1134 www-format-char-img-style)
;; RUI6 entities (hex code): image served by the glyph CGI.
1137 (goto-char (point-min))
1138 (while (re-search-forward "&RUI6-\\([0-9A-F]+\\);" nil t)
1139 (setq code (string-to-int (match-string 1) 16))
1141 (format "<img alt=\"RUI6-%04X\" src=\"%s?char=RUI6-%04X\"
1142 style=\"vertical-align:middle\">"
1144 chise-wiki-glyph-cgi-url
1146 www-format-char-img-style)
;; hanaJU+ entities (hex code): image served by the glyph CGI under the
;; name hana-JU+<hex>.
1149 (goto-char (point-min))
1150 (while (re-search-forward "&hanaJU\\+\\([0-9A-F]+\\);" nil t)
1151 (setq code (string-to-int (match-string 1) 16))
1153 (format "<img alt=\"hanaJU+%04X\" src=\"%s?char=hana-JU+%04X\"
1154 style=\"vertical-align:middle\">"
1156 chise-wiki-glyph-cgi-url
1158 www-format-char-img-style)
;; UU+ / U- entities (hex code): reference glyph from www.unicode.org.
1161 (goto-char (point-min))
1162 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\|R-\\)?\\(UU\\+\\|U-\\)\\([0-9A-F]+\\);" nil t)
1163 (setq code (string-to-int (match-string 3) 16))
1165 (format "<img alt=\"UU+%04X\" src=\"http://www.unicode.org/cgi-bin/refglyph?24-%04X\"
1166 style=\"vertical-align:middle\">"
1169 www-format-char-img-style)
;; MCS entities (hex system-char-id): the character is decoded and a
;; displayable substitute is looked for.  First its `->subsumptive' or
;; `->denotational' variants are encoded recursively until one yields
;; text without an MCS entity; failing that, its
;; `ideographic-combination' or `ideographic-structure' value is encoded
;; component by component.
1172 (goto-char (point-min))
1173 (while (re-search-forward "&MCS-\\([0-9A-F]+\\);" nil t)
1174 (setq code (string-to-int (match-string 1) 16))
1175 (setq start (match-beginning 0)
1177 (setq char (decode-char 'system-char-id code))
1179 ((and (setq variants
1180 (or (www-get-feature-value char '->subsumptive)
1181 (www-get-feature-value char '->denotational)))
1183 (while (and variants
1184 (setq ret (www-format-encode-string
1185 (char-to-string (car variants))))
1186 (string-match "&MCS-\\([0-9A-F]+\\);" ret))
1187 (setq variants (cdr variants)))
1189 (unless (string-match "&MCS-\\([0-9A-F]+\\);" ret)
1191 (delete-region start end)
1194 ((setq ret (or (www-get-feature-value char 'ideographic-combination)
1195 (www-get-feature-value char 'ideographic-structure)))
1200 (if (characterp (setq rret (find-char ch)))
1203 (www-format-encode-string
1204 (char-to-string ch) without-tags)
1205 (www-format-encode-string
1206 (format "%S" ch) without-tags)))
1210 (delete-region start end)
1214 ;; (goto-char (point-min))
1215 ;; (while (search-forward ">-" nil t)
1216 ;; (replace-match "&GT-" t 'literal))
;; Prepare TEXT for display in an HTML page: rewrite wiki links of the
;; form [[A|B]] as <a href="..."> elements, encode the buffer with
;; utf-8-mcs-er, and finally rewrite ">-" as "&GT-".
;; NOTE(review): the buffer setup, the arguments filled into the link
;; template and the return value are on lines missing from this copy
;; (the embedded listing numbers skip).
1219 (defun www-html-display-text (text)
;; NOTE(review): as written, the next two loops replace "<" and ">" with
;; themselves, so nothing is escaped.  The replacement strings look as
;; if they lost their entity spelling (&lt; &gt;) -- confirm against the
;; upstream file.
1223 (goto-char (point-min))
1224 (while (search-forward "<" nil t)
1225 (replace-match "<" nil t))
1226 (goto-char (point-min))
1227 (while (search-forward ">" nil t)
1228 (replace-match ">" nil t))
;; Wiki links: two fields separated by "|" inside double brackets.
1229 (goto-char (point-min))
1230 (while (re-search-forward "\\[\\[\\([^]|[]+\\)|\\([^][]+\\)\\]\\]" nil t)
1232 (format "<a href=\"%s\">%s</a>"
1236 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
;; NOTE(review): the search text ">-" may likewise have been "&gt;-"
;; originally, which would restore "&GT-" entity prefixes after the
;; escaping above -- confirm upstream.
1237 (goto-char (point-min))
1238 (while (search-forward ">-" nil t)
1239 (replace-match "&GT-" nil t))
;; Display TEXT as a paragraph; the text itself is handled by
;; `www-html-display-text'.
;; NOTE(review): whatever is emitted around that call is on lines
;; missing from this copy (the embedded listing numbers skip).
1242 (defun www-html-display-paragraph (text)
1244 (www-html-display-text text)
;; Table used by `char-GlyphWiki-id' to build an identifier from a
;; character's code point in a coded charset.
;; Full entries have five fields: (CHARSET PREFIX WIDTH LETTER SUFFIX).
;; `char-GlyphWiki-id' scans the entries in order, reading each
;; CHARSET with `char-feature', and uses the first entry that yields a
;; value; SUFFIX (nil meaning none) is appended at the end.  PREFIX,
;; WIDTH and LETTER presumably fill the "%s%%0%d%s%s" template as
;; leading text, zero-padded width and number format letter -- TODO
;; confirm, those argument lines are not present in this copy.
;; The two =decomposition@... entries carry only the feature name.
;; NOTE(review): the closing parentheses of this form are not present in
;; this copy (the embedded listing numbers jump from 1343 to 1346), and
;; numbers 1329 and 1332 are skipped.
1251 (defvar coded-charset-GlyphWiki-id-alist
1252 '((===adobe-japan1-0 "aj1-" 5 d nil)
1253 (===adobe-japan1-1 "aj1-" 5 d nil)
1254 (===adobe-japan1-2 "aj1-" 5 d nil)
1255 (===adobe-japan1-3 "aj1-" 5 d nil)
1256 (===adobe-japan1-4 "aj1-" 5 d nil)
1257 (===adobe-japan1-5 "aj1-" 5 d nil)
1258 (===adobe-japan1-6 "aj1-" 5 d nil)
1259 (===ucs@jis "u" 4 x nil)
1260 (===daikanwa "dkw-" 5 d nil)
1261 (===ucs@ks "u" 4 x "-k")
1262 (=ucs-var-001 "u" 4 x "-var-001")
1263 (=ucs-var-002 "u" 4 x "-var-002")
1264 (=ucs-var-003 "u" 4 x "-var-003")
1265 (=ucs-itaiji-001 "u" 4 x "-itaiji-001")
1266 (=ucs-itaiji-002 "u" 4 x "-itaiji-002")
1267 (=ucs-itaiji-003 "u" 4 x "-itaiji-003")
1268 (=ucs-itaiji-084 "u" 4 x "-itaiji-084")
1269 (==adobe-japan1-0 "aj1-" 5 d nil)
1270 (==adobe-japan1-1 "aj1-" 5 d nil)
1271 (==adobe-japan1-2 "aj1-" 5 d nil)
1272 (==adobe-japan1-3 "aj1-" 5 d nil)
1273 (==adobe-japan1-4 "aj1-" 5 d nil)
1274 (==adobe-japan1-5 "aj1-" 5 d nil)
1275 (==adobe-japan1-6 "aj1-" 5 d nil)
1276 (==ucs@jis "u" 4 x nil)
1277 (==ucs@iso "u" 4 x nil)
1278 (==ucs@cns "u" 4 x "-t")
1279 (==ucs@unicode "u" 4 x "-us")
1280 (==daikanwa "dkw-" 5 d nil)
1281 (==ucs@ks "u" 4 x "-k")
1282 (==jis-x0208@1978 "j78-" 4 x nil)
1283 (==jis-x0208 "j90-" 4 x nil)
1284 (==jis-x0208@1990 "j90-" 4 x nil)
1285 (==jis-x0208@1983 "j83-" 4 x nil)
1286 (==cbeta "cbeta-" 5 d nil)
1287 (=>>hanyo-denshi/ks "koseki-" 6 d nil)
1288 (=>>jis-x0208@1978 "j78-" 4 x nil)
1289 (=>>big5-cdp "cdp-" 4 x nil)
1290 (=>>jis-x0208 "j90-" 4 x nil)
1291 (=>>jis-x0208@1990 "j90-" 4 x nil)
1292 (=>>jis-x0208@1983 "j83-" 4 x nil)
1293 (=>>daikanwa "dkw-" 5 d nil)
1294 (=adobe-japan1-0 "aj1-" 5 d nil)
1295 (=adobe-japan1-1 "aj1-" 5 d nil)
1296 (=adobe-japan1-2 "aj1-" 5 d nil)
1297 (=adobe-japan1-3 "aj1-" 5 d nil)
1298 (=adobe-japan1-4 "aj1-" 5 d nil)
1299 (=adobe-japan1-5 "aj1-" 5 d nil)
1300 (=adobe-japan1-6 "aj1-" 5 d nil)
1301 (=decomposition@cid)
1302 (=decomposition@hanyo-denshi)
1303 (=hanyo-denshi/ks "koseki-" 6 d nil)
1304 (=koseki "koseki-" 6 d nil)
1305 (=ucs@jis "u" 4 x nil)
1306 (=ucs@cns "u" 4 x "-t")
1307 (=ucs@ks "u" 4 x "-k")
1308 (=ucs@JP "u" 4 x nil)
1309 (=ucs@gb "u" 4 x "-g")
1310 (=ucs@iso "u" 4 x "-u")
1311 (=ucs@unicode "u" 4 x "-us")
1312 (=big5-cdp "cdp-" 4 x nil)
1313 (=cbeta "cbeta-" 5 d nil)
1314 (=big5-cdp-var-3 "cdp-" 4 x "-var-3")
1315 (=big5-cdp-var-5 "cdp-" 4 x "-var-5")
1316 (=jef-china3 "jc3-" 4 x nil)
1317 (=jis-x0212 "jsp-" 4 x nil)
1318 (=jis-x0213-1@2000 "jx1-2000-" 4 x nil)
1319 (=jis-x0213-1@2004 "jx1-2004-" 4 x nil)
1320 (=jis-x0213-2 "jx2-" 4 x nil)
1321 (=gt-k "gt-k" 5 d nil)
1322 (=jis-x0208@1978/1pr "j78-" 4 x nil)
1323 (=jis-x0208@1978/-4pr "j78-" 4 x nil)
1324 (=jis-x0208@1978 "j78-" 4 x nil)
1325 (=+>jis-x0208@1978 "j78-" 4 x nil)
1326 (=+>jis-x0208 "j90-" 4 x nil)
1327 (=+>jis-x0208@1990 "j90-" 4 x nil)
1328 (=+>jis-x0208@1983 "j83-" 4 x nil)
1330 (=big5 "b-" 4 x nil)
1331 (=daikanwa "dkw-" 5 d nil)
1333 (=ks-x1001 "k0-" 4 x nil)
1334 (=cns11643-1 "c1-" 4 x nil)
1335 (=cns11643-2 "c2-" 4 x nil)
1336 (=cns11643-3 "c3-" 4 x nil)
1337 (=cns11643-4 "c4-" 4 x nil)
1338 (=cns11643-5 "c5-" 4 x nil)
1339 (=cns11643-6 "c6-" 4 x nil)
1340 (=cns11643-7 "c7-" 4 x nil)
1341 (=jis-x0208 "j90-" 4 x nil)
1342 (=jis-x0208@1990 "j90-" 4 x nil)
1343 (=jis-x0208@1983 "j83-" 4 x nil)
;; Return a GlyphWiki-style identifier string for CHAR.
;; The entries of `coded-charset-GlyphWiki-id-alist' are scanned in
;; order until `char-feature' returns a value for an entry's charset.
;; Visible outcomes:
;;   - a list value is mapped through this function recursively and the
;;     pieces are joined with "-";
;;   - for some charsets a regional UCS form is preferred when CHAR also
;;     belongs to a national charset: "u%04x" (JIS), "u%04x-g" (GB),
;;     "u%04x-t" (CNS) and "u%04x-k" (KS);
;;   - otherwise the entry's fields fill the "%s%%0%d%s%s" template and
;;     the entry's fifth field (or "") is appended.
;; NOTE(review): the loop header, several `cond' conditions and the
;; template arguments are on lines missing from this copy (the embedded
;; listing numbers skip).
1346 (defun char-GlyphWiki-id (char)
1347 (let ((rest coded-charset-GlyphWiki-id-alist)
1350 (setq spec (pop rest))
1351 (null (setq ret (char-feature char (car spec))))))
1355 (mapconcat #'char-GlyphWiki-id ret "-"))
;; NOTE(review): the inner quote makes the second list element the list
;; (quote =ucs@iso) rather than the symbol =ucs@iso, so `memq' can only
;; ever match =ucs@unicode here -- looks unintended; confirm and drop
;; the inner quote if so.
1356 (and (memq (car spec) '(=ucs@unicode '=ucs@iso))
1358 ((and (or (encode-char char '=jis-x0208@1990)
1359 (encode-char char '=jis-x0212)
1360 (encode-char char '=jis-x0213-1)
1361 (encode-char char '=jis-x0213-2))
1362 (setq code (encode-char char '=ucs@jis)))
1363 (format "u%04x" code)
1365 ((and (or (encode-char char '=gb2312)
1366 (encode-char char '=gb12345))
1367 (setq code (encode-char char '=ucs@gb)))
1368 (format "u%04x-g" code)
1370 ((and (or (encode-char char '=cns11643-1)
1371 (encode-char char '=cns11643-2)
1372 (encode-char char '=cns11643-3)
1373 (encode-char char '=cns11643-4)
1374 (encode-char char '=cns11643-5)
1375 (encode-char char '=cns11643-6)
1376 (encode-char char '=cns11643-7))
1377 (setq code (encode-char char '=ucs@cns)))
1378 (format "u%04x-t" code)
1380 ((and (encode-char char '=ks-x1001)
1381 (setq code (encode-char char '=ucs@ks)))
1382 (format "u%04x-k" code)
;; The inner `format' builds the template for the outer `format'.
1384 (format (format "%s%%0%d%s%s"
1388 (or (nth 4 spec) ""))
1395 (provide 'cwiki-common)
1397 ;;; cwiki-common.el ends here