2 (require 'cwiki-common)
;; www-format-encode-string (STRING &optional WITHOUT-TAGS AS-BODY)
;;
;; Turns text into HTML in which characters that the `utf-8-mcs-er'
;; encoding writes as entity references (&PREFIX-CODE;) are shown as
;; <img> tags pointing at glyph images.
;;
;; NOTE(review): this view of the function has gaps (a number of the
;; original lines are not present), so the notes below describe only the
;; forms that are visible here.
;;
;; Visible steps, in order:
;;  1. Three literal search/replace passes for "&", "<" and ">".  As
;;     shown here the replacement text equals the search text;
;;     presumably the replacements were HTML entities -- confirm against
;;     the upstream file.
;;  2. `encode-coding-region' with `utf-8-mcs-er' over the whole buffer,
;;     with `coded-charset-entity-reference-alist' let-bound.  The new
;;     value lists entries of the shape (CCS "PREFIX" NUMBER LETTER) and
;;     ends with the previous value of the variable.  NUMBER/LETTER look
;;     like a digit count and a hex (X) / decimal (d) flag -- TODO
;;     confirm.
;;  3. One pass per entity family.  Each pass goes back to `point-min',
;;     loops with `re-search-forward', parses the code with
;;     `string-to-int' (base 16 where the pattern is hexadecimal) and
;;     builds an <img> tag with `format'.  Families seen here: CB, J78 /
;;     J83 / J90 / J97 / JSP, J0, HD-* (Hanyo-Denshi), G0/G1, C1..C7,
;;     JC3, ZOB, DJT, SW-JIGUGE, HNG, CHISE-HDIC-TSJ/SYP/KTB, AJ1, MJ,
;;     IU, KU, A-compU / A-cgnU, U-i (itaiji), A-IWDSU, CDP-i, CDP-v,
;;     M- (alt text "dkw-"), U-v, GT-, GT-K, B-, CDP-, HZK01..HZK12,
;;     RUI6, hanaJU+, UU+ / U-.
;;  4. &MCS-XXXX; references: the character is decoded from
;;     `system-char-id'; its `->subsumptive' or `->denotational'
;;     value(s) are encoded by calling this function recursively until
;;     one result contains no &MCS-...; reference.  Otherwise the
;;     `ideographic-combination' / `ideographic-structure' value is used
;;     and its elements are encoded recursively.
;;
;; Arguments:
;;   STRING       - text to convert (its insertion into a buffer is not
;;                  visible in this view).
;;   WITHOUT-TAGS - forwarded to the recursive calls made for structure
;;                  components near the end of the function.
;;   AS-BODY      - not referenced in the visible lines.
;;
;; NOTE(review): the HD-TK pass formats its alt text with "HD-KS%06d";
;; this looks like a copy of the HD-KS pass -- confirm whether "HD-TK"
;; was intended.
;; NOTE(review): `string-to-int' is the XEmacs-era name; on GNU Emacs
;; the equivalent is `string-to-number' -- confirm the target runtime.
4 (defun www-format-encode-string (string &optional without-tags as-body)
7 (let (plane code subcode start end char variants ret rret)
;; Literal search/replace passes, each restarting from the beginning of
;; the current buffer.
9 (goto-char (point-min))
10 (while (search-forward "&" nil t)
11 (replace-match "&" nil t)))
12 (goto-char (point-min))
13 (while (search-forward "<" nil t)
14 (replace-match "<" nil t))
15 (goto-char (point-min))
16 (while (search-forward ">" nil t)
17 (replace-match ">" nil t))
19 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
;; Extra entity-reference entries; the list ends with the previous value
;; of the variable (see the last entry line below).
20 (let ((coded-charset-entity-reference-alist
24 '(=hanyo-denshi/ja "HD-JA-" 4 X)
25 '(=hanyo-denshi/jb "HD-JB-" 4 X)
26 '(=hanyo-denshi/jc "HD-JC-" 4 X)
27 '(=hanyo-denshi/jd "HD-JD-" 4 X)
28 '(=hanyo-denshi/ft "HD-FT-" 4 X)
29 '(=hanyo-denshi/ia "HD-IA-" 4 X)
30 '(=hanyo-denshi/ib "HD-IB-" 4 X)
31 '(=hanyo-denshi/hg "HD-HG-" 4 X)
32 '(=hanyo-denshi/ip "HD-IP-" 4 X)
33 '(=hanyo-denshi/jt "HD-JT-" 4 X)
34 '(=hanyo-denshi/ks "HD-KS-" 6 d)
35 '(=>>hanyo-denshi/ja "G-HD-JA-" 4 X)
36 '(=>>hanyo-denshi/jb "G-HD-JB-" 4 X)
37 '(=>>hanyo-denshi/jc "G-HD-JC-" 4 X)
38 '(=>>hanyo-denshi/jd "G-HD-JD-" 4 X)
39 '(=>>hanyo-denshi/ft "G-HD-FT-" 4 X)
40 '(=>>hanyo-denshi/ia "G-HD-IA-" 4 X)
41 '(=>>hanyo-denshi/ib "G-HD-IB-" 4 X)
42 '(=>>hanyo-denshi/hg "G-HD-HG-" 4 X)
43 '(=>>hanyo-denshi/ip "G-HD-IP-" 4 X)
44 '(=>>hanyo-denshi/jt "G-HD-JT-" 4 X)
45 '(=>>hanyo-denshi/ks "G-HD-KS-" 6 d)
47 '(==hanyo-denshi/ja "g2-HD-JA-" 4 X)
48 '(==hanyo-denshi/jb "g2-HD-JB-" 4 X)
49 '(==hanyo-denshi/jc "g2-HD-JC-" 4 X)
50 '(==hanyo-denshi/jd "g2-HD-JD-" 4 X)
51 '(==hanyo-denshi/ft "g2-HD-FT-" 4 X)
52 '(==hanyo-denshi/ia "g2-HD-IA-" 4 X)
53 '(==hanyo-denshi/ib "g2-HD-IB-" 4 X)
54 '(==hanyo-denshi/hg "g2-HD-HG-" 4 X)
55 '(==hanyo-denshi/ip "g2-HD-IP-" 4 X)
56 '(==hanyo-denshi/jt "g2-HD-JT-" 4 X)
57 '(==hanyo-denshi/ks "g2-HD-KS-" 6 d)
58 '(==daijiten "g2-DJT-" 5 d)
59 '(=cns11643-1 "C1-" 4 X)
60 '(=cns11643-2 "C2-" 4 X)
61 '(=cns11643-3 "C3-" 4 X)
62 '(=cns11643-4 "C4-" 4 X)
63 '(=cns11643-5 "C5-" 4 X)
64 '(=cns11643-6 "C6-" 4 X)
65 '(=cns11643-7 "C7-" 4 X)
66 '(=adobe-japan1-6 "AJ1-" 5 d)
67 '(=big5-cdp "CDP-" 4 X)
68 '(=>big5-cdp "A-CDP-" 4 X)
71 '(=jis-x0208@1990 "J90-" 4 X)
72 '(=jis-x0212 "JSP-" 4 X)
74 '(=jis-x0208@1997 "J97-" 4 X)
75 '(=jis-x0208@1978 "J78-" 4 X)
76 '(=jis-x0208@1983 "J83-" 4 X)
77 '(=ruimoku-v6 "RUI6-" 4 X)
78 '(=zinbun-oracle "ZOB-" 4 d)
79 '(=daijiten "DJT-" 5 d)
80 '(=jef-china3 "JC3-" 4 X)
81 '(=ucs@unicode "UU+" 4 X)
82 '(=ucs@JP/hanazono "hanaJU+" 4 X)
83 '(==cns11643-1 "R-C1-" 4 X)
84 '(==cns11643-2 "R-C2-" 4 X)
85 '(==cns11643-3 "R-C3-" 4 X)
86 '(==cns11643-4 "R-C4-" 4 X)
87 '(==cns11643-5 "R-C5-" 4 X)
88 '(==cns11643-6 "R-C6-" 4 X)
89 '(==cns11643-7 "R-C7-" 4 X)
90 '(=hanziku-1 "HZK01-" 4 X)
91 '(=hanziku-2 "HZK02-" 4 X)
92 '(=hanziku-3 "HZK03-" 4 X)
93 '(=hanziku-4 "HZK04-" 4 X)
94 '(=hanziku-5 "HZK05-" 4 X)
95 '(=hanziku-6 "HZK06-" 4 X)
96 '(=hanziku-7 "HZK07-" 4 X)
97 '(=hanziku-8 "HZK08-" 4 X)
98 '(=hanziku-9 "HZK09-" 4 X)
99 '(=hanziku-10 "HZK10-" 4 X)
100 '(=hanziku-11 "HZK11-" 4 X)
101 '(=hanziku-12 "HZK12-" 4 X)
102 '(==>daijiten "A2-DJT-" 5 d)
105 '(=daikanwa "M-" 5 d)
106 '(=>>daikanwa "G-M-" 5 d)
107 '(===ucs@ks "R-KU+" 4 X)
108 coded-charset-entity-reference-alist)))
109 (encode-coding-region (point-min)(point-max) 'utf-8-mcs-er)
;; From here on: one rewrite pass per entity-reference family, each
;; starting again at the beginning of the buffer.
111 (goto-char (point-min))
112 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\|R-\\)?CB\\([0-9]+\\);" nil t)
113 (setq code (string-to-int (match-string 2)))
115 (format "<img alt=\"CB%05d\" src=\"%s/cb-gaiji/%02d/CB%05d.gif\"
118 chise-wiki-legacy-bitmap-glyphs-url
120 www-format-char-img-style)
123 (goto-char (point-min))
124 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?J\\(78\\|83\\|90\\|97\\|SP\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
125 (setq plane (match-string 2)
126 code (string-to-int (match-string 3) 16))
128 (format "<img alt=\"J%s-%04X\" src=\"%s/JIS-%s/%02d-%02d.gif\"
131 chise-wiki-legacy-bitmap-glyphs-url
134 (- (logand code 255) 32)
135 www-format-char-img-style)
138 (goto-char (point-min))
139 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?J0-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
140 (setq code (string-to-int (match-string 2) 16))
142 (format "<img alt=\"J0-%04X\" src=\"%s/JIS-90/%02d-%02d.gif\"
145 chise-wiki-legacy-bitmap-glyphs-url
147 (- (logand code 255) 32)
148 www-format-char-img-style)
151 (goto-char (point-min))
152 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-\\(JA\\|JB\\|JC\\|JD\\|FT\\|IA\\|IB\\|HG\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
153 (setq plane (match-string 2)
154 code (string-to-int (match-string 3) 16))
156 (format "<img alt=\"HD-%s-%04X\" src=\"%s/IVD/HanyoDenshi/%s%02d%02d.png\"
159 chise-wiki-legacy-bitmap-glyphs-url
162 (- (logand code 255) 32)
163 www-format-char-img-style)
166 (goto-char (point-min))
167 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-\\(IP\\|JT\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
168 (setq plane (match-string 2)
169 code (string-to-int (match-string 3) 16))
171 (format "<img alt=\"HD-%s-%04X\" src=\"%s/IVD/HanyoDenshi/%s%04X.png\"
174 chise-wiki-legacy-bitmap-glyphs-url
176 www-format-char-img-style)
179 (goto-char (point-min))
180 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-KS-\\([0-9]+\\);" nil t)
181 (setq code (string-to-int (match-string 2)))
183 (format "<img alt=\"HD-KS%06d\" src=\"%s/IVD/HanyoDenshi/KS%06d.png\"
184 style=\"vertical-align:middle\">"
186 chise-wiki-legacy-bitmap-glyphs-url
188 www-format-char-img-style)
191 (goto-char (point-min))
192 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?HD-TK-\\([0-9]+\\);" nil t)
193 (setq code (string-to-int (match-string 2)))
195 (format "<img alt=\"HD-KS%06d\" src=\"%s/IVD/HanyoDenshi/TK%08d.png\"
196 style=\"vertical-align:middle\">"
198 chise-wiki-legacy-bitmap-glyphs-url
200 www-format-char-img-style)
203 (goto-char (point-min))
204 (while (re-search-forward "&G\\([01]\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
205 (setq plane (string-to-int (match-string 1))
206 code (string-to-int (match-string 2) 16))
208 (format "<img alt=\"GB%d-%04X\" src=\"%s/GB%d/%02d-%02d.gif\"
211 chise-wiki-legacy-bitmap-glyphs-url
214 (- (logand code 255) 32)
215 www-format-char-img-style)
218 (goto-char (point-min))
219 (while (re-search-forward "&\\(R-\\)?C\\([1-7]\\)-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
220 (setq plane (string-to-int (match-string 2))
221 code (string-to-int (match-string 3) 16))
223 (format "<img alt=\"CNS%d-%04X\" src=\"%s/CNS%d/%04X.gif\"
226 chise-wiki-legacy-bitmap-glyphs-url
228 www-format-char-img-style)
231 (goto-char (point-min))
232 (while (re-search-forward "&\\(R-\\)?JC3-\\([0-9A-F][0-9A-F][0-9A-F][0-9A-F]\\);" nil t)
233 (setq code (string-to-int (match-string 2) 16))
235 (format "<img alt=\"JC3-%04X\" src=\"%s/JEF-CHINA3/%04X.png\">"
236 code chise-wiki-bitmap-glyph-image-url code)
239 (goto-char (point-min))
240 (while (re-search-forward "&\\(A-\\)?ZOB-\\([0-9]+\\);" nil t)
241 (setq code (string-to-int (match-string 2)))
243 (format "<img alt=\"ZOB-%04d\" src=\"%s/ZOB-1968/%04d.png\"
244 style=\"vertical-align:middle\">"
246 chise-wiki-legacy-bitmap-glyphs-url
248 www-format-char-img-style)
251 (goto-char (point-min))
252 (while (re-search-forward "&\\(A2-\\|g2-\\|R-\\)?DJT-\\([0-9]+\\);" nil t)
253 (setq code (string-to-int (match-string 2)))
255 (format "<img alt=\"DJT-%05d\" src=\"%s/%05d.png\"
256 style=\"vertical-align:middle; width: auto; max-height: 60px\">"
258 chise-wiki-daijiten-bitmap-glyphs-url
260 www-format-char-img-style)
263 (goto-char (point-min))
264 (while (re-search-forward "&SW-JIGUGE\\([45]?\\)-\\([0-9]+\\);" nil t)
265 (setq subcode (match-string 1)
266 code (string-to-int (match-string 2)))
268 (if (string= subcode "")
272 (format "<img alt=\"SW-JIGUGE%s-%05d\" src=\"%s/ShuoWen/Jiguge%s/%05d.png\"
273 style=\"vertical-align:middle; width: auto; max-height: 80px\">"
275 chise-wiki-legacy-bitmap-glyphs-url
279 (goto-char (point-min))
280 (while (re-search-forward "&HNG\\([0-9]+\\)-\\([0-9][0-9][0-9][0-9]\\)\\([0-9]\\);" nil t)
281 (setq plane (match-string 1)
282 code (string-to-int (match-string 2))
283 subcode (string-to-int (match-string 3)))
287 (char-to-string (decode-char 'ascii (+ 96 subcode)))))
290 "<img alt=\"HNG%s-%04d%s\" src=\"%s/%s/%04d%s.png\" style=\"
291 vertical-align:middle; width: auto; max-height: 60px\">"
293 chise-wiki-hng-bitmap-glyphs-url
298 (goto-char (point-min))
299 (while (re-search-forward "&\\(R-\\)?CHISE-HDIC-TSJ\\([0-9A-F]+\\);" nil t)
300 (setq code (string-to-int (match-string 2) 16))
301 (setq char (decode-char '===chise-hdic-tsj code))
302 (when (setq ret (get-char-attribute char '=hdic-tsj-glyph-id))
305 "<img alt=\"HDIC-TSJ-%s\" src=\"https://viewer.hdic.jp/img/tsj/%s.jpg\" style=\"
306 vertical-align:middle; width: auto; max-height: 60px\">"
310 (goto-char (point-min))
311 (while (re-search-forward "&\\(R-\\)?CHISE-HDIC-SYP\\([0-9A-F]+\\);" nil t)
312 (setq code (string-to-int (match-string 2) 16))
313 (setq char (decode-char '===chise-hdic-syp code))
314 (when (setq ret (get-char-attribute char '=hdic-syp-entry-id))
317 "<img alt=\"HDIC-SYP-%s\" src=\"https://viewer.hdic.jp/img/syp/%s\" style=\"
318 vertical-align:middle; width: auto; max-height: 60px\">"
322 (goto-char (point-min))
323 (while (re-search-forward "&\\(R-\\)?CHISE-HDIC-KTB\\([0-9A-F]+\\);" nil t)
324 (setq code (string-to-int (match-string 2) 16))
325 (setq char (decode-char '===chise-hdic-ktb code))
326 (when (setq ret (get-char-attribute char '=hdic-ktb-entry-id))
329 "<img alt=\"HDIC-KTB-%s\" src=\"https://hdic.chise.org/img/ktb/%s.jpg\" style=\"
330 vertical-align:middle; width: auto; max-height: 60px\">"
334 (goto-char (point-min))
335 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?AJ1-\\([0-9]+\\);" nil t)
336 (setq code (string-to-int (match-string 2)))
338 (format "<img alt=\"AJ1-%05d\" src=\"%s/IVD/AdobeJapan1/CID+%d.png\"
339 style=\"vertical-align:middle\">"
341 chise-wiki-legacy-bitmap-glyphs-url
343 www-format-char-img-style)
346 (goto-char (point-min))
347 (while (re-search-forward "&\\(A-\\|o-\\|G-\\|g2-\\|R-\\)?MJ\\([0-9]+\\);" nil t)
348 (setq code (string-to-int (match-string 2)))
350 (format "<img alt=\"MJ%06d\" src=\"https://moji.or.jp/mojikibansearch/img/MJ/MJ%06d.png\"
351 style=\"vertical-align:middle; width: 48px; height: 48px\">"
354 www-format-char-img-style)
357 (goto-char (point-min))
358 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\)?IU[+-]\\([0-9A-F]+\\);" nil t)
359 (setq code (string-to-int (match-string 2) 16))
361 (format "<img alt=\"u%04x\" src=\"%s/u%04x.svg\"
362 style=\"vertical-align:middle; width: 48px; height: 48px\">"
364 chise-wiki-glyphwiki-glyph-image-url
366 www-format-char-img-style)
369 (goto-char (point-min))
370 (while (re-search-forward "&\\(o-\\|G-\\|g2-\\|R-\\)?KU[+-]\\([0-9A-F]+\\);" nil t)
371 (setq code (string-to-int (match-string 2) 16))
373 (format "<img alt=\"u%04x-k\" src=\"%s/u%04x-k.svg\"
374 style=\"vertical-align:middle; width: 48px; height: 48px\">"
376 chise-wiki-glyphwiki-glyph-image-url
378 www-format-char-img-style)
381 (goto-char (point-min))
382 (while (re-search-forward "&A-\\(comp\\|cgn\\)U[+-]\\([0-9A-F]+\\);" nil t)
383 (setq code (string-to-int (match-string 2) 16))
385 (format "<img alt=\"u%04x\" src=\"%s/u%04x.svg\"
386 style=\"vertical-align:middle; width: 48px; height: 48px\">"
388 chise-wiki-glyphwiki-glyph-image-url
390 www-format-char-img-style)
393 (goto-char (point-min))
394 (while (re-search-forward
395 "&\\(A-\\|g2-\\)?U-i\\([0-9]+\\)\\+\\([0-9A-F]+\\);"
397 (setq plane (string-to-int (match-string 2))
398 code (string-to-int (match-string 3) 16))
400 (format "<img alt=\"u%04x-itaiji-%03d\" src=\"%s/u%04x-itaiji-%03d.svg\"
401 style=\"vertical-align:middle; width: 48px; height: 48px\">"
404 chise-wiki-glyphwiki-glyph-image-url
407 www-format-char-img-style)
410 (goto-char (point-min))
411 (while (re-search-forward "&A-IWDSU\\+\\([0-9A-F]+\\);" nil t)
412 (setq code (string-to-int (match-string 1) 16))
414 (format "<img alt=\"A-IWDSU+%04x\" src=\"%s/u%04x.svg\"
415 style=\"vertical-align:middle; width: 48px; height: 48px\">"
417 chise-wiki-glyphwiki-glyph-image-url
419 www-format-char-img-style)
422 (goto-char (point-min))
423 (while (re-search-forward
424 "&\\(A-\\)?CDP-i\\([0-9]+\\)-\\([0-9A-F]+\\);"
426 (setq plane (string-to-int (match-string 2))
427 code (string-to-int (match-string 3) 16))
429 (format "<img alt=\"cdp-%04x-itaiji-%03d\" src=\"%s/cdp-%04x-itaiji-%03d.svg\"
430 style=\"vertical-align:middle; width: 48px; height: 48px\">"
433 chise-wiki-glyphwiki-glyph-image-url
436 www-format-char-img-style)
439 (goto-char (point-min))
440 (while (re-search-forward
441 "&\\(A-\\)?CDP-v\\([0-9]+\\)-\\([0-9A-F]+\\);"
443 (setq plane (string-to-int (match-string 2))
444 code (string-to-int (match-string 3) 16))
446 (format "<img alt=\"cdp-%04x-var-%03d\" src=\"%s/cdp-%04x-var-%03d.svg\"
447 style=\"vertical-align:middle; width: 48px; height: 48px\">"
450 chise-wiki-glyphwiki-glyph-image-url
453 www-format-char-img-style)
456 (goto-char (point-min))
457 (while (re-search-forward
458 "&\\(A-\\|G-\\|g2-\\|R-\\)?M-\\([0-9]+\\);"
460 (setq code (string-to-int (match-string 2)))
462 (format "<img alt=\"dkw-%05d\" src=\"%s/dkw-%05d.svg\"
463 style=\"vertical-align:middle; width: 48px; height: 48px\">"
465 chise-wiki-glyphwiki-glyph-image-url
467 www-format-char-img-style)
470 (goto-char (point-min))
471 (while (re-search-forward "&\\(g2-\\)?U-v\\([0-9]+\\)\\+\\([0-9A-F]+\\);" nil t)
472 (setq plane (string-to-int (match-string 2))
473 code (string-to-int (match-string 3) 16))
475 (format "<img alt=\"u%04x-var-%03d\" src=\"%s/u%04x-var-%03d.svg\"
476 style=\"vertical-align:middle; width: 48px; height: 48px\">"
479 chise-wiki-glyphwiki-glyph-image-url
482 www-format-char-img-style)
485 (goto-char (point-min))
486 (while (re-search-forward "&\\(A-\\|G-\\|R-\\|g2-\\)?GT-\\([0-9]+\\);" nil t)
487 (setq code (string-to-int (match-string 2)))
489 (format "<img alt=\"GT-%05d\" src=\"%s?char=GT-%05d\"
492 chise-wiki-glyph-cgi-url
494 www-format-char-img-style)
497 (goto-char (point-min))
498 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\)?GT-K\\([0-9]+\\);" nil t)
499 (setq code (string-to-int (match-string 2)))
501 (format "<img alt=\"GT-K%05d\" src=\"%s?char=GT-K%05d\"
504 chise-wiki-glyph-cgi-url
506 www-format-char-img-style)
509 (goto-char (point-min))
510 (while (re-search-forward "&B-\\([0-9A-F]+\\);" nil t)
511 (setq code (string-to-int (match-string 1) 16))
513 (format "<img alt=\"B-%04X\" src=\"%s?char=B-%04X\"
516 chise-wiki-glyph-cgi-url
518 www-format-char-img-style)
521 (goto-char (point-min))
522 (while (re-search-forward
523 "&\\(A-\\|G-\\|g2-\\|R-\\)?CDP-\\([0-9A-F]+\\);" nil t)
524 (setq code (string-to-int (match-string 2) 16))
526 (format "<img alt=\"CDP-%04X\" src=\"%s?char=CDP-%04X\"
529 chise-wiki-glyph-cgi-url
531 www-format-char-img-style)
534 (goto-char (point-min))
535 (while (re-search-forward
536 "&\\(I-\\)?HZK\\(0[1-9]\\|1[0-2]\\)-\\([0-9A-F]+\\);" nil t)
537 (setq plane (match-string 2)
538 code (string-to-int (match-string 3) 16))
540 (format "<img alt=\"HZK%s-%04X\" src=\"%s?char=HZK%s-%04X\"
544 chise-wiki-glyph-cgi-url
547 www-format-char-img-style)
550 (goto-char (point-min))
551 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\|R-\\)?RUI6-\\([0-9A-F]+\\);" nil t)
552 (setq code (string-to-int (match-string 2) 16))
554 (format "<img alt=\"RUI6-%04X\" src=\"%s?char=RUI6-%04X\"
555 style=\"vertical-align:middle\">"
557 chise-wiki-glyph-cgi-url
559 www-format-char-img-style)
562 (goto-char (point-min))
563 (while (re-search-forward "&hanaJU\\+\\([0-9A-F]+\\);" nil t)
564 (setq code (string-to-int (match-string 1) 16))
566 (format "<img alt=\"hanaJU+%04X\" src=\"%s?char=hana-JU+%04X\"
567 style=\"vertical-align:middle\">"
569 chise-wiki-glyph-cgi-url
571 www-format-char-img-style)
574 (goto-char (point-min))
575 (while (re-search-forward "&\\(A-\\|G-\\|g2-\\|R-\\)?\\(UU\\+\\|U-\\)\\([0-9A-F]+\\);" nil t)
576 (setq code (string-to-int (match-string 3) 16))
578 (format "<img alt=\"UU+%04X\" src=\"https://www.unicode.org/cgi-bin/refglyph?24-%04X\"
579 style=\"vertical-align:middle\">"
582 www-format-char-img-style)
585 (goto-char (point-min))
586 (while (re-search-forward "&MCS-\\([0-9A-F]+\\);" nil t)
587 (setq code (string-to-int (match-string 1) 16))
588 (setq start (match-beginning 0)
590 (setq char (decode-char 'system-char-id code))
593 (or (www-get-feature-value char '->subsumptive)
594 (www-get-feature-value char '->denotational)))
596 (if (characterp variants)
597 (setq variants (list variants)))
599 (setq ret (www-format-encode-string
600 (char-to-string (car variants))))
601 (string-match "&MCS-\\([0-9A-F]+\\);" ret))
602 (setq variants (cdr variants)))
604 (unless (string-match "&MCS-\\([0-9A-F]+\\);" ret)
606 (delete-region start end)
609 ((setq ret (or (www-get-feature-value char 'ideographic-combination)
610 (www-get-feature-value char 'ideographic-structure)))
615 (if (characterp (setq rret (find-char ch)))
618 (www-format-encode-string
619 (char-to-string ch) without-tags)
620 (www-format-encode-string
621 (format "%S" ch) without-tags)))
625 (delete-region start end)
629 ;; (goto-char (point-min))
630 ;; (while (search-forward ">-" nil t)
631 ;; (replace-match "&GT-" t 'literal))
;; Assign the CSS declaration string kept in `www-format-char-img-style'.
;; The glyph-image `format' calls in `www-format-encode-string' pass this
;; variable as an argument.  This is a plain top-level `setq', so the
;; value is (re)assigned every time the file is loaded.
634 (setq www-format-char-img-style "vertical-align:middle;")
;; decode-url-string (STRING &optional CODING-SYSTEM)
;;
;; Decode percent-escapes ("%XX") in STRING and run the result through
;; `decode-coding-string'.
;;
;; NOTE(review): several lines of this definition are not present in
;; this view (the bindings of `dest' and `i', the form that consumes the
;; parsed byte value, the advance of `i', the coding-system argument and
;; the else branch), so only the visible forms are described.
;;
;; STRING        - text to decode; only handled here when its length is
;;                 greater than 0.
;; CODING-SYSTEM - presumably handed to `decode-coding-string' -- the
;;                 line that would show this is not visible; confirm.
636 (defun decode-url-string (string &optional coding-system)
637 (if (> (length string) 0)
;; Only upper-case hex digits are recognised by this pattern; the search
;; starts at index `i' on every iteration.
640 (while (string-match "%\\([0-9A-F][0-9A-F]\\)" string i)
;; Append the literal text that precedes the escape, followed by a value
;; derived from the two hex digits (parsed in base 16).
641 (setq dest (concat dest
642 (substring string i (match-beginning 0))
645 (string-to-int (match-string 1 string) 16))))
;; After the last escape, append the remaining tail of STRING and decode
;; the accumulated text.
647 (decode-coding-string
648 (concat dest (substring string i))
;; Version string of this IDS-find front end; `www-batch-ids-find'
;; prints it in the page header with `princ'.
651 (defconst www-ids-find-version "0.99.2")
;; File name of the "ideographic-products" file, built with
;; `expand-file-name' from a directory expression that involves
;; `chise-system-db-directory'.
;; NOTE(review): the intermediate lines of that directory expression are
;; not present in this view -- confirm the exact path upstream.
;; `www-batch-ids-find' compares this file with the running executable
;; via `file-newer-than-file-p'.
653 (defvar www-ids-find-ideographic-products-file-name
654 (expand-file-name "ideographic-products"
659 chise-system-db-directory))))
;; URL prefix of the character viewer.  `www-ids-find-format-char' puts
;; it at the start of each link's href, followed by the URI-encoded
;; character.
661 (defvar www-ids-find-char-viewer-url
662 "/est/view/character/")
;; URL prefix of the chise_linkmap service.  `www-ids-find-format-line'
;; appends the character's UCS code in upper-case hexadecimal ("%s%X")
;; to build the "(link map)" link.
664 (defvar www-ids-find-chise-link-map-url-prefix
665 "http://fonts.jp/chise_linkmap/map.cgi?code=")
;; Path of the "tang-chars.udd" file (under the home directory of user
;; "tomo").  `www-ids-find-format-line' refers to it and then searches
;; for a line consisting of the character's UCS code in decimal ("^%d$").
;; NOTE(review): how the file is loaded is not visible in this view.
667 (defvar www-ids-find-tang-chars-file-name
668 "~tomo/projects/chise/ids/www/tang-chars.udd")
;; www-ids-find-format-char (C &optional CODE-DESC)
;;
;; Build an HTML anchor for character C:
;;   href = `www-ids-find-char-viewer-url' + (www-uri-encode-object C)
;;   text = (www-format-encode-string (char-to-string C))
;;
;; NOTE(review): the form that receives the formatted string (original
;; line 671) is not present in this view -- presumably it prints it;
;; confirm upstream.
;; CODE-DESC is not referenced by the visible live code; callers in this
;; file pass the symbol `code-desc' or omit it.
670 (defun www-ids-find-format-char (c &optional code-desc)
672 (format "<a href=\"%s%s\">%s</a>"
673 www-ids-find-char-viewer-url
674 (www-uri-encode-object c)
675 (www-format-encode-string (char-to-string c))))
676 ;; (let ((str (encode-coding-string (format "%c" c) 'utf-8-er))
681 ;; ((string-match "&CB\\([0-9]+\\);" str)
682 ;; (setq code (string-to-int (match-string 1 str)))
683 ;; (insert (format "<a href=\"%s"
684 ;; www-ids-find-char-viewer-url))
686 ;; (insert (format "\"><img alt=\"CB%05d\" src=\"/glyphs/cb-gaiji/%02d/CB%05d.gif\">\n"
687 ;; code (/ code 1000) code))
689 ;; (insert (format "CB%05d</a>" code)))
691 ;; ((string-match "&JC3-\\([0-9A-F]+\\);" str)
692 ;; (setq code (string-to-int (match-string 1 str) 16))
693 ;; (insert (format "<a href=\"%s"
694 ;; www-ids-find-char-viewer-url))
696 ;; (insert (format "\"><img alt=\"JC3-%04X\" src=\"http://kanji.zinbun.kyoto-u.ac.jp/db/CHINA3/Gaiji/%04x.gif\">\n"
699 ;; (insert (format "JC3-%04X</a>" code)))
701 ;; ((string-match "&J\\(78\\|83\\|90\\|SP\\)-\\([0-9A-F]+\\);" str)
702 ;; (setq plane (match-string 1 str)
703 ;; code (string-to-int (match-string 2 str) 16))
704 ;; (insert (format "<a href=\"%s"
705 ;; www-ids-find-char-viewer-url))
707 ;; (insert (format "\"><img alt=\"J%s-%04X\" src=\"/glyphs/JIS-%s/%02d-%02d.gif\">\n"
709 ;; (- (lsh code -8) 32)
710 ;; (- (logand code 255) 32)))
712 ;; (insert (format "J%s-%04X</a>" plane code)))
714 ;; ((string-match "&G\\([01]\\)-\\([0-9A-F]+\\);" str)
715 ;; (setq plane (string-to-int (match-string 1 str))
716 ;; code (string-to-int (match-string 2 str) 16))
717 ;; (insert (format "<a href=\"%s"
718 ;; www-ids-find-char-viewer-url))
720 ;; (insert (format "\"><img alt=\"G%d-%04X\" src=\"/glyphs/GB%d/%02d-%02d.gif\">\n"
722 ;; (- (lsh code -8) 32)
723 ;; (- (logand code 255) 32)))
725 ;; (insert (format "G%d-%04X</a>" plane code)))
727 ;; ((string-match "&C\\([1-7]\\)-\\([0-9A-F]+\\);" str)
728 ;; (setq plane (string-to-int (match-string 1 str))
729 ;; code (string-to-int (match-string 2 str) 16))
730 ;; (insert (format "<a href=\"%s"
731 ;; www-ids-find-char-viewer-url))
733 ;; (insert (format "\"><img alt=\"C%d-%04X\" src=\"/glyphs/CNS%d/%04X.gif\">\n"
734 ;; plane code plane code))
736 ;; (insert (format "C%d-%04X</a>" plane code)))
738 ;; ((string-match "&ZOB-\\([0-9]+\\);" str)
739 ;; (setq code (string-to-int (match-string 1 str)))
740 ;; (insert (format "<a href=\"%s"
741 ;; www-ids-find-char-viewer-url))
743 ;; (insert (format "\"><img alt=\"ZOB-%04d\" src=\"/glyphs/ZOB-1968/%04d.png\">\n"
746 ;; (insert (format "ZOB-%04d</a>" code)))
749 ;; (insert (format "<a href=\"%s"
750 ;; www-ids-find-char-viewer-url))
753 ;; (mapconcat (lambda (c)
754 ;; (if (<= (char-int c) #x7F)
755 ;; (char-to-string c)
756 ;; (format "%%%02X" c)))
762 ;; (goto-char (point-min))
763 ;; (while (search-forward "&" nil t)
764 ;; (replace-match "&" t 'literal))
765 ;; (buffer-string))))
768 (defun www-ids-find-format-line (c is)
770 (princ "<span class=\"entry\">")
771 (www-ids-find-format-char c 'code-desc)
774 (or (if (setq ucs (or (char-ucs c)
775 (encode-char c 'ucs)))
777 " <a href=\"http://www.unicode.org/cgi-bin/GetUnihanData.pl?codepoint=%X\">%s</a>"
779 (cond ((<= ucs #xFFFF)
780 (format "U+%04X" ucs))
782 (format "U-%08X" ucs))))
786 (format " <a href=\"%s%X\">(link map)</a>"
787 www-ids-find-chise-link-map-url-prefix ucs)))
790 (setq ids (ideographic-structure-to-ids is))
793 (princ "<span class=\"ids\">")
795 (www-ids-find-format-char (aref ids i))
801 www-ids-find-tang-chars-file-name)
802 (goto-char (point-min))
803 (re-search-forward (format "^%d$" ucs) nil t)))
805 (format " <a href=\"http://coe21.zinbun.kyoto-u.ac.jp/djvuchar?query=%s\">"
808 (format "%%%02X" (char-int c)))
809 (encode-coding-string (char-to-string c)
812 (princ (encode-coding-string "
\e$B"M
\e(B[
\e$BEbBeBsK\
\e(B]</a>" 'utf-8-jp-er)))
;; www-ids-insert-chars-including-components*
;;   (COMPONENTS &optional IGNORED-CHARS PRODUCTS)
;;
;; Recursive worker that lists the characters found for COMPONENTS: each
;; character not in IGNORED-CHARS is formatted with
;; `www-ids-find-format-line', and the function then calls itself with
;; that character as the new component string.
;;
;; NOTE(review): many lines of this definition are not present in this
;; view (the `let' bindings, the conditions choosing between the three
;; sort variants, the loop header and the surrounding output calls), so
;; only the visible forms are described.
;;
;; COMPONENTS    - passed to `ideograph-find-products'.
;; IGNORED-CHARS - characters to skip; grows by one character on each
;;                 recursive call.
;; PRODUCTS      - result list to use; the visible `setq' computes it
;;                 with `ideograph-find-products', presumably only when
;;                 the caller did not supply it -- confirm.
815 (defun www-ids-insert-chars-including-components* (components
816 &optional ignored-chars products)
818 (setq products (ideograph-find-products components ignored-chars)))
820 (setq len (length products))
;; Sort variant 1: a copy of PRODUCTS ordered by `char-int' only.
824 (sort (copy-list products)
826 (< (char-int a)(char-int b))))
;; Sort variant 2: uses `char-total-strokes' of both characters, with
;; `char-int' comparisons in the visible branches.
829 (sort (copy-list products)
831 (if (setq as (char-total-strokes a))
832 (if (setq bs (char-total-strokes b))
834 (< (char-int a)(char-int b))
837 (< (char-int a)(char-int b)))))
;; Sort variant 3: same shape as variant 2, with `ideograph-char<' in
;; place of the `char-int' comparison.
840 (sort (copy-list products)
842 (if (setq as (char-total-strokes a))
843 (if (setq bs (char-total-strokes b))
845 (ideograph-char< a b)
848 (ideograph-char< a b))))
;; Per-character step: skip ignored characters, emit the entry line,
;; then recurse with the character added to the ignore list.
850 (unless (memq c ignored-chars)
851 (setq is (char-feature c 'ideographic-structure))
853 (www-ids-find-format-line c is)
855 (www-ids-insert-chars-including-components*
856 (char-to-string c) (cons c ignored-chars)))
863 (defun www-ids-insert-chars-including-components (components
864 &optional ignored-chars)
865 (let ((products (ideograph-find-products components ignored-chars))
866 is as bs len ignore-children)
867 (setq len (length products))
869 (setq ignore-children t)
871 (encode-coding-string
872 "<p>
\e$B7k2L$,B?$9$.$k$?$a!":F5"E*8!:w$r>JN,$7$^$7$?!#
\e(B</p>"
876 (www-ids-find-format-char c))
879 (www-ids-insert-chars-including-components* components ignored-chars products)))
880 (dolist (c ignored-chars)
881 (dolist (vc (char-component-variants c))
882 (unless (memq vc ignored-chars)
883 (when (setq is (get-char-attribute vc 'ideographic-structure))
885 (www-ids-find-format-line vc is)
887 (www-ids-insert-chars-including-components*
889 (cons vc ignored-chars)))))))
890 (setq products (ideograph-find-products-with-variants components ignored-chars))
891 (setq len (length products))
893 (setq ignore-children t)
895 (encode-coding-string
896 "<p>
\e$B7k2L$,B?$9$.$k$?$a!"4XO";z$N:F5"E*8!:w$r>JN,$7$^$7$?!#
\e(B</p>"
900 (www-ids-find-format-char c))
901 (dolist (c (sort (copy-tree products)
903 (if (setq as (char-total-strokes a))
904 (if (setq bs (char-total-strokes b))
906 (ideograph-char< a b)
909 (ideograph-char< a b)))))
910 (unless (memq c ignored-chars)
911 (setq is (get-char-attribute c 'ideographic-structure))
913 (www-ids-find-format-line c is)
914 (unless ignore-children
916 (www-ids-insert-chars-including-components*
918 (cons c ignored-chars))))
924 (defun www-batch-ids-find ()
925 (let ((components (car command-line-args-left))
926 (coded-charset-entity-reference-alist
928 '(=cns11643-1 "C1-" 4 X)
929 '(=cns11643-2 "C2-" 4 X)
930 '(=cns11643-3 "C3-" 4 X)
931 '(=cns11643-4 "C4-" 4 X)
932 '(=cns11643-5 "C5-" 4 X)
933 '(=cns11643-6 "C6-" 4 X)
934 '(=cns11643-7 "C7-" 4 X)
936 '(=gb12345 "G1-" 4 X)
937 '(=jis-x0208@1990 "J90-" 4 X)
938 '(=jis-x0212 "JSP-" 4 X)
940 '(=jef-china3 "JC3-" 4 X)
941 '(=jis-x0208@1978 "J78-" 4 X)
942 '(=jis-x0208@1983 "J83-" 4 X)
943 '(=daikanwa "M-" 5 d)
944 coded-charset-entity-reference-alist))
946 (setq command-line-args-left (cdr command-line-args-left))
948 ((stringp components)
949 (if (string-match "^components=" components)
950 (setq components (substring components (match-end 0))))
952 (if (> (length components) 0)
953 (decode-url-string components 'utf-8-er)
957 (setq components nil)
959 (princ "Content-Type: text/html; charset=UTF-8
961 <!DOCTYPE HTML PUBLIC \"-//W3C//DTD HTML 4.01 Transitional//EN\"
962 \"http://www.w3.org/TR/html4/loose.dtd\">
965 <meta name=\"viewport\" content=\"width=device-width, initial-scale=1\">
966 <title>CHISE IDS Find</title>
967 <link href=\"/css/bootstrap-4.5.0.min.css\" rel=\"stylesheet\">
968 <style type=\"text/css\">
970 .entry { font-size: 36px; }
971 .entry a img { height: 36px; }
972 .ids { font-size: 24px; }
973 .ids a img { height: 24px; }
974 img { vertical-align:middle; }
975 a { text-decoration:none; }
977 li { margin: 0 0 -0.2em; }
980 display: inline-block;
982 .tooltip .tooltiptext {
991 <div class=\"jumbotron jumbotron-fluid mb-0\">
992 <h1 class=\"display-4 text-center\">")
993 (princ (encode-coding-string "CHISE IDS
\e$B4A;z8!:w
\e(B" 'utf-8-jp-er))
996 <p class=\"text-center\">Version ")
997 (princ www-ids-find-version)
998 (princ (format-time-string
999 " (Last-modified: %Y-%m-%d %H:%M:%S)</p>"
1002 www-ids-find-ideographic-products-file-name))))
1005 <div class=\"container mt-0 mw-100 d-inline-block align-top bg-dark\">
1007 <div class=\"input-group mb-3 h3 my-4\">
1008 <div class=\"input-group-prepend mw-75 ml-3\">
1009 <form action=\"/ids-find\" method=\"GET\">
1010 <span class=\"input-group-text\" id=\"basic-addon1\">
1012 (princ (encode-coding-string "
\e$BItIJJ8;zNs
\e(B" 'utf-8-jp-er))
1015 <input type=\"text\" class=\"form-control\" aria-describedby=\"basic-addon1\" name=\"components\" size=\"30\" maxlength=\"256\" value=\"")
1016 (if (> (length components) 0)
1017 (princ (encode-coding-string components 'utf-8-er)))
1019 <input class=\"mr-3\" type=\"submit\" value=\"")
1020 (princ (encode-coding-string "
\e$B8!:w3+;O
\e(B" 'utf-8-jp-er))
1027 (unless (file-newer-than-file-p
1028 www-ids-find-ideographic-products-file-name
1029 (locate-file (car command-line-args) exec-path))
1030 (princ (encode-coding-string "<hr>
1032 \e$B8=:_!"%7%9%F%`$N99?7:n6HCf$G$9!#$7$P$i$/$*BT$A$/$@$5$$!#
\e(B
1035 ;; (setq components nil)
1039 (princ "<div class=\"container\">
1041 ;; (map-char-attribute
1043 ;; (when (every (lambda (p)
1044 ;; (ideographic-structure-member p v))
1046 ;; (princ (encode-coding-string
1047 ;; (ids-find-format-line c v)
1052 ;; 'ideographic-structure)
1053 (when (= (length components) 1)
1054 (www-ids-find-format-line (aref components 0)
1055 (char-feature (aref components 0)
1056 'ideographic-structure)))
1057 ;; (dolist (c (ideographic-products-find components))
1058 ;; (setq is (char-feature c 'ideographic-structure))
1059 ;; ;; to avoid problems caused by wrong indexes
1060 ;; (when (every (lambda (c)
1061 ;; (ideographic-structure-member c is))
1063 ;; (www-ids-find-format-line c is)))
1065 (www-ids-insert-chars-including-components components)
1066 ;; (princ "</ul>\n")
1070 (princ (encode-coding-string "<div class=\"container mt-4\">
1071 <div class=\"ml-3\">
1073 \e$B;XDj$7$?ItIJ$rA4$F4^$`4A;z$N0lMw$rI=<($7$^$9!#
\e(B
1076 CHISE
\e$B$GMQ$$$i$l$k<BBV;2>H7A<0!JNc!'
\e(B&M-00256;
\e$B!K$GItIJ$r;XDj$9$k;v$b$G$-$^$9!#
\e(B
1080 (princ (encode-coding-string "
1084 <li><a href=\"http://www.shuiren.org/chuden/toyoshi/syoseki/chise_ids.html\"
1085 >
\e$B!V
\e(BCHISE IDS FIND
\e$B$G4A;z$r8!:w!W
\e(B</a>
\e$B!=
\e(B
\e$B;3ED?r?N$5$s!J
\e(B<a
1086 href=\"http://www.shuiren.org/\">
\e$B?g?MDb
\e(B</a>
\e$B!K$K$h$k2r@b
\e(B
1089 <li><a href=\"http://www.karitsu.org/tools/firefox_plugin.htm\"
1090 >Firefox
\e$BMQ
\e(B plugin</a> by
\e$B=);3M[0lO:$5$s!J
\e(B<a href=\"http://www.karitsu.org/\"
1091 >
\e$B2aN)c7
\e(B</a>
\e$B!K
\e(B
1094 <li><a href=\"http://git.chise.org/gitweb/?p=chise/ids.git;a=blob;f=www/www-ids-find.el\"
1095 >www-ids-find.el (source file (Emacs Lisp part))
1096 <li><a href=\"http://www.chise.org/ids/\"
1097 >
\e$B!V
\e(BCHISE
\e$B4A;z9=B$>pJs%G!<%?%Y!<%9!W
\e(B</a>
1098 <li><a href=\"http://fonts.jp/chise_linkmap/\"
1099 >
\e$B!V
\e(Bchise_linkmap : CHISE
\e$B4A;zO"4D?^!W
\e(B</a> by
\e$B>eCO9(0l$5$s
\e(B
1100 <li><a href=\"http://www.chise.org/\"
1104 <li><a href=\"http://coe21.zinbun.kyoto-u.ac.jp/djvuchar\"
1105 >
\e$B!VBsK\J8;z%G!<%?%Y!<%9!W
\e(B</a> by
1106 <a href=\"http://coe21.zinbun.kyoto-u.ac.jp/\"
1107 >
\e$B5~ETBg3X
\e(B21
\e$B@$5*
\e(BCOE
\e$B!VEl%"%8%"@$3&$N?MJ8>pJs3X8&5f650i5rE@!W
\e(B</a>
1108 <li><a href=\"http://www.unicode.org/\"
1118 <div class=\"container\">
1120 (princ "<div class=\"ml-0\">
1121 Copyright (C) 2005, 2006, 2007, 2008, 2009, 2010, 2015, 2016, 2017, 2020 <a href=\"http://kanji.zinbun.kyoto-u.ac.jp/~tomo/\"
1122 >MORIOKA Tomohiko</a></div>")
1126 href=\"http://www.chise.org/xemacs/\"
1127 >XEmacs CHISE</a> %s.</div>"
1128 (encode-coding-string xemacs-chise-version 'utf-8-jp-er)))