1 ;;; chise-tex.el --- Coding-system based chise2otf like tool
3 ;; Copyright (C) 2004,2005,2006 MORIOKA Tomohiko
5 ;; Author: MORIOKA Tomohiko <tomo@kanji.zinbun.kyoto-u.ac.jp>
6 ;; Keywords: OTF package, pTeX, CHISE, Multiscript, Multilingual
8 ;; This file is a part of Omega/CHISE.
10 ;; This program is free software; you can redistribute it and/or
11 ;; modify it under the terms of the GNU General Public License as
12 ;; published by the Free Software Foundation; either version 2, or (at
13 ;; your option) any later version.
15 ;; This program is distributed in the hope that it will be useful, but
16 ;; WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
18 ;; General Public License for more details.
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with this program; see the file COPYING. If not, write to
22 ;; the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
23 ;; Boston, MA 02111-1307, USA.
;; Table of coded charsets that have a TeX macro representation.
;; Every entry has four elements: (CHARSET MACRO-NAME NUMBER SYMBOL).
;;   - CHARSET (the car) is what the encoders in this file pass to
;;     encode-char and what the decoder passes to decode-char.
;;   - MACRO-NAME (nth 1) is compared by the decoder against the macro
;;     name found in the buffer.
;;   - SYMBOL (nth 3) is tested against X by the decoder.
;; NOTE(review): NUMBER and SYMBOL presumably supply the field width and
;; conversion letter for the nested format template used by the
;; encoders (giving e.g. %04X) -- the format arguments are not visible
;; in this excerpt, so confirm before relying on that.
;; Both encoders walk the list from the front, so entry order may matter.
27 (defvar chise-tex-coded-charset-expression-alist
28 '((=ucs-bmp@gb "UCSgb" 4 X)
29 (=ucs-bmp@jis "UCSjis" 4 X)
30 (=ucs-bmp@ks "UCSks" 4 X)
31 (=gt-pj-1 "GTpjA" 4 X)
32 (=gt-pj-2 "GTpjB" 4 X)
33 (=gt-pj-3 "GTpjC" 4 X)
34 (=gt-pj-4 "GTpjD" 4 X)
35 (=gt-pj-5 "GTpjE" 4 X)
36 (=gt-pj-6 "GTpjF" 4 X)
37 (=gt-pj-7 "GTpjG" 4 X)
38 (=gt-pj-8 "GTpjH" 4 X)
39 (=gt-pj-9 "GTpjI" 4 X)
40 (=gt-pj-10 "GTpjJ" 4 X)
41 (=gt-pj-11 "GTpjK" 4 X)
42 (=ucs-bmp@cns "UCScns" 4 X)))
;; Encoder named as the pre-write-conversion of the iso-2022-jp-tex-gb
;; coding system later in this file.  It narrows the buffer to
;; START..END and walks the region.  The visible branches insert TeX
;; macros:
;;   - a character from a small literal set -> \UCSjis{XXXX}, using the
;;     code point obtained from =ucs@jis
;;   - a character encodable in =jis-x0208-1983 -> handling not visible
;;   - a character encodable in =ks-x1001 -> \UCSks{XXXX}
;;   - otherwise -> a macro built from an entry of
;;     chise-tex-coded-charset-expression-alist
;; NOTE(review): several lines of this definition (including its end)
;; are missing from the excerpt under review; the notes here describe
;; only what is visible.
44 (defun chise-tex-encode-region-for-gb (start end)
48 (narrow-to-region start end)
50 (let (chr ret rest spec)
;; Skip characters in the range \x00-\xFF.  The remaining loop
;; conditions are not visible in this excerpt.
51 (while (and (skip-chars-forward "\x00-\xFF")
53 (setq chr (char-after))
54 (cond ((memq chr '(?
\e$(O#@
\e(B))
56 (insert (format "\\UCSjis{%04X}"
57 (encode-char chr '=ucs@jis)))
59 ((and (setq ret (encode-char chr '=jis-x0208-1983))
62 ;; ((setq ret (encode-char chr '=jis-x0208-1990))
64 ;; (insert (decode-char '=jis-x0208-1983 ret)))
65 ((and (encode-char chr '=ks-x1001)
66 (setq ret (or (encode-char chr '=ucs@ks)
69 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
71 (insert (format "\\UCSks{%04X}" ret)))
;; Fallback: walk the charset table, trying to encode chr in the
;; charset of each entry.  NOTE(review): the branch taken on a
;; successful encode is not visible; presumably it ends the walk.
73 (setq rest chise-tex-coded-charset-expression-alist)
74 (while (setq spec (car rest))
75 (if (setq ret (encode-char chr (car spec)))
77 (setq rest (cdr rest))))
79 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
;; The inner format builds a template of the form \NAME{%0<n><c>};
;; the outer format then fills it in.  Arguments are not visible here.
81 (insert (format (format "\\%s{%%0%d%s}"
;; Encoder named as the pre-write-conversion of the iso-2022-jp-tex-jis
;; coding system later in this file.  It narrows the buffer to
;; START..END and walks the region.  The visible cond branches, in
;; order:
;;   - encodable in =jis-x0208-1983 -> action not visible
;;   - has a =decomposition feature whose second element is found in a
;;     modifier alist (not visible), and is not U+0451
;;       -> \MACRO{BASE}, with MACRO from the alist entry and BASE the
;;          first element of the decomposition
;;   - encodable in =jis-x0213-1-2000 or =jis-x0213-2-2000, with a code
;;     point in =ucs@jis/2000 or =ucs@jis/fw -> \UCSjis{XXXX}
;;   - encodable in =ks-x1001 -> \UCSks{XXXX}
;;   - encodable in =ucs-hangul -> \UCSks{XXXX}
;;   - two branches whose tests are not visible -> \textbullet{} and
;;     \UCSjis{0294}
;;   - encodable in =ucs@jp, with a gb-domain representative encodable
;;     in =ucs@gb -> \UCSgb{XXXX}
;;   - otherwise -> a macro built from an entry of
;;     chise-tex-coded-charset-expression-alist
;; NOTE(review): many lines of this definition are missing from the
;; excerpt under review; in particular no deletion of the original
;; character is visible, so confirm how each branch consumes chr.
89 (defun chise-tex-encode-region-for-jis (start end)
93 (narrow-to-region start end)
95 (let (chr ret rest spec modifier)
;; Skip characters in the range \x00-\x7F.  The remaining loop
;; conditions are not visible in this excerpt.
96 (while (and (skip-chars-forward "\x00-\x7F")
98 (setq chr (char-after))
99 (cond ((encode-char chr '=jis-x0208-1983)
101 ;; ((setq ret (encode-char chr '=jis-x0208-1990))
103 ;; (insert (decode-char '=jis-x0208-1983 ret)))
104 ((and (not (eq (char-ucs chr) #x0451))
105 (setq ret (char-feature chr '=decomposition))
106 (setq modifier (assq (nth 1 ret)
119 (insert (format "\\%s{%c}" (cdr modifier) (car ret))))
120 ((and (or (encode-char chr '=jis-x0213-1-2000)
121 (encode-char chr '=jis-x0213-2-2000))
122 (setq ret (or (encode-char chr '=ucs@jis/2000)
123 (encode-char chr '=ucs@jis/fw))))
125 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
127 (insert (format "\\UCSjis{%04X}" ret)))
128 ((and (encode-char chr '=ks-x1001)
129 (setq ret (or (encode-char chr '=ucs@ks)
132 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
134 (insert (format "\\UCSks{%04X}" ret)))
135 ((setq ret (encode-char chr '=ucs-hangul))
137 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
139 (insert (format "\\UCSks{%04X}" ret)))
142 (insert "\\textbullet{}"))
145 (insert "\\UCSjis{0294}"))
146 ((and (encode-char chr '=ucs@jp)
147 (setq ret (char-representative-of-domain chr 'gb))
148 (setq ret (encode-char ret '=ucs@gb)))
150 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
152 (insert (format "\\UCSgb{%04X}" ret)))
;; Fallback: walk the charset table, trying to encode chr in the
;; charset of each entry.  NOTE(review): the branch taken on a
;; successful encode is not visible; presumably it ends the walk.
154 (setq rest chise-tex-coded-charset-expression-alist)
155 (while (setq spec (car rest))
156 (if (setq ret (encode-char chr (car spec)))
158 (setq rest (cdr rest))))
160 ;; (if (eq (char-before) ?
\e$B!T
\e(B)
;; The inner format builds a template of the form \NAME{%0<n><c>};
;; the outer format then fills it in.  Arguments are not visible here.
162 (insert (format (format "\\%s{%%0%d%s}"
168 (forward-char))))))))
;; Decoder named as the post-read-conversion of both coding systems
;; defined later in this file.  It narrows the buffer to START..END and
;; searches for text of the form \NAME{HEX}, where NAME is letters and
;; digits and HEX is hexadecimal digits.  For each match it looks up
;; the entry of chise-tex-coded-charset-expression-alist whose macro
;; name (nth 1) equals NAME, calls decode-char with that entry's
;; charset, and deletes the matched text.
;; NOTE(review): several lines are missing from the excerpt under
;; review, including how the lookup loop stops, how the code string is
;; converted to a number, and what is inserted after the deletion.
170 (defun chise-tex-decode-region (start end)
174 (narrow-to-region start end)
176 (let (macro code ret me rest spec)
;; Group 1 is the macro name, group 2 the code digits.
177 (while (re-search-forward "\\\\\\([a-zA-Z0-9]+\\){\\([0-9A-Fa-f]+\\)}"
179 (setq macro (match-string 1)
180 code (match-string 2)
;; Find the table entry whose macro name matches.
183 (setq rest chise-tex-coded-charset-expression-alist)
184 (while (setq spec (car rest))
185 (if (string= (nth 1 spec) macro)
187 (setq rest (cdr rest))))
188 (setq ret (decode-char (car spec)
;; Entries whose fourth element is X are handled specially here;
;; presumably X means the code is hexadecimal -- TODO confirm, since
;; both branches of this test are elided.
191 (if (eq (nth 3 spec) 'X)
194 (delete-region (match-beginning 0)(match-end 0))
;; Arguments defining the iso-2022-jp-tex-gb coding system (type
;; iso2022).  It uses chise-tex-encode-region-for-gb as its
;; pre-write-conversion and chise-tex-decode-region as its
;; post-read-conversion.
;; NOTE(review): the opening of this form and some of its properties
;; are missing from the excerpt under review.
199 'iso-2022-jp-tex-gb 'iso2022
200 "ISO-2022-JP with TeX representation for GB fonts."
204 input-charset-conversion ((latin-jisx0201 ascii)
205 (japanese-jisx0208-1978 japanese-jisx0208))
206 pre-write-conversion chise-tex-encode-region-for-gb
207 post-read-conversion chise-tex-decode-region
208 mnemonic "pTeX(GB)/7bit"
;; Arguments defining the iso-2022-jp-tex-jis coding system (type
;; iso2022).  It uses chise-tex-encode-region-for-jis as its
;; pre-write-conversion and chise-tex-decode-region as its
;; post-read-conversion.
;; NOTE(review): the opening of this form and some of its properties
;; (including the rest of ccs-priority-list) are missing from the
;; excerpt under review.
212 'iso-2022-jp-tex-jis 'iso2022
213 "ISO-2022-JP with TeX representation for JIS fonts."
217 ccs-priority-list (ascii
218 =jis-x0208@1983 =jis-x0208@1978
220 pre-write-conversion chise-tex-encode-region-for-jis
221 post-read-conversion chise-tex-decode-region
222 mnemonic "pTeX(JIS)/7bit"
231 ;;; chise-tex.el ends here