1 ;;; mule-coding.el --- Coding-system functions for Mule.
3 ;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN.
4 ;; Licensed to the Free Software Foundation.
5 ;; Copyright (C) 1995 Amdahl Corporation.
6 ;; Copyright (C) 1995 Sun Microsystems.
7 ;; Copyright (C) 1997,1999,2002,2003,2004 MORIOKA Tomohiko
9 ;; This file is part of XEmacs.
11 ;; XEmacs is free software; you can redistribute it and/or modify it
12 ;; under the terms of the GNU General Public License as published by
13 ;; the Free Software Foundation; either version 2, or (at your option)
16 ;; XEmacs is distributed in the hope that it will be useful, but
17 ;; WITHOUT ANY WARRANTY; without even the implied warranty of
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
19 ;; General Public License for more details.
21 ;; You should have received a copy of the GNU General Public License
22 ;; along with XEmacs; see the file COPYING. If not, write to the
23 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
24 ;; Boston, MA 02111-1307, USA.
28 ;;; split off of mule.el and mostly moved to coding.el
32 (defun coding-system-force-on-output (coding-system register)
33 "Return the 'force-on-output property of CODING-SYSTEM for the specified REGISTER."
34 (check-type register integer)
35 (coding-system-property
38 (0 'force-g0-on-output)
39 (1 'force-g1-on-output)
40 (2 'force-g2-on-output)
41 (3 'force-g3-on-output)
42 (t (signal 'args-out-of-range (list register 0 3))))))
44 (defun coding-system-short (coding-system)
45 "Return the 'short property of CODING-SYSTEM."
46 (coding-system-property coding-system 'short))
48 (defun coding-system-no-ascii-eol (coding-system)
49 "Return the 'no-ascii-eol property of CODING-SYSTEM."
50 (coding-system-property coding-system 'no-ascii-eol))
52 (defun coding-system-no-ascii-cntl (coding-system)
53 "Return the 'no-ascii-cntl property of CODING-SYSTEM."
54 (coding-system-property coding-system 'no-ascii-cntl))
56 (defun coding-system-seven (coding-system)
57 "Return the 'seven property of CODING-SYSTEM."
58 (coding-system-property coding-system 'seven))
60 (defun coding-system-lock-shift (coding-system)
61 "Return the 'lock-shift property of CODING-SYSTEM."
62 (coding-system-property coding-system 'lock-shift))
64 ;;(defun coding-system-use-japanese-jisx0201-roman (coding-system)
65 ;; "Return the 'use-japanese-jisx0201-roman property of CODING-SYSTEM."
66 ;; (coding-system-property coding-system 'use-japanese-jisx0201-roman))
68 ;;(defun coding-system-use-japanese-jisx0208-1978 (coding-system)
69 ;; "Return the 'use-japanese-jisx0208-1978 property of CODING-SYSTEM."
70 ;; (coding-system-property coding-system 'use-japanese-jisx0208-2978))
72 (defun coding-system-no-iso6429 (coding-system)
73 "Return the 'no-iso6429 property of CODING-SYSTEM."
74 (coding-system-property coding-system 'no-iso6429))
76 (defun coding-system-ccl-encode (coding-system)
77 "Return the CCL 'encode property of CODING-SYSTEM."
78 (coding-system-property coding-system 'encode))
80 (defun coding-system-ccl-decode (coding-system)
81 "Return the CCL 'decode property of CODING-SYSTEM."
82 (coding-system-property coding-system 'decode))
85 ;;;; Definitions of predefined coding systems
89 "Coding-system used in X as Compound Text Encoding."
91 charset-g1 latin-iso8859-1
95 ;;; iso-8859-1 and ctext are aliases.
97 ;; (copy-coding-system 'ctext 'iso-8859-1)
99 'iso-8859-1 'no-conversion
100 "Coding-system used in X as Compound Text Encoding."
101 '(eol-type nil mnemonic "Noconv"))
104 'iso-2022-8bit-ss2 'iso2022
105 "ISO-2022 coding system using SS2 for 96-charset in 8-bit code."
107 charset-g1 latin-iso8859-1
108 charset-g2 t ;; unspecified but can be used later.
114 'iso-2022-7bit-ss2 'iso2022
115 "ISO-2022 coding system using SS2 for 96-charset in 7-bit code."
117 charset-g2 t ;; unspecified but can be used later.
123 ;; (copy-coding-system 'iso-2022-7bit-ss2 'iso-2022-jp-2)
125 'iso-2022-jp-2 'iso2022
126 "ISO-2022 coding system using SS2 for 96-charset in 7-bit code."
128 charset-g2 t ;; unspecified but can be used later.
135 'iso-2022-7bit 'iso2022
136 "ISO 2022 based 7-bit encoding using only G0"
142 ;; compatibility for old XEmacsen
143 (copy-coding-system 'iso-2022-7bit 'iso-2022-7)
147 "ISO-2022 eight-bit coding system. No single-shift or locking-shift."
149 charset-g1 latin-iso8859-1
155 'escape-quoted 'iso2022
156 "ISO-2022 eight-bit coding system with escape quoting; used for .ELC files."
158 charset-g1 latin-iso8859-1
165 'iso-2022-lock 'iso2022
166 "ISO-2022 coding system using Locking-Shift for 96-charset."
168 charset-g1 t ;; unspecified but can be used later.
174 (when (featurep 'utf-2000)
175 (setq coded-charset-entity-reference-alist
176 '(((ideograph-gt . isolated) "I-GT-" 5 d)
177 ( ideograph-gt "GT-" 5 d)
178 ((=ruimoku-v6 . isolated) "I-RUI6-" 4 X)
179 ( =ruimoku-v6 "RUI6-" 4 X)
180 ((chinese-big5-cdp . isolated) "I-CDP-" 4 X)
181 ( chinese-big5-cdp "CDP-" 4 X)
182 ((ideograph-daikanwa . isolated) "I-M-" 5 d)
183 ( ideograph-daikanwa "M-" 5 d)
184 ((ideograph-gt-k . isolated) "I-GT-K" 5 d)
185 ( ideograph-gt-k "GT-K" 5 d)
186 ((ideograph-cbeta . isolated) "I-CB" 5 d)
187 ( ideograph-cbeta "CB" 5 d)
188 ((ideograph-hanziku-1 . isolated) "I-HZK01-" 4 X)
189 ( ideograph-hanziku-1 "HZK01-" 4 X)
190 ((ideograph-hanziku-2 . isolated) "I-HZK02-" 4 X)
191 ( ideograph-hanziku-2 "HZK02-" 4 X)
192 ((ideograph-hanziku-1 . isolated) "I-HZK1-" 4 X)
193 ( ideograph-hanziku-1 "HZK1-" 4 X)
194 ((ideograph-hanziku-2 . isolated) "I-HZK2-" 4 X)
195 ( ideograph-hanziku-2 "HZK2-" 4 X)
196 ((japanese-jisx0208-1990 . isolated) "I-J90-" 4 X)
197 ( japanese-jisx0208-1990 "J90-" 4 X)
198 ((japanese-jisx0208 . isolated) "I-J83-" 4 X)
199 ( japanese-jisx0208 "J83-" 4 X)
200 ((japanese-jisx0213-1 . isolated) "I-JX1-" 4 X)
201 ( japanese-jisx0213-1 "JX1-" 4 X)
202 ((japanese-jisx0213-2 . isolated) "I-JX2-" 4 X)
203 ( japanese-jisx0213-2 "JX2-" 4 X)
204 ((japanese-jisx0212 . isolated) "I-JSP-" 4 X)
205 ( japanese-jisx0212 "JSP-" 4 X)
206 ((japanese-jisx0208-1978 . isolated) "I-J78-" 4 X)
207 ( japanese-jisx0208-1978 "J78-" 4 X)
208 ((chinese-cns11643-1 . isolated) "I-C1-" 4 X)
209 ( chinese-cns11643-1 "C1-" 4 X)
210 ((chinese-cns11643-2 . isolated) "I-C2-" 4 X)
211 ( chinese-cns11643-2 "C2-" 4 X)
212 ((chinese-cns11643-3 . isolated) "I-C3-" 4 X)
213 ( chinese-cns11643-3 "C3-" 4 X)
214 ((chinese-cns11643-4 . isolated) "I-C4-" 4 X)
215 ( chinese-cns11643-4 "C4-" 4 X)
216 ((chinese-cns11643-5 . isolated) "I-C5-" 4 X)
217 ( chinese-cns11643-5 "C5-" 4 X)
218 ((chinese-cns11643-6 . isolated) "I-C6-" 4 X)
219 ( chinese-cns11643-6 "C6-" 4 X)
220 ((chinese-cns11643-7 . isolated) "I-C7-" 4 X)
221 ( chinese-cns11643-7 "C7-" 4 X)
222 ((korean-ksc5601 . isolated) "I-K0-" 4 X)
223 ( korean-ksc5601 "K0-" 4 X)
224 ( china3-jef "JC3-" 4 X)
225 ( chinese-big5 "B-" 4 X)
226 ( chinese-big5 "C0-" 4 X)
231 "Coding-system of UTF-8 with entity-reference."
232 '(mnemonic "MTF8r" use-entity-reference t))
236 "Coding-system of UTF-8 using GB mapping."
244 "Coding-system of UTF-8 using GB mapping with entity-reference."
249 use-entity-reference t))
253 "Coding-system of UTF-8 using CNS mapping."
261 "Coding-system of UTF-8 using CNS mapping with entity-reference."
266 use-entity-reference t))
270 "Coding-system of UTF-8 using Big5 mapping."
273 charset-g1 =>ucs-big5
277 'utf-8-big5-er 'utf-8
278 "Coding-system of UTF-8 using Big5 mapping with entity-reference."
281 charset-g1 =>ucs-big5
283 use-entity-reference t))
287 "Coding-system of UTF-8 using JIS mapping."
289 charset-g0 =ucs@jis-2000
295 "Coding-system of UTF-8 using JIS mapping with entity-reference."
297 charset-g0 =ucs@jis-2000
300 use-entity-reference t))
304 "Coding-system of UTF-8 for common glyphs used in Japan."
312 "Coding-system of UTF-8 using =ucs@jp mapping with entity-reference."
317 use-entity-reference t))
321 "Coding-system of UTF-8 using KS mapping."
329 "Coding-system of UTF-8 using KS mapping with entity-reference."
334 use-entity-reference t))
336 (define-coding-system-alias 'utf-8 'utf-8-mcs)
337 (define-coding-system-alias 'utf-8-er 'utf-8-mcs-er)
341 'euc-jisx0213 'iso2022
342 "Coding-system of Japanese EUC based on JIS X 0213."
344 charset-g1 japanese-jisx0213-1
345 charset-g2 katakana-jisx0201
346 charset-g3 japanese-jisx0213-2
348 mnemonic "Ja/EUC0213"
351 ;; initialize the coding categories to something semi-reasonable
352 ;; so that the remaining Lisp files can contain extended characters.
353 ;; (They will be in ISO-7 format)
354 ;; #### This list needs to be synched with the ones in mule-cmds.el.
356 (if (featurep 'utf-2000)
357 (set-coding-priority-list '(iso-7
367 (set-coding-priority-list '(iso-7
379 (set-coding-category-system 'iso-7 'iso-2022-7)
380 (set-coding-category-system 'iso-8-designate 'ctext)
381 (set-coding-category-system 'iso-8-1 'ctext)
382 (set-coding-category-system 'iso-lock-shift 'iso-2022-lock)
383 (set-coding-category-system 'no-conversion 'no-conversion)
385 (setq-default buffer-file-coding-system 'iso-2022-8)
387 ;;; mule-coding.el ends here