1 ;;; egg-cnv.el --- Conversion Backend in Egg Input Method Architecture
3 ;; Copyright (C) 1997, 1998 Mule Project,
4 ;; Powered by Electrotechnical Laboratory, JAPAN.
5 ;; Project Leader: Satoru Tomura <tomura@etl.go.jp>
7 ;; Author: NIIBE Yutaka <gniibe@mri.co.jp>
8 ;; KATAYAMA Yoshio <kate@pfu.co.jp>
9 ;; Maintainer: NIIBE Yutaka <gniibe@mri.co.jp>
10 ;; Keywords: mule, multilingual, input method
12 ;; This file is part of EGG.
14 ;; EGG is free software; you can redistribute it and/or modify
15 ;; it under the terms of the GNU General Public License as published by
16 ;; the Free Software Foundation; either version 2, or (at your option)
19 ;; EGG is distributed in the hope that it will be useful,
20 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
21 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
22 ;; GNU General Public License for more details.
24 ;; You should have received a copy of the GNU General Public License
25 ;; along with GNU Emacs; see the file COPYING. If not, write to the
26 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
27 ;; Boston, MA 02111-1307, USA.
;; Language tag of the text currently being converted.  It is declared
;; without an initial value, tagged `permanent-local', and made
;; automatically buffer-local.
(defvar egg-current-language)
(put 'egg-current-language 'permanent-local t)
(make-variable-buffer-local 'egg-current-language)
(defsubst egg-bunsetsu-info ()
  "Return the text property name under which bunsetsu info is stored.
The property used is `intangible'."
  (quote intangible))
;; Read the bunsetsu info stored at position P of OBJECT under the
;; property named by `egg-bunsetsu-info' (i.e. `intangible').
;; The visible code also reloads `egg-conversion-backend' and
;; `egg-current-language' from the `egg-backend' and `egg-lang'
;; properties found at the same position.
42 (defun egg-get-bunsetsu-info (p &optional object)
43 (let ((bunsetsu-info (get-text-property p (egg-bunsetsu-info) object)))
45 (setq egg-conversion-backend (get-text-property p 'egg-backend object)
46 egg-current-language (get-text-property p 'egg-lang object)))
;; Fallback backend vector, installed by `egg-set-current-backend' when
;; no backend is registered for a language.  The generic `egg-...'
;; dispatch functions index into a backend vector by slot number
;; (0 = init, 1 = start conversion, ..., 10 = end conversion).
;; NOTE(review): the last element looks like the finalizer that
;; `egg-set-conversion-backend' reads with (1- (length backend)) -- confirm.
50 (defconst egg-conversion-backend-other-languages
51 [ egg-init-other-languages
53 egg-start-conversion-other-languages
54 egg-get-bunsetsu-converted-other-languages
55 egg-get-bunsetsu-source-other-languages
56 egg-list-candidates-other-languages
57 egg-get-number-of-candidates-other-languages
58 egg-get-current-candidate-number-other-languages
59 egg-get-all-candidates-other-languages
60 egg-decide-candidate-other-languages
61 egg-change-bunsetsu-length-other-languages
62 egg-end-conversion-other-languages
65 egg-fini-other-languages
;; Fallback backend, slot 0: initialization entry, reached through
;; `egg-initialize-backend'.  Takes no arguments.
68 (defun egg-init-other-languages ()
;; Fallback backend, slot 1: start converting YOMI-STRING for LANGUAGE.
;; The visible code first makes the fallback vector the current backend.
71 (defun egg-start-conversion-other-languages (yomi-string language)
72 (setq egg-conversion-backend egg-conversion-backend-other-languages)
;; Fallback backend, slot 2: counterpart of `egg-get-bunsetsu-converted'.
74 (defun egg-get-bunsetsu-converted-other-languages (bunsetsu-info)
;; Fallback backend, slot 3: counterpart of `egg-get-bunsetsu-source'.
76 (defun egg-get-bunsetsu-source-other-languages (bunsetsu-info)
;; Fallback backend, slot 4: counterpart of `egg-list-candidates'.
78 (defun egg-list-candidates-other-languages (bunsetsu-info prev-bunsetsu-info)
;; Fallback backend, slot 5: counterpart of `egg-get-number-of-candidates'.
80 (defun egg-get-number-of-candidates-other-languages (bunsetsu-info)
;; Fallback backend, slot 6: counterpart of
;; `egg-get-current-candidate-number'.
82 (defun egg-get-current-candidate-number-other-languages (bunsetsu-info)
;; Fallback backend, slot 7: counterpart of `egg-get-all-candidates'.
84 (defun egg-get-all-candidates-other-languages (bunsetsu-info)
;; Fallback backend, slot 8: counterpart of `egg-decide-candidate'.
86 (defun egg-decide-candidate-other-languages (bunsetsu-info candidate-pos)
(defun egg-change-bunsetsu-length-other-languages (b0 b1 b2 len)
  "Re-split the text of B1 followed by B2 so the first part has LEN elements.
B1 and B2 are concatenated and stripped of text properties.  When LEN
covers the whole concatenation a one-element list holding that string
is returned; otherwise a two-element list (HEAD TAIL) is returned with
HEAD being the first LEN elements.  B0 is accepted for interface
compatibility with other backends and is not used here."
  (let ((s (concat b1 b2)))
    (set-text-properties 0 (length s) nil s)
    (if (= len (length s))
        ;; Everything fits in one bunsetsu: do not emit an empty tail.
        (list s)
      (list (substring s 0 len) (substring s len)))))
;; Fallback backend, slot 10: counterpart of `egg-end-conversion'.
94 (defun egg-end-conversion-other-languages (bunsetsu-info-list abort)
;; Fallback backend, last slot: takes LANGUAGE.
;; NOTE(review): presumably the finalizer invoked from
;; `egg-finalize-backend' -- confirm.
96 (defun egg-fini-other-languages (language)
;; Backend bookkeeping.
;;   `egg-conversion-backend-alist'  maps a language to its backend vector.
;;   `egg-conversion-backend'        is the backend vector currently in use.
;;   `egg-finalize-backend-alist'    collects finalizer entries (global).
;; The first two become buffer-local when set.
(defvar egg-conversion-backend-alist nil)
(defvar egg-conversion-backend nil)
(defvar egg-finalize-backend-alist nil)
(mapc 'make-variable-buffer-local
      '(egg-conversion-backend-alist egg-conversion-backend))
(defun egg-set-current-backend (language)
  "Make the backend registered for LANGUAGE the current one.
The backend is looked up in `egg-conversion-backend-alist'; when there
is none, `egg-conversion-backend-other-languages' is used instead."
  (let ((entry (assq language egg-conversion-backend-alist)))
    (setq egg-conversion-backend (cdr entry)))
  (unless egg-conversion-backend
    (setq egg-conversion-backend egg-conversion-backend-other-languages)))
(defun egg-initialize-backend (language)
  "Select the backend for LANGUAGE and call its slot-0 function.
The slot-0 function is called with no arguments."
  (egg-set-current-backend language)
  (let ((initializer (aref egg-conversion-backend 0)))
    (funcall initializer)))
(defun egg-start-conversion (yomi-string language)
  "Select the backend for LANGUAGE and start converting YOMI-STRING.
Calls slot 1 of the selected backend with YOMI-STRING and LANGUAGE and
returns whatever that function returns."
  (egg-set-current-backend language)
  (let ((starter (aref egg-conversion-backend 1)))
    (funcall starter yomi-string language)))
(defun egg-get-bunsetsu-converted (bunsetsu-info)
  "Call slot 2 of the current backend with BUNSETSU-INFO.
Returns the backend's result unchanged."
  (let ((backend-function (aref egg-conversion-backend 2)))
    (funcall backend-function bunsetsu-info)))
(defun egg-get-bunsetsu-source (bunsetsu-info)
  "Call slot 3 of the current backend with BUNSETSU-INFO.
Returns the backend's result unchanged."
  (let ((backend-function (aref egg-conversion-backend 3)))
    (funcall backend-function bunsetsu-info)))
(defun egg-list-candidates (bunsetsu-info prev-bunsetsu-info)
  "Call slot 4 of the current backend.
The backend function receives BUNSETSU-INFO and PREV-BUNSETSU-INFO, and
its result is returned unchanged."
  (let ((backend-function (aref egg-conversion-backend 4)))
    (funcall backend-function bunsetsu-info prev-bunsetsu-info)))
(defun egg-get-number-of-candidates (bunsetsu-info)
  "Call slot 5 of the current backend with BUNSETSU-INFO.
Returns the backend's result unchanged."
  (let ((backend-function (aref egg-conversion-backend 5)))
    (funcall backend-function bunsetsu-info)))
(defun egg-get-current-candidate-number (bunsetsu-info)
  "Call slot 6 of the current backend with BUNSETSU-INFO.
Returns the backend's result unchanged."
  (let ((backend-function (aref egg-conversion-backend 6)))
    (funcall backend-function bunsetsu-info)))
(defun egg-get-all-candidates (bunsetsu-info)
  "Call slot 7 of the current backend with BUNSETSU-INFO.
Returns the backend's result unchanged."
  (let ((backend-function (aref egg-conversion-backend 7)))
    (funcall backend-function bunsetsu-info)))
(defun egg-decide-candidate (bunsetsu-info candidate-pos)
  "Call slot 8 of the current backend.
The backend function receives BUNSETSU-INFO and CANDIDATE-POS, and its
result is returned unchanged."
  (let ((backend-function (aref egg-conversion-backend 8)))
    (funcall backend-function bunsetsu-info candidate-pos)))
(defun egg-change-bunsetsu-length (b0 b1 b2 len)
  "Call slot 9 of the current backend with B0, B1, B2 and LEN.
Returns the backend's result unchanged."
  (let ((backend-function (aref egg-conversion-backend 9)))
    (funcall backend-function b0 b1 b2 len)))
(defun egg-end-conversion (bunsetsu-info-list abort)
  "Call slot 10 of the current backend.
The backend function receives BUNSETSU-INFO-LIST and ABORT, and its
result is returned unchanged."
  (let ((backend-function (aref egg-conversion-backend 10)))
    (funcall backend-function bunsetsu-info-list abort)))
;; Select the backend for LANGUAGE; when slot 11 of that backend is
;; non-nil, call it with YOMI-STRING and LANGUAGE.
137 (defun egg-start-reverse-conversion (yomi-string language)
138 (egg-set-current-backend language)
139 (if (aref egg-conversion-backend 11)
140 (funcall (aref egg-conversion-backend 11) yomi-string language)
;; Process the entries of `egg-finalize-backend-alist' from the front.
;; The car of each entry is a pair whose car is called as a function with
;; the pair's cdr as its only argument.
143 (defun egg-finalize-backend ()
144 (let ((alist egg-finalize-backend-alist))
146 (funcall (car (car (car alist))) (cdr (car (car alist))))
147 (setq alist (cdr alist)))))
;; Register BACKEND for each language in LANGS.
;; For every language the visible code either pushes a new
;; (LANGUAGE . BACKEND) cell onto `egg-conversion-backend-alist' or
;; overwrites the cdr of the existing cell.  It also records a
;; (LAST-BACKEND-ELEMENT . LANGUAGE) pair in `egg-finalize-backend-alist'
;; unless an equal pair is already there.
;; NOTE(review): the role of FORCE is not visible in these lines.
149 (defun egg-set-conversion-backend (backend langs &optional force)
152 (setq egg-conversion-backend backend)
153 (setq backend egg-conversion-backend))
155 (setq pair (assoc (car langs) egg-conversion-backend-alist))
158 (setq egg-conversion-backend-alist
159 (cons (cons (car langs) backend) egg-conversion-backend-alist)))
161 (setcdr pair backend)))
162 (setq pair (cons (aref backend (1- (length backend))) (car langs)))
163 (if (null (assoc pair egg-finalize-backend-alist))
164 (setq egg-finalize-backend-alist
165 (cons (list pair) egg-finalize-backend-alist)))
166 (setq langs (cdr langs)))))
;; String copied by `egg-convert-region' to build the opening fence of a
;; conversion region.  The ISO-2022-JP docstring below reads roughly:
;; "String marking the start of the fence (one or more characters)".
168 (defvar egg-conversion-open "|" "*
\e$B%U%'%s%9$N;OE@$r<($9J8;zNs
\e(B (1
\e$BJ8;z0J>e
\e(B)")
;; String copied by `egg-convert-region' to build the closing fence of a
;; conversion region.  The ISO-2022-JP docstring below reads roughly:
;; "String marking the end of the fence (one or more characters)".
169 (defvar egg-conversion-close "|" "*
\e$B%U%'%s%9$N=*E@$r<($9J8;zNs
\e(B (1
\e$BJ8;z0J>e
\e(B)")
;; Face setting consulted by `egg-get-conversion-face'.  It may be a face,
;; nil, or an alist keyed by language (with `t' as the catch-all key).
;; The ISO-2022-JP docstring below reads roughly:
;; "Face used for displaying the fence, or nil".
170 (defvar egg-conversion-face nil "*
\e$B%U%'%s%9I=<($KMQ$$$k
\e(B face
\e$B$^$?$O
\e(B nil")
;; When non-nil, `egg-convert-region' puts the `invisible' property on the
;; opening and closing fence strings.
171 (defvar egg-conversion-invisible nil)
;; String appended by `egg-make-bunsetsu' after every bunsetsu whose LAST
;; flag is not `t'.
172 (defvar egg-conversion-separator " ")
(defun egg-get-conversion-face ()
  "Return the face to use for converted text in the current language.
When `egg-conversion-face' is a list, the entry keyed by
`egg-current-language' is preferred, then the entry keyed by `t'; the
cdr of the entry found is returned.  If no entry matches, or the
variable is not a list, `egg-conversion-face' itself is returned."
  (let (entry)
    (when (listp egg-conversion-face)
      (setq entry (or (assq egg-current-language egg-conversion-face)
                      (assq t egg-conversion-face))))
    (cond (entry (cdr entry))
          (t egg-conversion-face))))
;; Convert the buffer text between START and END.
;; Visible steps:
;;  - save the region text with and without text properties, then delete it;
;;  - with `inhibit-read-only' bound, install the select keys on
;;    `egg-conversion-map';
;;  - build fence strings from copies of `egg-conversion-open' and
;;    `egg-conversion-close' (the closing one is given read-only,
;;    rear-nonsticky and egg-end properties; both become invisible when
;;    `egg-conversion-invisible' is non-nil);
;;  - split the source into `egg-lang' runs via `egg-separate-languages';
;;  - for each run call `egg-start-conversion', and inside the
;;    `condition-case' fall back to `egg-start-conversion-other-languages'
;;    with a message naming the language;
;;  - insert the resulting bunsetsu list, flagged `contine' when more runs
;;    follow and `t' for the final run;
;;  - finally move point to START.
181 (defun egg-convert-region (start end)
183 (let ((source (buffer-substring start end))
184 (no-prop-source (buffer-substring-no-properties start end))
185 bunsetsu-info-list len result i j s)
189 (delete-region start end)
190 (let ((inhibit-read-only t))
191 (its-define-select-keys egg-conversion-map)
193 (setq s (copy-sequence egg-conversion-open)
195 (set-text-properties 0 len
201 (if egg-conversion-invisible
202 (put-text-property 0 len 'invisible t s))
205 s (copy-sequence egg-conversion-close)
207 (set-text-properties 0 len
208 '(read-only t rear-nonsticky t egg-end t)
210 (if egg-conversion-invisible
211 (put-text-property 0 len 'invisible t s))
214 (egg-separate-languages (copy-sequence source))
218 (setq egg-current-language (get-text-property i 'egg-lang source)
219 j (egg-next-single-property-change i 'egg-lang source len))
220 (condition-case result
221 (setq bunsetsu-info-list (egg-start-conversion
222 (substring no-prop-source i j)
223 egg-current-language))
225 (setq bunsetsu-info-list (egg-start-conversion-other-languages
226 (substring no-prop-source i j)
227 egg-current-language))
228 (message "egg %s backend: %s"
229 egg-current-language (nth 1 result))))
230 (egg-insert-bunsetsu-list bunsetsu-info-list
231 (if (< j len) 'contine t))
233 (goto-char start)))))
;; Regexp built as a character range over the `chinese-sisheng' charset,
;; from code 32 through code 127.  Used by `egg-separate-languages'.
235 (defconst egg-chinese-sisheng-regexp
236 (concat "[" (list (make-char 'chinese-sisheng 32))
237 "-" (list (make-char 'chinese-sisheng 127))
;; Tag STR with `egg-lang' text properties, working in two passes (see the
;; pass comments below).  LAST-LANG, when it is Chinese-GB or Chinese-CNS,
;; seeds the "last Chinese variant" used in the second pass.
;; Pass 1 looks at parts that have no `egg-lang' yet and derives a language
;; from the charset of the characters (sisheng, Chinese syllables,
;; composition characters, or a generic per-charset range).
;; Pass 2 resolves missing languages and the generic `Chinese' tag, then
;; rewrites each run's properties to just (egg-lang LANG).
240 (defun egg-separate-languages (str &optional last-lang)
241 (let (lang last-chinese
242 (len (length str)) i j l)
243 ;; 1st pass -- mark undefined Chinese part
244 (if (or (eq last-lang 'Chinese-GB) (eq last-lang 'Chinese-CNS))
245 (setq last-chinese last-lang))
248 (setq j (egg-next-single-property-change i 'egg-lang str len))
249 (if (get-text-property i 'egg-lang str)
251 (setq c (egg-string-to-char-at str i)
252 cset (char-charset c))
254 ((eq cset 'chinese-sisheng)
255 (string-match egg-chinese-sisheng-regexp str i)
256 (setq l (match-end 0)
259 ((setq l (egg-chinese-syllable str i))
263 (if (eq (string-match "[\0-\177\240-\377]+" str (1+ i)) (1+ i))
264 (setq j (match-end 0))
267 (eq (char-charset (egg-string-to-char-at str j))
269 (setq j (max (1+ i) (- j 6))))
271 ((eq cset 'composition)
272 (setq j (+ i (egg-char-bytes c))
273 lang (egg-charset-to-language
275 (car (decompose-composite-char c 'list))))))
277 (string-match (concat "[" (list (make-char cset 32 32))
278 "-" (list (make-char cset 127 127))
281 (setq j (match-end 0)
282 lang (egg-charset-to-language cset))))
284 (put-text-property i j 'egg-lang lang str)))
286 ;; 2nd pass -- set language property
289 (setq lang (get-text-property i 'egg-lang str))
292 (setq lang (or last-lang
293 (egg-next-part-lang str i))))
294 ((equal lang 'Chinese)
295 (setq lang (or last-chinese
296 (egg-next-chinese-lang str i)))))
297 (setq last-lang lang)
298 (if (or (eq lang 'Chinese-GB) (eq lang 'Chinese-CNS))
299 (setq last-chinese lang))
301 i (egg-next-single-property-change i 'egg-lang str len))
302 (set-text-properties j i (list 'egg-lang lang) str))))
;; Map CHARSET to a language symbol by walking `language-info-alist'.
;; Entries whose `charset' element does not contain CHARSET are skipped;
;; the name (car) of the entry reached is interned and returned.
304 (defun egg-charset-to-language (charset)
305 (let ((list language-info-alist))
307 (null (memq charset (assq 'charset (car list)))))
308 (setq list (cdr list)))
310 (intern (car (car list))))))
;; Determine a language from the part of STR after POS.
;; The `egg-lang' value is read at the next `egg-lang' change after POS;
;; a generic `Chinese' value is resolved through `egg-next-chinese-lang'.
;; NOTE(review): `egg-default-language' appears to be the final fallback
;; -- confirm.
312 (defun egg-next-part-lang (str pos)
313 (let ((lang (get-text-property
314 (egg-next-single-property-change pos 'egg-lang str (length str))
316 (if (eq lang 'Chinese)
317 (egg-next-chinese-lang str pos)
320 egg-default-language))))
;; Look ahead in STR from POS for a concrete Chinese variant.
;; The loop steps over `egg-lang' runs and tests each value against
;; Chinese-GB and Chinese-CNS.  The visible `cond' clauses then consult
;; `its-current-language' and `egg-default-language', in that order, for
;; one of those two variants.
322 (defun egg-next-chinese-lang (str pos)
323 (let ((len (length str)) lang)
324 (while (and (< pos len) (null lang))
325 (setq pos (egg-next-single-property-change pos 'egg-lang str len)
326 lang (get-text-property pos 'egg-lang str))
327 (if (null (or (eq lang 'Chinese-GB)
328 (eq lang 'Chinese-CNS)))
332 ((eq its-current-language 'Chinese-GB) 'Chinese-GB)
333 ((eq its-current-language 'Chinese-CNS) 'Chinese-CNS)
334 ((eq egg-default-language 'Chinese-GB) 'Chinese-GB)
335 ((eq egg-default-language 'Chinese-CNS) 'Chinese-CNS)
;; Keymap active on converted text (attached through the `local-map' text
;; property set in `egg-make-bunsetsu').  Keys bound through (vector i)
;; exit conversion and re-read the key; the explicit bindings below
;; provide motion, candidate selection, bunsetsu resizing, reconversion,
;; abort and exit commands.
338 (defvar egg-conversion-map
339 (let ((map (make-sparse-keymap))
342 (define-key map (vector i) 'egg-exit-conversion-unread-char)
344 (define-key map "\C-@" 'egg-decide-first-char)
345 (define-key map [?\C-\ ] 'egg-decide-first-char)
346 (define-key map "\C-a" 'egg-beginning-of-conversion-buffer)
347 (define-key map "\C-b" 'egg-backward-bunsetsu)
348 (define-key map "\C-c" 'egg-abort-conversion)
349 (define-key map "\C-e" 'egg-end-of-conversion-buffer)
350 (define-key map "\C-f" 'egg-forward-bunsetsu)
351 (define-key map "\C-h" 'egg-help-command)
352 (define-key map "\C-i" 'egg-shrink-bunsetsu)
353 (define-key map "\C-k" 'egg-decide-before-point)
354 ;; (define-key map "\C-l" 'egg-exit-conversion) ; Don't override C-L
355 (define-key map "\C-m" 'egg-exit-conversion)
356 (define-key map "\C-n" 'egg-next-candidate)
357 (define-key map "\C-o" 'egg-enlarge-bunsetsu)
358 (define-key map "\C-p" 'egg-previous-candidate)
359 (define-key map "\C-r" 'egg-reverse-convert-bunsetu)
360 (define-key map "\M-r" 'egg-reconvert-bunsetsu)
361 (define-key map "\M-s" 'egg-select-candidate)
362 (define-key map [return] 'egg-exit-conversion)
363 (define-key map [right] 'egg-forward-bunsetsu)
364 (define-key map [left] 'egg-backward-bunsetsu)
365 (define-key map " " 'egg-next-candidate)
367 "Keymap for EGG Conversion mode.")
;; Store the keymap in the symbol's function cell as well, so that the
;; symbol `egg-conversion-map' can be used as the value of the
;; `local-map' text property (see `egg-make-bunsetsu').
369 (fset 'egg-conversion-map egg-conversion-map)
(defun egg-exit-conversion-unread-char ()
  "Exit conversion and re-read the key that invoked this command.
The triggering event is placed on `unread-command-events' before
`egg-exit-conversion' is called, so it is processed again afterwards.

This function is bound in `egg-conversion-map', so it must be a
command; hence the `interactive' form."
  (interactive)
  (setq unread-command-events (list last-command-event))
  (egg-exit-conversion))
;; Build the display string for BUNSETSU-INFO.
;; Starts from a copy of the converted text, appends
;; `egg-conversion-separator' unless LAST is `t', and sets text properties
;; over the whole string: the bunsetsu info itself (under `intangible'),
;; the current backend, the current language, the LAST flag and the
;; `local-map' keymap symbol.  When `egg-conversion-face' is non-nil the
;; face is applied to the converted text only (first LEN1 characters),
;; not to the separator.
376 (defun egg-make-bunsetsu (bunsetsu-info last)
377 (let ((bunsetsu (copy-sequence (egg-get-bunsetsu-converted bunsetsu-info)))
379 (setq len1 (length bunsetsu))
380 (if (null (eq last t))
381 (setq bunsetsu (concat bunsetsu egg-conversion-separator)))
382 (setq len (length bunsetsu))
383 (set-text-properties 0 len
385 (egg-bunsetsu-info) bunsetsu-info
386 'egg-backend egg-conversion-backend
387 'egg-lang egg-current-language
388 'egg-bunsetsu-last last
389 'local-map 'egg-conversion-map)
391 (if egg-conversion-face
392 (egg-set-face 0 len1 (egg-get-conversion-face) bunsetsu))
;; Insert the display strings for BUNSETSU-INFO-LIST at point.
;; Strings are built with `egg-make-bunsetsu', accumulated in reverse and
;; inserted in original order.
;; NOTE(review): how LAST is passed down to each element is not visible
;; in these lines.
395 (defun egg-insert-bunsetsu-list (bunsetsu-info-list &optional last)
396 (let ((l bunsetsu-info-list)
397 bunsetsu-info bunsetsu)
399 (setq bunsetsu-info (car l)
401 bunsetsu (cons (egg-make-bunsetsu bunsetsu-info
404 (apply 'insert (nreverse bunsetsu))))
;; Move point towards the start of the conversion region.
;; One visible branch delegates to `egg-end-of-conversion-buffer'; the
;; other, taken when the character before point lacks `egg-start', jumps
;; to the previous change of that property.
;; NOTE(review): how N selects between the branches is not visible here.
406 (defun egg-beginning-of-conversion-buffer (n)
410 (egg-end-of-conversion-buffer 1))
411 ((null (get-text-property (1- (point)) 'egg-start))
412 (goto-char (previous-single-property-change (1- (point)) 'egg-start)))))
;; Move point towards the end of the conversion region.
;; One visible branch delegates to `egg-beginning-of-conversion-buffer';
;; the other jumps to the next change of the `egg-end' property.
;; NOTE(review): how N selects between the branches is not visible here.
414 (defun egg-end-of-conversion-buffer(n)
418 (egg-beginning-of-conversion-buffer 1))
420 (goto-char (next-single-property-change (point) 'egg-end))
;; Move backward over bunsetsu, counting down from N.
;; The loop stops early once the `egg-start' property is seen at point;
;; a `beginning-of-buffer' error is signalled in the visible final branch.
423 (defun egg-backward-bunsetsu (n)
426 (while (and (null start) (> n 0))
428 (if (setq start (get-text-property (point) 'egg-start))
432 (signal 'beginning-of-buffer nil))))
;; Move forward over bunsetsu, counting down from N.
;; The loop stops early once the `egg-end' property is seen at point;
;; an `end-of-buffer' error is signalled in the visible final branch.
434 (defun egg-forward-bunsetsu (n)
437 (while (and (null end) (> n 0))
439 (if (setq end (get-text-property (point) 'egg-end))
443 (signal 'end-of-buffer nil))))
(defun egg-get-previous-bunsetsu (p)
  "Return the bunsetsu info of the bunsetsu preceding position P, or nil.
Nil is returned when the character just before P carries the
`egg-start' property or a non-nil `egg-bunsetsu-last' property.
Otherwise the info is read at position P minus 2."
  (let ((before (1- p)))
    (unless (or (get-text-property before 'egg-start)
                (get-text-property before 'egg-bunsetsu-last))
      (egg-get-bunsetsu-info (- p 2)))))
;; Walk STR unit by unit and tag each unit with an `egg-char-size'
;; property holding its length N.  A unit is a Chinese syllable when
;; `egg-chinese-syllable' recognises one at the current index, otherwise
;; a single character.  NCHAR counts the units seen.
;; NOTE(review): the return value is not visible in these lines.
450 (defun egg-separate-characters (str)
451 (let* ((v (egg-string-to-vector str))
453 (i 0) (j 0) m n (nchar 0))
455 (if (setq n (egg-chinese-syllable str j))
456 (setq m (egg-chars-in-period str j n))
457 (setq m 1 n (egg-char-bytes (aref v i))))
458 (put-text-property j (+ j n) 'egg-char-size n str)
459 (setq nchar (1+ nchar) i (+ i m) j (+ j n)))
(defun egg-shrink-bunsetsu (n)
  "Shrink the bunsetsu at point by N units.
Implemented as `egg-enlarge-bunsetsu' with the argument negated.
Interactively, N is the numeric prefix argument.

This function is bound in `egg-conversion-map', so it must be a
command; hence the `interactive' form."
  (interactive "p")
  (egg-enlarge-bunsetsu (- n)))
;; Change the length of the bunsetsu at point by N units.
;; Visible steps:
;;  - collect the previous bunsetsu (B0), the one at point (B1) and, in
;;    the inner `let', the following one (B2), with their source strings
;;    tagged by `egg-separate-characters';
;;  - compute the new length CHRS of the first part by stepping over
;;    `egg-char-size' units of the combined source, flagging BEEP when a
;;    limit is reached;
;;  - ask the backend to re-split via `egg-change-bunsetsu-length';
;;  - delete the old bunsetsu text (one or two characters' worth of
;;    intangible text) and insert the new list.
466 (defun egg-enlarge-bunsetsu (n)
468 (let* ((inhibit-read-only t)
469 (b0 (egg-get-previous-bunsetsu (point)))
470 (b1 (egg-get-bunsetsu-info (point)))
471 (s1 (egg-get-bunsetsu-source b1))
472 (s1len (egg-separate-characters s1))
475 (last (get-text-property (point) 'egg-bunsetsu-last))
476 b2 s2 source bunsetsu-info-list beep)
478 (let ((p2 (save-excursion (forward-char) (point))))
479 (setq b2 (egg-get-bunsetsu-info p2)
480 s2 (egg-get-bunsetsu-source b2)
481 s2len (egg-separate-characters s2)
482 last (get-text-property p2 'egg-bunsetsu-last))))
483 (setq source (concat s1 s2))
486 (setq beep t chrs (get-text-property 0 'egg-char-size source)))
488 (setq beep t chrs (length source)))
491 (setq chrs (- chrs (get-text-property (1- chrs) 'egg-char-size source))
495 (setq chrs (+ chrs (get-text-property chrs 'egg-char-size source))
497 (setq bunsetsu-info-list (egg-change-bunsetsu-length b0 b1 b2 chrs))
498 (delete-region (point)
499 (progn (forward-char) (if b2 (forward-char)) (point)))
501 (egg-insert-bunsetsu-list bunsetsu-info-list last)
;; Consulted by `egg-next-candidate' when the requested candidate index
;; runs past the last candidate.
506 (defvar egg-conversion-wrap-select nil
507 "*Candidate selection wraps around to first candidate, if non-nil.
508 Otherwise stop at the last candidate.")
;; Replace the bunsetsu at point with another candidate, N steps away.
;; Visible steps:
;;  - read the bunsetsu info and LAST flag at point;
;;  - obtain the candidate count MAX+ and a starting index I, either from
;;    `egg-list-candidates' (adjusted by N, see inline comments) or from
;;    `egg-get-current-candidate-number';
;;  - bring I back into range: negative values wrap from the end; values
;;    past the end wrap only when `egg-conversion-wrap-select' is non-nil,
;;    otherwise I is pinned to the last candidate;
;;  - decide on candidate I, delete the old bunsetsu text and insert the
;;    new one.
510 (defun egg-next-candidate (n)
512 (let ((inhibit-read-only t)
513 (last (get-text-property (point) 'egg-bunsetsu-last))
514 (b (egg-get-bunsetsu-info (point)))
516 (setq max+ (egg-get-number-of-candidates b))
518 (let ((prev-b (egg-get-previous-bunsetsu (point))))
519 (setq i (egg-list-candidates b prev-b)) ; there is a case I=/=0
520 (if (or (> n 1) (< n 0)) ; with N=/=1, start with I
521 (setq i (+ n i)) ; or else (N==1),
522 (setq i (if (= i 0) 1 0))) ; I:=1 when I was 0, or else I:=0
523 (setq max+ (egg-get-number-of-candidates b)))
524 (setq i (egg-get-current-candidate-number b))
529 ((< i 0) ; go backward as if it is ring
531 (setq i (+ i max+))))
533 (egg-conversion-wrap-select ; go backward as if it is ring
535 (setq i (- i max+))))
536 ((setq i (1- max+) ; don't go forward
538 (setq new (egg-decide-candidate b i))
540 (delete-region p (progn (forward-char) (point)))
541 (insert (egg-make-bunsetsu new last))
(defun egg-previous-candidate (n)
  "Select the candidate N steps before the current one.
Implemented as `egg-next-candidate' with the argument negated.
Interactively, N is the numeric prefix argument.

This function is bound in `egg-conversion-map', so it must be a
command; hence the `interactive' form."
  (interactive "p")
  (egg-next-candidate (- n)))
;; Shared worker for the reconversion commands.
;; Concatenates the converted text of up to N bunsetsu starting at point
;; (stopping early once a bunsetsu with a non-nil `egg-bunsetsu-last' flag
;; has been consumed), then calls FUNC with that text and
;; `egg-current-language'.  When FUNC returns a bunsetsu list, the old
;; text is replaced by the new list, flagged `t' if the last consumed
;; bunsetsu was flagged `t' and `contine' otherwise.
550 (defun egg-reconvert-bunsetsu-internal (n func)
551 (let ((inhibit-read-only t)
553 source last bunsetsu-list)
556 (while (and (null last) (> n 0))
557 (setq source (concat source
558 (egg-get-bunsetsu-converted
559 (egg-get-bunsetsu-info (point))))
560 last (get-text-property (point) 'egg-bunsetsu-last)
566 ((setq bunsetsu-list (funcall func source egg-current-language))
567 (delete-region p (point))
568 (egg-insert-bunsetsu-list bunsetsu-list (if (eq last t) t 'contine))
570 (if (egg-get-previous-bunsetsu p)
573 (put-text-property (point) p 'egg-bunsetsu-last 'contine)
574 (forward-char))))))))
(defun egg-reverse-convert-bunsetu (n)
  "Reverse-convert N bunsetsu starting at point.
Delegates to `egg-reconvert-bunsetsu-internal' with
`egg-start-reverse-conversion' as the conversion function.
Interactively, N is the numeric prefix argument.

This function is bound in `egg-conversion-map', so it must be a
command; hence the `interactive' form."
  (interactive "p")
  (egg-reconvert-bunsetsu-internal n 'egg-start-reverse-conversion))
(defun egg-reconvert-bunsetsu (n)
  "Convert again N bunsetsu starting at point.
Delegates to `egg-reconvert-bunsetsu-internal' with
`egg-start-conversion' as the conversion function.
Interactively, N is the numeric prefix argument.

This function is bound in `egg-conversion-map', so it must be a
command; hence the `interactive' form."
  (interactive "p")
  (egg-reconvert-bunsetsu-internal n 'egg-start-conversion))
;; Fix the conversion result before point; hand the rest back for input.
;; Visible steps:
;;  - locate START and END of the conversion text from the `egg-start' and
;;    `egg-end' properties, and copy the text before point (DECIDED) and
;;    after point (UNDECIDED);
;;  - delete the whole region including the opening and closing fences;
;;  - walk DECIDED collecting bunsetsu infos; each completed group is
;;    inserted as plain converted text and reported to the backend with
;;    `egg-end-conversion' (ABORT = nil);
;;  - run `input-method-after-insert-chunk-hook';
;;  - collect the source strings of the UNDECIDED bunsetsu and pass their
;;    concatenation to `its-restart'.
584 (defun egg-decide-before-point ()
586 (let ((inhibit-read-only t)
587 start end len decided undecided bunsetsu source)
588 (setq start (if (get-text-property (1- (point)) 'egg-start)
590 (previous-single-property-change (point) 'egg-start))
591 end (if (get-text-property (point) 'egg-end)
593 (next-single-property-change (point) 'egg-end))
594 decided (buffer-substring start (point))
595 undecided (buffer-substring (point) end))
596 (delete-region (- start (length egg-conversion-open))
597 (+ end (length egg-conversion-close)))
599 len (length decided))
601 (setq bunsetsu (cons (egg-get-bunsetsu-info i decided) bunsetsu)
602 i (egg-next-single-property-change
603 i (egg-bunsetsu-info) decided len))
605 (get-text-property (1- i) 'egg-bunsetsu-last decided))
607 (setq bunsetsu (nreverse bunsetsu))
608 (apply 'insert (mapcar (lambda (b) (egg-get-bunsetsu-converted b))
610 (egg-end-conversion bunsetsu nil)
611 (setq bunsetsu nil))))
612 (setq len (length undecided))
616 (run-hooks 'input-method-after-insert-chunk-hook))
619 (setq source (cons (egg-get-bunsetsu-source
620 (egg-get-bunsetsu-info i undecided))
622 i (egg-next-single-property-change
623 i (egg-bunsetsu-info) undecided len)))
624 (its-restart (apply 'concat (nreverse source)) t))))
(defun egg-exit-conversion ()
  "Accept the whole conversion and leave conversion mode.
Point is moved to the next change of the `egg-end' property and
`egg-decide-before-point' is then called, so everything in the
conversion region counts as being before point.

This function is bound in `egg-conversion-map', so it must be a
command; hence the `interactive' form."
  (interactive)
  (goto-char (next-single-property-change (point) 'egg-end))
  (egg-decide-before-point))
;; Abandon the conversion in progress.
;; Moves point to just before the opening fence, reads the `egg-source'
;; property there, deletes everything up to and including the closing
;; fence, and finishes with `its-end-of-input-buffer'.
;; NOTE(review): what is done with SOURCE before that call is not visible
;; in these lines.
631 (defun egg-abort-conversion ()
633 (let ((inhibit-read-only t) source)
634 (goto-char (- (if (get-text-property (1- (point)) 'egg-start)
636 (previous-single-property-change (point) 'egg-start))
637 (length egg-conversion-open)))
638 (setq source (get-text-property (point) 'egg-source))
639 (delete-region (point) (+ (next-single-property-change (point) 'egg-end)
640 (length egg-conversion-close)))
642 (its-end-of-input-buffer)))
;; Let the user pick a candidate for the bunsetsu at point from a menu.
;; Visible steps:
;;  - read the bunsetsu info and LAST flag at point, and obtain the
;;    candidate count and current index as `egg-next-candidate' does;
;;  - present candidates through `menudiag-select' (the menu title string
;;    is ISO-2022-JP text reading roughly "Candidates:");
;;  - decide on the chosen index, delete the old bunsetsu text and insert
;;    the new one.
644 (defun egg-select-candidate ()
646 (let ((inhibit-read-only t)
647 (last (get-text-property (point) 'egg-bunsetsu-last))
648 (b (egg-get-bunsetsu-info (point)))
651 (setq max+ (egg-get-number-of-candidates b))
653 (let ((prev-b (egg-get-previous-bunsetsu (point))))
654 (setq i (egg-list-candidates b prev-b))
655 (setq max+ (egg-get-number-of-candidates b)))
656 (setq i (egg-get-current-candidate-number b)))
657 (let (candidate-list candidate l)
660 (menudiag-select (list 'menu "
\e$B8uJd
\e(B:"
661 (list (egg-get-bunsetsu-converted b))
662 (list (egg-get-bunsetsu-converted b))))
663 (setq candidate-list (egg-get-all-candidates b)
665 candidate (menudiag-select (list 'menu "
\e$B8uJd
\e(B:" l)
669 (if (eq candidate (car l))
673 (setq new (egg-decide-candidate b i))
675 (delete-region p (progn (forward-char) (point)))
676 (insert (egg-make-bunsetsu new last))
680 ;;; egg-cnv.el ends here.