X-Git-Url: http://git.chise.org/gitweb/?a=blobdiff_plain;f=ids-find.el;h=401866fd2ea619a3799e8b76947ba09a289aa382;hb=380244b1383ea4f8612aaaf7af1253394dbee96a;hp=0e0e7be8f32c0287858a438c12e66a5d87b5a153;hpb=f7abebb51ae1a8f4e828f1816bdf2d33a4853752;p=chise%2Fids.git diff --git a/ids-find.el b/ids-find.el index 0e0e7be..401866f 100644 --- a/ids-find.el +++ b/ids-find.el @@ -1,11 +1,11 @@ -;;; ids-find.el --- search utility based on Ideographic-structures +;;; ids-find.el --- search utility based on Ideographic-structures ;; -*- coding: utf-8-mcs-er -*- -;; Copyright (C) 2002,2003,2005 MORIOKA Tomohiko +;; Copyright (C) 2002, 2003, 2005, 2006, 2007, 2017, 2020 MORIOKA Tomohiko ;; Author: MORIOKA Tomohiko ;; Keywords: Kanji, Ideographs, search, IDS, CHISE, UCS, Unicode -;; This file is a part of Tomoyo-Tools. +;; This file is a part of CHISE-IDS. ;; This program is free software; you can redistribute it and/or ;; modify it under the terms of the GNU General Public License as @@ -42,19 +42,25 @@ (ids-index-store-char product cell)) ((setq ret (assq 'ideographic-structure cell)) (ids-index-store-structure product (cdr ret))) - ;; ((setq ret (find-char cell)) - ;; (ids-index-store-char product ret)) + ((setq ret (find-char cell)) + (ids-index-store-char product ret)) )))) ;;;###autoload -(defun ids-update-index () +(defun ids-update-index (&optional in-memory) (interactive) (map-char-attribute (lambda (c v) (ids-index-store-structure c v) nil) 'ideographic-structure) - (save-char-attribute-table 'ideographic-products)) + (map-char-attribute + (lambda (c v) + (ids-index-store-structure c v) + nil) + 'ideographic-structure@apparent) + (unless in-memory + (save-char-attribute-table 'ideographic-products))) (mount-char-attribute-table 'ideographic-products) @@ -74,8 +80,12 @@ (when (string-match "^<-.*[@/]component\\(/[^*/]+\\)*$" (symbol-name feature)) (push feature dest))) - (cons '<-ideographic-component-forms - dest))) + (list* '<-mistakable '->mistakable + '<-formed '->formed + '<-same '->same + '<-original '->original + '<-ancient '->ancient + dest))) (defun to-component-features () (let (dest) @@ -83,26 +93,29 @@ (when (string-match "^->.*[@/]component\\(/[^*/]+\\)*$" (symbol-name feature)) (push feature dest))) - (cons '->ideographic-component-forms - dest))) + dest)) ;;;###autoload (defun char-component-variants (char) (let ((dest (list char)) ret uchr) + (dolist (feature (to-component-features)) + (if (setq ret (get-char-attribute char feature)) + (dolist (c ret) + (setq dest (union dest (char-component-variants c)))))) (cond - ((setq ret (some (lambda (feature) - (get-char-attribute char feature)) - (to-component-features))) - (dolist (c ret) - (setq dest (union dest (char-component-variants c)))) - ) + ;; ((setq ret (some (lambda (feature) + ;; (get-char-attribute char feature)) + ;; (to-component-features))) + ;; (dolist (c ret) + ;; (setq dest (union dest (char-component-variants c)))) + ;; ) ((setq ret (get-char-attribute char '->ucs-unified)) (setq dest (cons char ret)) (dolist (c dest) (setq dest (union dest (some (lambda (feature) - (get-char-attribute char feature)) + (get-char-attribute c feature)) (of-component-features)) ))) ) @@ -112,7 +125,7 @@ (dolist (c dest) (setq dest (union dest (some (lambda (feature) - (get-char-attribute char feature)) + (get-char-attribute c feature)) (of-component-features)) ))) ) @@ -146,35 +159,55 @@ (setq components (cdr components))) (setq products nil) (dolist (variant (char-component-variants (car components))) + (setq products + (union products + (get-char-attribute variant 'ideographic-products)))) + (setq dest (intersection dest products))) + dest)) + +(defun ideograph-find-products-with-variants (components &optional ignored-chars) + (if (stringp components) + (setq components (string-to-char-list components))) + (let (dest products) + (dolist (variant (char-component-variants (car components))) (setq products (union products - (get-char-attribute variant 'ideographic-products)))) + (set-difference + (get-char-attribute variant 'ideographic-products) + ignored-chars)))) + (setq dest products) + (while (and dest + (setq components (cdr components))) + (setq products nil) + (dolist (variant (char-component-variants (car components))) + (setq products + (union products + (set-difference + (get-char-attribute variant 'ideographic-products) + ignored-chars)))) + (setq dest (intersection dest products))) + dest)) + +(defun ideograph-find-products (components &optional ignored-chars) + (if (stringp components) + (setq components (string-to-char-list components))) + (let (dest products) + ;; (dolist (variant (char-component-variants (car components))) + ;; (setq products + ;; (union products + ;; (get-char-attribute variant 'ideographic-products)))) + ;; (setq dest products) + (setq dest (get-char-attribute (car components) 'ideographic-products)) + (while (and dest + (setq components (cdr components))) + ;; (setq products nil) + ;; (dolist (variant (char-component-variants (car components))) + ;; (setq products + ;; (union products + ;; (get-char-attribute variant 'ideographic-products)))) + (setq products (get-char-attribute (car components) 'ideographic-products)) (setq dest (intersection dest products))) dest)) -;; (defun ideographic-products-find (&rest components) -;; (if (stringp (car components)) -;; (setq components (car components))) -;; (let ((len (length components)) -;; (i 1) -;; dest products) -;; (dolist (variant (char-component-variants (elt components 0))) -;; (setq products -;; (union products -;; (get-char-attribute variant 'ideographic-products)))) -;; (setq dest products) -;; (while (and -;; (< i len) -;; (progn -;; (setq products nil) -;; (dolist (variant (char-component-variants (elt components i))) -;; (dolist (product (get-char-attribute -;; variant 'ideographic-products)) -;; (unless (memq product products) -;; (when (memq product dest) -;; (setq products (cons product products)))))) -;; (setq dest products))) -;; (setq i (1+ i))) -;; products)) (defun ideographic-structure-char= (c1 c2) @@ -184,26 +217,7 @@ (m2 (char-ucs c2))) (or (and m1 m2 (eq m1 m2)) - (some (lambda (feature) - (some (lambda (b2) - (unless (characterp b2) - (setq b2 (find-char b2))) - (and b2 - (ideographic-structure-char= c1 b2))) - (char-feature c2 feature) - ;; (get-char-attribute - ;; c2 '<-ideographic-component-forms) - )) - (of-component-features)) - (progn - (setq m1 (car (get-char-attribute c1 '<-radical)) - m2 (car (get-char-attribute c2 '<-radical))) - (unless (characterp m1) - (setq m1 (find-char m1))) - (unless (characterp m2) - (setq m2 (find-char m2))) - (when (or m1 m2) - (ideographic-structure-char= m1 m2)))))))) + (memq c1 (char-component-variants c2))))))) (defun ideographic-structure-member-compare-components (component s-component) (let (ret) @@ -275,12 +289,60 @@ (or (ideographic-structure-to-ids v) v))) +(defun ids-insert-chars-including-components* (components + &optional level ignored-chars) + (unless level + (setq level 0)) + (let (is i as bs) + (dolist (c (sort (copy-tree (ideograph-find-products components + ignored-chars)) + (lambda (a b) + (if (setq as (char-total-strokes a)) + (if (setq bs (char-total-strokes b)) + (if (= as bs) + (ideograph-char< a b) + (< as bs)) + t) + (ideograph-char< a b))))) + (unless (memq c ignored-chars) + (setq is (char-feature c 'ideographic-structure)) + (setq i 0) + (while (< i level) + (insert "\t") + (setq i (1+ i))) + (insert (ids-find-format-line c is)) + (setq ignored-chars + (ids-insert-chars-including-components* + (char-to-string c) (1+ level) + (cons c ignored-chars)))) + ) + ) + ignored-chars) + (defun ids-insert-chars-including-components (components &optional level ignored-chars) (unless level (setq level 0)) - (let (is dis i as bs) - (dolist (c (sort (ideographic-products-find components) + (setq ignored-chars + (nreverse + (ids-insert-chars-including-components* components + level ignored-chars))) + (let (is i as bs) + (dolist (c ignored-chars) + (dolist (vc (char-component-variants c)) + (unless (memq vc ignored-chars) + (when (setq is (get-char-attribute vc 'ideographic-structure)) + (setq i 0) + (while (< i level) + (insert "\t") + (setq i (1+ i))) + (insert (ids-find-format-line vc is)) + (setq ignored-chars + (ids-insert-chars-including-components* + (char-to-string vc) (1+ level) + (cons vc ignored-chars))))))) + (dolist (c (sort (copy-tree (ideograph-find-products-with-variants + components ignored-chars)) (lambda (a b) (if (setq as (char-total-strokes a)) (if (setq bs (char-total-strokes b)) @@ -290,31 +352,19 @@ t) (ideograph-char< a b))))) (unless (memq c ignored-chars) - (setq is (char-feature c 'ideographic-structure)) + (setq is (get-char-attribute c 'ideographic-structure)) (setq i 0) (while (< i level) (insert "\t") (setq i (1+ i))) (insert (ids-find-format-line c is)) (setq ignored-chars - (ids-insert-chars-including-components + (ids-insert-chars-including-components* (char-to-string c) (1+ level) (cons c ignored-chars)))) - )) + ) + ) ignored-chars) -;; (defun ids-insert-chars-including-components (components level) -;; (let (is dis i) -;; (dolist (c (ideographic-products-find components)) -;; (setq is (char-feature c 'ideographic-structure)) -;; (setq i 0) -;; (while (< i level) -;; (insert "\t") -;; (setq i (1+ i))) -;; (insert (ids-find-format-line c is)) -;; ;;(forward-line -1) -;; (ids-insert-chars-including-components -;; (char-to-string c) (1+ level)) -;; ))) ;;;###autoload (defun ids-find-chars-including-components (components) @@ -323,48 +373,23 @@ (with-current-buffer (get-buffer-create ids-find-result-buffer) (setq buffer-read-only nil) (erase-buffer) - (ids-insert-chars-including-components components 0) - ;; (let (is dis) - ;; (dolist (c (ideographic-products-find components)) - ;; (setq is (char-feature c 'ideographic-structure)) - ;; ;; to avoid problems caused by wrong indexes - ;; ;; (when (every (lambda (cc) - ;; ;; (ideographic-structure-member cc is)) - ;; ;; components) - ;; (dolist (dc (ideographic-products-find (char-to-string c))) - ;; (setq dis (char-feature dc 'ideographic-structure)) - ;; ;; ;; to avoid problems caused by wrong indexes - ;; ;; (when (every (lambda (dcc) - ;; ;; (ideographic-structure-member dcc is)) - ;; ;; components) - ;; (insert "\t") - ;; (insert (ids-find-format-line dc dis)) - ;; (forward-line -1) - ;; ;; ) - ;; ) - ;; (insert (ids-find-format-line c is)) - ;; (forward-line -1) - ;; ;; ) - ;; ) - ;; ) + (ids-insert-chars-including-components components 0 nil) + ;; (let ((ignored-chars + ;; (nreverse + ;; (ids-insert-chars-including-components components 0 nil + ;; #'ideograph-find-products))) + ;; rest) + ;; (setq rest ignored-chars) + ;; ;; (dolist (c rest) + ;; ;; (setq ignored-chars + ;; ;; (union ignored-chars + ;; ;; (ids-insert-chars-including-components + ;; ;; (list c) 0 ignored-chars + ;; ;; #'ideograph-find-products-with-variants)))) + ;; (ids-insert-chars-including-components components 0 ignored-chars + ;; #'ideograph-find-products-with-variants)) (goto-char (point-min))) (view-buffer ids-find-result-buffer)) -;; (defun ids-find-chars-including-components (components) -;; "Search Ideographs whose structures have COMPONENTS." -;; (interactive "sComponents : ") -;; (with-current-buffer (get-buffer-create ids-find-result-buffer) -;; (setq buffer-read-only nil) -;; (erase-buffer) -;; (map-char-attribute -;; (lambda (c v) -;; (when (every (lambda (p) -;; (ideographic-structure-member p v)) -;; components) -;; (insert (ids-find-format-line c v))) -;; nil) -;; 'ideographic-structure) -;; (goto-char (point-min))) -;; (view-buffer ids-find-result-buffer)) ;;;###autoload (define-obsolete-function-alias 'ideographic-structure-search-chars @@ -379,16 +404,1203 @@ (with-current-buffer (get-buffer-create ids-find-result-buffer) (setq buffer-read-only nil) (erase-buffer) - (let (ucs jis) - (map-char-attribute - (lambda (c v) - (when (ideographic-structure-repertoire-p v components) - (insert (ids-find-format-line c v)))) - 'ideographic-structure)) + (map-char-attribute + (lambda (c v) + (when (ideographic-structure-repertoire-p v components) + (insert (ids-find-format-line c v)))) + 'ideographic-structure) (goto-char (point-min))) (view-buffer ids-find-result-buffer)) +(defun ideographic-structure-merge-components-alist (ca1 ca2) + (let ((dest-alist ca1) + ret) + (dolist (cell ca2) + (if (setq ret (assq (car cell) dest-alist)) + (setcdr ret (+ (cdr ret)(cdr cell))) + (setq dest-alist (cons cell dest-alist)))) + dest-alist)) + +(defun ideographic-structure-to-components-alist (structure) + (apply #'ideographic-structure-to-components-alist* structure)) + +(defun ideographic-structure-to-components-alist* (operator component1 component2 + &optional component3 + &rest opts) + (let (dest-alist ret) + (setq dest-alist + (cond ((characterp component1) + (unless (encode-char component1 'ascii) + (list (cons component1 1))) + ) + ((setq ret (assq 'ideographic-structure component1)) + (ideographic-structure-to-components-alist (cdr ret)) + ) + ((setq ret (find-char component1)) + (list (cons ret 1)) + ))) + (setq dest-alist + (ideographic-structure-merge-components-alist + dest-alist + (cond ((characterp component2) + (unless (encode-char component2 'ascii) + (list (cons component2 1))) + ) + ((setq ret (assq 'ideographic-structure component2)) + (ideographic-structure-to-components-alist (cdr ret)) + ) + ((setq ret (find-char component2)) + (list (cons ret 1)) + )))) + (if (memq operator '(?\u2FF2 ?\u2FF3)) + (ideographic-structure-merge-components-alist + dest-alist + (cond ((characterp component3) + (unless (encode-char component3 'ascii) + (list (cons component3 1))) + ) + ((setq ret (assq 'ideographic-structure component3)) + (ideographic-structure-to-components-alist (cdr ret)) + ) + ((setq ret (find-char component3)) + (list (cons ret 1)) + ))) + dest-alist))) + +(defun ids-find-merge-variables (ve1 ve2) + (cond ((eq ve1 t) + ve2) + ((eq ve2 t) + ve1) + (t + (let ((dest-alist ve1) + (rest ve2) + cell ret) + (while (and rest + (setq cell (car rest)) + (if (setq ret (assq (car cell) ve1)) + (eq (cdr ret)(cdr cell)) + (setq dest-alist (cons cell dest-alist)))) + (setq rest (cdr rest))) + (if rest + nil + dest-alist))))) + +;;;###autoload +(defun ideographic-structure-equal (structure1 structure2) + (let (dest-alist ret) + (and (setq dest-alist (ideographic-structure-character= + (car structure1)(car structure2))) + (setq ret (ideographic-structure-character= + (nth 1 structure1)(nth 1 structure2))) + (setq dest-alist (ids-find-merge-variables dest-alist ret)) + (setq ret (ideographic-structure-character= + (nth 2 structure1)(nth 2 structure2))) + (setq dest-alist (ids-find-merge-variables dest-alist ret)) + (if (memq (car structure1) '(?\u2FF2 ?\u2FF3)) + (and (setq ret (ideographic-structure-character= + (nth 3 structure1)(nth 3 structure2))) + (setq dest-alist (ids-find-merge-variables dest-alist ret))) + dest-alist)))) + +;;;###autoload +(defun ideographic-structure-character= (c1 c2) + (let (ret ret2) + (cond ((characterp c1) + (cond ((encode-char c1 'ascii) + (list (cons c1 c2)) + ) + ((characterp c2) + (if (encode-char c2 'ascii) + (list (cons c2 c1)) + (eq c1 c2)) + ) + ((setq ret2 (find-char c2)) + (eq c1 ret2) + ) + ((setq ret2 (assq 'ideographic-structure c2)) + (and (setq ret (get-char-attribute c1 'ideographic-structure)) + (ideographic-structure-equal ret (cdr ret2))) + )) + ) + ((setq ret (assq 'ideographic-structure c1)) + (cond ((characterp c2) + (if (encode-char c2 'ascii) + (list (cons c2 c1)) + (and (setq ret2 (get-char-attribute c2 'ideographic-structure)) + (ideographic-structure-equal (cdr ret) ret2))) + ) + ((setq ret2 (find-char c2)) + (and (setq ret2 (get-char-attribute ret2 'ideographic-structure)) + (ideographic-structure-equal (cdr ret) ret2)) + ) + ((setq ret2 (assq 'ideographic-structure c2)) + (ideographic-structure-equal (cdr ret)(cdr ret2)) + )) + ) + ((setq ret (find-char c1)) + (cond ((characterp c2) + (if (encode-char c2 'ascii) + (list (cons c2 c1)) + (eq ret c2)) + ) + ((setq ret2 (find-char c2)) + (eq ret ret2) + ) + ((setq ret2 (assq 'ideographic-structure c2)) + (and (setq ret (get-char-attribute ret 'ideographic-structure)) + (ideographic-structure-equal ret (cdr ret2)) + ))))))) + +;;;###autoload +(defun ideographic-structure-find-chars (structure) + (apply #'ideographic-structure-find-chars* structure)) + +(defun ideographic-structure-find-chars* (operator component1 component2 + &optional component3) + (let ((comp-alist (ideographic-structure-to-components-alist* + operator component1 component2 component3)) + c1 c2 c3 + ret pl str + var-alist) + (dolist (pc (caar + (sort (mapcar (lambda (cell) + (if (setq ret (get-char-attribute + (car cell) 'ideographic-products)) + (cons ret (length ret)) + (cons nil 0))) + comp-alist) + (lambda (a b) + (< (cdr a)(cdr b)))))) + (when (and (setq str (get-char-attribute pc 'ideographic-structure)) + (setq var-alist + (ideographic-structure-character= (car str) operator)) + (setq c1 (nth 1 str)) + (setq ret (ideographic-structure-character= c1 component1)) + (setq var-alist (ids-find-merge-variables var-alist ret)) + (setq c2 (nth 2 str)) + (setq ret (ideographic-structure-character= c2 component2)) + (setq var-alist (ids-find-merge-variables var-alist ret)) + (cond ((memq (car str) '(?\u2FF2 ?\u2FF3)) + (setq c3 (nth 3 str)) + (and (setq ret (ideographic-structure-character= + c3 component3)) + (ids-find-merge-variables var-alist ret)) + ) + (t var-alist))) + (setq pl (cons pc pl)) + )) + pl)) + +;;;###autoload +(defun ideographic-char-count-components (char component) + (let ((dest 0) + structure) + (cond ((eq char component) + 1) + ((setq structure (get-char-attribute char 'ideographic-structure)) + (dolist (cell (ideographic-structure-to-components-alist structure)) + (setq dest + (+ dest + (if (eq (car cell) char) + (cdr cell) + (* (ideographic-char-count-components (car cell) component) + (cdr cell)))))) + dest) + (t + 0)))) + + +;;;###autoload +(defun ideographic-character-get-structure (character) + "Return ideographic-structure of CHARACTER. +CHARACTER can be a character or char-spec." + (let (ret) + (cond ((characterp character) + (get-char-attribute character 'ideographic-structure) + ) + ((setq ret (assq 'ideographic-structure character)) + (cdr ret) + ) + ((setq ret (find-char character)) + (get-char-attribute ret 'ideographic-structure) + )))) + +;;;###autoload +(defun ideographic-char-match-component (char component) + "Return non-nil if character CHAR has COMPONENT in ideographic-structure. +COMPONENT can be a character or char-spec." + (or (ideographic-structure-character= char component) + (let ((str (ideographic-character-get-structure char))) + (and str + (or (ideographic-char-match-component (nth 1 str) component) + (ideographic-char-match-component (nth 2 str) component) + (if (memq (car str) '(?\u2FF2 ?\u2FF3)) + (ideographic-char-match-component (nth 3 str) component))))))) + +(defun ideographic-structure-char< (a b) + (let ((sa (get-char-attribute a 'ideographic-structure)) + (sb (get-char-attribute b 'ideographic-structure)) + tsa tsb) + (cond (sa + (cond (sb + (setq tsa (char-total-strokes a) + tsb (char-total-strokes b)) + (if tsa + (if tsb + (or (< tsa tsb) + (and (= tsa tsb) + (ideograph-char< a b))) + t) + (if tsb + nil + (ideograph-char< a b)))) + (t + nil)) + ) + (t + (cond (sb + t) + (t + (setq tsa (char-total-strokes a) + tsb (char-total-strokes b)) + (if tsa + (if tsb + (or (< tsa tsb) + (and (= tsa tsb) + (ideograph-char< a b))) + t) + (if tsb + nil + (ideograph-char< a b))) + )) + )) + )) + +(defun ideographic-chars-to-is-a-tree (chars) + (let (comp char products others dest rest + la lb) + (setq chars (sort chars #'ideographic-structure-char<)) + (while chars + (setq comp (pop chars) + rest chars + products nil + others nil) + (while rest + (setq char (pop rest)) + (cond + ((ideographic-char-match-component char comp) + (push char products) + ) + (t + (push char others) + ))) + (push (cons comp + ;; (nreverse products) + (if products + (sort (ideographic-chars-to-is-a-tree products) + (lambda (a b) + (setq la (length (cdr a)) + lb (length (cdr b))) + (or (> la lb) + (and (= la lb) + (ideograph-char< (car a) (car b)) + ;; (progn + ;; (setq tsa (char-total-strokes (car a)) + ;; tsb (char-total-strokes (car b))) + ;; (if tsa + ;; (if tsb + ;; (or (< tsa tsb) + ;; (and (= tsa tsb) + ;; (ideograph-char< + ;; (car a) (car b)))) + ;; t) + ;; (if tsb + ;; nil + ;; (ideograph-char< (car a) (car b))))) + )))) + nil) + ) + dest) + (setq chars others)) + dest)) + +(defun ids-find-chars-including-ids* (operator component1 component2 + &optional component3) + (let ((comp-alist (ideographic-structure-to-components-alist* + operator component1 component2 component3)) + (comp-spec + (list (list* 'ideographic-structure + operator component1 component2 + (if component3 + (list component3))))) + ret str rest) + (dolist (pc (caar + (sort (mapcar (lambda (cell) + (if (setq ret (get-char-attribute + (car cell) 'ideographic-products)) + (cons ret (length ret)) + (cons nil 0))) + comp-alist) + (lambda (a b) + (< (cdr a)(cdr b)))))) + (when (and (every (lambda (cell) + (>= (ideographic-char-count-components pc (car cell)) + (cdr cell))) + comp-alist) + (or (ideographic-char-match-component pc comp-spec) + (and (setq str (get-char-attribute pc 'ideographic-structure)) + (ideographic-char-match-component + (list + (cons + 'ideographic-structure + (functional-ideographic-structure-to-apparent-structure + str))) + comp-spec)))) + (push pc rest))) + (ideographic-chars-to-is-a-tree rest))) + +(defun ids-find-chars-including-ids (structure) + (if (characterp structure) + (setq structure (get-char-attribute structure 'ideographic-structure))) + (apply #'ids-find-chars-including-ids* structure)) + +(defun functional-ideographic-structure-to-apparent-structure (structure) + (let (enc enc-str enc2-str new-str) + (cond + ((eq (car structure) ?⿸) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿰) + (list ?⿰ (nth 1 enc-str) + (list (list 'ideographic-structure + ?⿱ + (nth 2 enc-str) + (nth 2 structure)))) + ) + ((and (eq (car enc-str) ?⿲) + (memq (char-ucs (nth 1 enc-str)) '(#x4EBB #x2E85)) + (eq (nth 2 enc-str) ?丨)) + (list ?⿰ + (decode-char '=big5-cdp #x8B7A) + (list (list 'ideographic-structure + ?⿱ + (nth 3 enc-str) + (nth 2 structure)))) + ) + ((eq (car enc-str) ?⿱) + (list ?⿱ (nth 1 enc-str) + (list + (cons 'ideographic-structure + (or (functional-ideographic-structure-to-apparent-structure + (setq new-str + (list + (cond + ((characterp (nth 2 enc-str)) + (if (or (eq (encode-char + (nth 2 enc-str) + '=>ucs@component) + #x20087) + (eq (encode-char + (nth 2 enc-str) + '=>ucs@component) + #x5382) + (eq (encode-char + (nth 2 enc-str) + '=>ucs@component) + #x4E06) + (eq (encode-char + (nth 2 enc-str) + '=big5-cdp) + #x89CE) + (eq (encode-char + (nth 2 enc-str) + '=>big5-cdp) + #x88E2) + (eq (encode-char + (nth 2 enc-str) + '=big5-cdp) + #x88AD) + (eq (or (encode-char + (nth 2 enc-str) + '=>big5-cdp) + (encode-char + (nth 2 enc-str) + '=big5-cdp-itaiji-001)) + #x8766) + (eq (car + (get-char-attribute + (nth 2 enc-str) + 'ideographic-structure)) + ?⿸)) + ?⿸ + ?⿰)) + ((eq (car + (cdr + (assq 'ideographic-structure + (nth 2 enc-str)))) + ?⿸) + ?⿸) + (t + ?⿰)) + (nth 2 enc-str) + (nth 2 structure) + ))) + new-str)))) + ) + ((eq (car enc-str) ?⿸) + (list ?⿸ (nth 1 enc-str) + (list + (cons 'ideographic-structure + (setq new-str + (list + (cond + ((characterp (nth 2 enc-str)) + (if (memq (char-ucs (nth 2 enc-str)) + '(#x5F73)) + ?⿰ + ?⿱) + ) + (t + ?⿱)) + (nth 2 enc-str) + (nth 2 structure)))))) + ))) + ) + ((eq (car structure) ?⿹) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿰) + (list ?⿰ + (list (list 'ideographic-structure + ?⿱ + (nth 1 enc-str) + (nth 2 structure))) + (nth 2 enc-str)) + ))) + ) + ((eq (get-char-attribute (car structure) '=ucs-itaiji-001) #x2FF6) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿺) + (list ?⿺ + (list (list 'ideographic-structure + ?⿱ + (nth 2 structure) + (nth 1 enc-str))) + (nth 2 enc-str)) + ) + ((eq (car enc-str) ?⿱) + (list ?⿱ + (list (list 'ideographic-structure + ?⿰ + (nth 2 structure) + (nth 1 enc-str))) + (nth 2 enc-str)) + )) + ) + ) + ((eq (car structure) ?⿴) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (cond + ((and (characterp (nth 2 enc-str)) + (or (memq (char-ucs (nth 2 enc-str)) '(#x56D7 #x5F51 #x897F)) + (eq (char-feature (nth 2 enc-str) '=>big5-cdp) + #x87A5))) + (list ?⿱ + (nth 1 enc-str) + (list (list 'ideographic-structure + ?⿴ + (nth 2 enc-str) + (nth 2 structure))) + ) + ) + ((and (characterp (nth 2 enc-str)) + (eq (char-ucs (nth 2 enc-str)) #x51F5)) + (list ?⿱ + (nth 1 enc-str) + (list (list 'ideographic-structure + ?⿶ + (nth 2 enc-str) + (nth 2 structure))) + ) + ) + ((and (characterp (nth 1 enc-str)) + (eq (char-feature (nth 1 enc-str) '=>ucs@component) + #x300E6)) + (list ?⿱ + (list (list 'ideographic-structure + ?⿵ + (nth 1 enc-str) + (nth 2 structure))) + (nth 2 enc-str)) + ) + (t + (list ?⿳ + (nth 1 enc-str) + (nth 2 structure) + (nth 2 enc-str)) + )) + )) + ) + ) + ((eq (car structure) ?⿶) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (list ?⿱ + (list (list 'ideographic-structure + ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))) + (nth 2 enc-str))) + ) + ((eq (car enc-str) ?⿳) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (list ?⿳ + (list (list 'ideographic-structure + ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))) + (nth 2 enc-str) + (nth 3 enc-str))) + ) + ((eq (car enc-str) ?⿲) + (list ?⿲ + (nth 1 enc-str) + (list (list 'ideographic-structure + ?⿱ + (nth 2 structure) + (nth 2 enc-str))) + (nth 3 enc-str)) + ) + ((eq (car enc-str) ?⿴) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (list ?⿲ + (nth 1 enc2-str) + (list (list 'ideographic-structure + ?⿱ + (nth 2 structure) + (nth 2 enc-str))) + (nth 2 enc2-str))) + ))) + ) + ((eq (car structure) ?⿵) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (setq enc2-str (ideographic-character-get-structure (nth 2 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (list ?⿱ + (nth 1 enc-str) + (list (list 'ideographic-structure + ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))))) + ) + ((eq (car enc-str) ?⿳) + (setq enc2-str (ideographic-character-get-structure (nth 3 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (list ?⿳ + (nth 1 enc-str) + (nth 2 enc-str) + (list (list 'ideographic-structure + ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))))) + ) + ((eq (car enc-str) ?⿲) + (list ?⿲ + (nth 1 enc-str) + (list (list 'ideographic-structure + ?⿱ + (nth 2 enc-str) + (nth 2 structure))) + (nth 3 enc-str)) + ) + ((eq (car enc-str) ?⿴) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (list ?⿲ + (nth 1 enc2-str) + (list (list 'ideographic-structure + ?⿱ + (nth 2 enc-str) + (nth 2 structure))) + (nth 2 enc2-str))) + ))) + ) + ((eq (car structure) ?⿻) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (list ?⿳ + (nth 1 enc-str) + (nth 2 structure) + (nth 2 enc-str)) + ))) + )) + )) + +;;;###autoload +(defun ideographic-structure-compact (structure) + (let ((rest structure) + cell + ret dest sub) + (while rest + (setq cell (pop rest)) + (cond + ((and (consp cell) + (cond ((setq ret (assq 'ideographic-structure cell)) + (setq sub (cdr ret)) + ) + ((atom (car cell)) + (setq sub cell) + ))) + (setq cell + (if (setq ret (ideographic-structure-find-chars sub)) + (car ret) + (list (cons 'ideographic-structure sub)))) + )) + (setq dest (cons cell dest))) + (nreverse dest))) + +(defun ideographic-structure-compare-functional-and-apparent (structure + &optional char) + (let (enc enc-str enc2-str new-str f-res a-res code) + (cond + ((eq (car structure) ?⿸) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿰) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿰ + (nth 1 enc-str) + (list (cons 'ideographic-structure new-str))) + 111) + ) + ((and (eq (car enc-str) ?⿲) + (memq (char-ucs (nth 1 enc-str)) '(#x4EBB #x2E85)) + (eq (nth 2 enc-str) ?丨)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 3 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿰ + (decode-char '=big5-cdp #x8B7A) + (list (cons 'ideographic-structure new-str))) + 112) + ) + ((eq (car enc-str) ?⿱) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str + (list + (cond + ((characterp (nth 2 enc-str)) + (if (or (eq (encode-char (nth 2 enc-str) '=>ucs@component) + #x20087) + (eq (encode-char (nth 2 enc-str) '=>ucs@component) + #x5382) + (eq (encode-char (nth 2 enc-str) '=>ucs@component) + #x4E06) + (eq (encode-char (nth 2 enc-str) '=big5-cdp) + #x89CE) + (eq (encode-char (nth 2 enc-str) '=>big5-cdp) + #x88E2) + (eq (encode-char (nth 2 enc-str) '=big5-cdp) + #x88AD) + (eq (or (encode-char (nth 2 enc-str) '=>big5-cdp) + (encode-char (nth 2 enc-str) '=big5-cdp-itaiji-001)) + #x8766) + (eq (car (get-char-attribute (nth 2 enc-str) + 'ideographic-structure)) + ?⿸)) + ?⿸ + ?⿰)) + ((eq (car (cdr (assq 'ideographic-structure (nth 2 enc-str)))) + ?⿸) + ?⿸) + (t + ?⿰)) + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list + ?⿱ + (nth 1 enc-str) + (list + (cons 'ideographic-structure + (or (functional-ideographic-structure-to-apparent-structure + new-str) + new-str)))) + (if (eq (car new-str) ?⿸) + 121 + 122)) + ) + ((eq (car enc-str) ?⿸) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list (cond + ((characterp (nth 2 enc-str)) + (if (memq (char-ucs (nth 2 enc-str)) + '(#x5F73)) + ?⿰ + ?⿱) + ) + (t + ?⿱)) + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿸ (nth 1 enc-str) + (list (cons 'ideographic-structure new-str))) + (if (eq (car new-str) ?⿰) + 131 + 132)) + ))) + ) + ((eq (car structure) ?⿹) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿰) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 1 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿰ + (list (cons 'ideographic-structure new-str)) + (nth 2 enc-str)) + 210) + ))) + ) + ((eq (get-char-attribute (car structure) '=ucs-itaiji-001) #x2FF6) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿺) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 2 structure) + (nth 1 enc-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿺ + (list (cons 'ideographic-structure new-str)) + (nth 2 enc-str)) + 310) + ) + ((eq (car enc-str) ?⿱) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿰ + (nth 2 structure) + (nth 1 enc-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿱ + (list (cons 'ideographic-structure new-str)) + (nth 2 enc-str)) + 320) + )) + ) + ) + ((eq (car structure) ?⿴) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (cond + ((and (characterp (nth 2 enc-str)) + (or (memq (char-ucs (nth 2 enc-str)) '(#x56D7 #x5F51 #x897F)) + (eq (char-feature (nth 2 enc-str) '=>big5-cdp) + #x87A5))) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿴ + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿱ + (nth 1 enc-str) + (list (cons 'ideographic-structure new-str))) + 411) + ) + ((and (characterp (nth 2 enc-str)) + (eq (char-ucs (nth 2 enc-str)) #x51F5)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿶ + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿱ + (nth 1 enc-str) + (list (cons 'ideographic-structure + new-str))) + 412) + ) + ((and (characterp (nth 1 enc-str)) + (eq (char-feature (nth 1 enc-str) '=>ucs@component) + #x300E6)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿵ + (nth 1 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿱ + (list (cons 'ideographic-structure new-str)) + (nth 2 enc-str)) + 413) + ) + (t + (setq f-res (ids-find-chars-including-ids enc-str)) + (list enc + f-res + new-str + nil + (list ?⿳ + (nth 1 enc-str) + (nth 2 structure) + (nth 2 enc-str)) + 414) + )) + )) + ) + ) + ((eq (car structure) ?⿶) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿱ + (list (cons 'ideographic-structure new-str)) + (nth 2 enc-str)) + 511) + ) + ) + ((eq (car enc-str) ?⿳) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿳ + (list (cons 'ideographic-structure new-str)) + (nth 2 enc-str) + (nth 3 enc-str)) + 512) + ) + ) + ((eq (car enc-str) ?⿲) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 2 structure) + (nth 2 enc-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿲ + (nth 1 enc-str) + (list (cons 'ideographic-structure new-str)) + (nth 3 enc-str)) + 520) + ) + ((eq (car enc-str) ?⿴) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 2 structure) + (nth 2 enc-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿲ + (nth 1 enc2-str) + (list (cons 'ideographic-structure new-str)) + (nth 2 enc2-str)) + 530) + ) + ))) + ) + ((eq (car structure) ?⿵) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (setq enc2-str (ideographic-character-get-structure (nth 2 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿱ + (nth 1 enc-str) + (list (cons 'ideographic-structure new-str))) + 611) + ) + ) + ((eq (car enc-str) ?⿳) + (setq enc2-str (ideographic-character-get-structure (nth 3 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿲ + (nth 1 enc2-str) + (nth 2 structure) + (nth 2 enc2-str))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿳ + (nth 1 enc-str) + (nth 2 enc-str) + (list (cons 'ideographic-structure new-str))) + 612) + ) + ) + ((eq (car enc-str) ?⿲) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿲ + (nth 1 enc-str) + (list (cons 'ideographic-structure new-str)) + (nth 3 enc-str)) + 620) + ) + ((eq (car enc-str) ?⿴) + (setq enc2-str (ideographic-character-get-structure (nth 1 enc-str))) + (when (and enc2-str + (eq (car enc2-str) ?⿰)) + (setq f-res (ids-find-chars-including-ids enc-str)) + (setq new-str (list ?⿱ + (nth 2 enc-str) + (nth 2 structure))) + (setq a-res (ids-find-chars-including-ids new-str)) + (list enc + f-res + new-str + a-res + (list ?⿲ + (nth 1 enc2-str) + (list (cons 'ideographic-structure new-str)) + (nth 2 enc2-str)) + 630) + ) + ))) + ) + ((eq (car structure) ?⿻) + (setq enc (nth 1 structure)) + (when (setq enc-str + (cond ((characterp enc) + (get-char-attribute enc 'ideographic-structure) + ) + ((consp enc) + (cdr (assq 'ideographic-structure enc)) + ))) + (cond + ((eq (car enc-str) ?⿱) + (setq f-res (ids-find-chars-including-ids enc-str)) + (list enc + f-res + new-str + nil + (list ?⿳ + (nth 1 enc-str) + (nth 2 structure) + (nth 2 enc-str)) + 911) + ))) + )) + )) + + ;;; @ End. ;;;