+;;; @ lexical analyze
+;;;
+
+(defcustom std11-lexical-analyzer
+ '(std11-analyze-quoted-string
+ std11-analyze-domain-literal
+ std11-analyze-comment
+ std11-analyze-spaces
+ std11-analyze-special
+ std11-analyze-atom)
+ "*List of functions used to split a string into lexical tokens.
+Each function must accept two arguments: STRING and START.
+STRING is the target string to be analyzed.
+START is the position in STRING at which analysis begins.
+
+A function that recognizes a token at START must return a cons
+cell ((TYPE . TEXT) . END), where END is the position at which
+the analysis continues.  A function that recognizes nothing
+must return nil.
+
+The functions are tried in list order, so an earlier function takes
+precedence over a later one.  If a function returns nil, the next
+function is tried; otherwise its return value is used as the result."
+ :group 'news
+ :group 'mail
+ :type '(repeat function))
+
+;; The character lists are defined inside `eval-and-compile' so that
+;; they are also available to the `eval-when-compile' forms below (and
+;; in `std11-analyze-spaces') while this file is being byte-compiled.
+(eval-and-compile
+ ;; Space, tab and newline.
+ (defconst std11-space-char-list '(? ?\t ?\n))
+ ;; `]' is deliberately the first element: the list is spliced directly
+ ;; after `[' (or `[^') below, and a `]' in that position is taken
+ ;; literally instead of closing the bracket expression.
+ (defconst std11-special-char-list '(?\] ?\[
+ ?\( ?\) ?< ?> ?@
+ ?, ?\; ?: ?\\ ?\"
+ ?.))
+ )
+;; (defconst std11-spaces-regexp
+;; (eval-when-compile (concat "[" std11-space-char-list "]+")))
+
+;; Matches a single character that cannot be part of an atom, i.e. any
+;; special or space character.
+(defconst std11-non-atom-regexp
+ (eval-when-compile
+ (concat "[" std11-special-char-list std11-space-char-list "]")))
+
+;; Matches one or more characters that are neither special nor space
+;; characters.
+(defconst std11-atom-regexp
+ (eval-when-compile
+ (concat "[^" std11-special-char-list std11-space-char-list "]+")))
+
+(defun std11-analyze-spaces (string start)
+  "Analyze a run of white space in STRING beginning at START.
+Return ((spaces . TEXT) . END) when one or more space, tab or newline
+characters begin exactly at START, where END is the index just past
+the run.  Otherwise return nil."
+  (let ((found (string-match (eval-when-compile
+                               (concat "[" std11-space-char-list "]+"))
+                             string start)))
+    ;; `string-match' searches forward from START, so only a match that
+    ;; begins exactly at START counts.
+    (and found
+         (= found start)
+         (cons (cons 'spaces (substring string start (match-end 0)))
+               (match-end 0)))))
+
+(defun std11-analyze-special (string start)
+  "Analyze a single special character of STRING at START.
+Return ((specials . CHAR-STRING) . END) when the character at START is
+a member of `std11-special-char-list', where END is START + 1.
+Return nil when START is not inside STRING or the character is not
+special."
+  (and (< start (length string))
+       (memq (aref string start) std11-special-char-list)
+       (let ((next (1+ start)))
+         (cons (cons 'specials (substring string start next))
+               next))))
+
+(defun std11-analyze-atom (string start)
+  "Analyze an atom of STRING beginning at START.
+The atom extends up to the first character matched by
+`std11-non-atom-regexp', or to the end of STRING when there is none.
+Return ((atom . TEXT) . END), or nil when a non-atom character sits
+exactly at START."
+  (let ((stop (string-match std11-non-atom-regexp string start)))
+    (cond ((null stop)
+           ;; No terminator at all: the rest of STRING is the atom.
+           (cons (cons 'atom (substring string start))
+                 (length string)))
+          ((> stop start)
+           (cons (cons 'atom (substring string start stop))
+                 stop)))))
+
+(defun std11-check-enclosure (string open close &optional recursive from)
+  "Find the end of a construct of STRING enclosed by OPEN and CLOSE.
+OPEN and CLOSE are characters.  The construct must begin with OPEN at
+position FROM (default 0).  A backslash makes the scan skip the
+character that follows it.  An OPEN character found inside the
+construct is accepted only when RECURSIVE is non-nil, in which case
+the nested construct is skipped as a whole.
+
+Return the position just after the matching CLOSE, or nil when STRING
+does not have OPEN at FROM, when the construct is not terminated, or
+when a nested OPEN cannot be handled."
+  (let ((limit (length string))
+        (pos (or from 0))
+        result done ch inner)
+    (and (< pos limit)
+         (eq (aref string pos) open)
+         (progn
+           (setq pos (1+ pos))
+           (while (and (not done) (< pos limit))
+             (setq ch (aref string pos))
+             (cond ((eq ch ?\\)
+                    ;; Skip the backslash and the character it quotes;
+                    ;; a backslash at the very end is a failure.
+                    (if (>= (1+ pos) limit)
+                        (setq done t)
+                      (setq pos (+ pos 2))))
+                   ((eq ch close)
+                    (setq result (1+ pos)
+                          done t))
+                   ((eq ch open)
+                    (setq inner (and recursive
+                                     (std11-check-enclosure
+                                      string open close recursive pos)))
+                    (if inner
+                        (setq pos inner)
+                      (setq done t)))
+                   (t
+                    (setq pos (1+ pos)))))
+           result))))
+
+(defun std11-analyze-quoted-string (string start)
+  "Analyze a double-quoted string of STRING beginning at START.
+Return ((quoted-string . TEXT) . END), where TEXT is the text between
+the quotation marks (backslashes are left in place) and END is the
+position just after the closing quotation mark.  Return nil when no
+terminated quoted string begins at START."
+  (let ((end (std11-check-enclosure string ?\" ?\" nil start)))
+    (and end
+         (cons (cons 'quoted-string
+                     (substring string (1+ start) (1- end)))
+               end))))
+
+(defun std11-analyze-domain-literal (string start)
+  "Analyze a bracketed domain literal of STRING beginning at START.
+Return ((domain-literal . TEXT) . END), where TEXT is the text between
+`[' and `]' and END is the position just after the `]'.  Return nil
+when no terminated domain literal begins at START."
+  (let ((end (std11-check-enclosure string ?\[ ?\] nil start)))
+    (and end
+         (cons (cons 'domain-literal
+                     (substring string (1+ start) (1- end)))
+               end))))
+
+(defun std11-analyze-comment (string start)
+  "Analyze a parenthesized comment of STRING beginning at START.
+Nested parentheses are allowed.  Return ((comment . TEXT) . END),
+where TEXT is the text between the outermost parentheses and END is
+the position just after the closing one.  Return nil when no
+terminated comment begins at START."
+  (let ((end (std11-check-enclosure string ?\( ?\) t start)))
+    (and end
+         (cons (cons 'comment
+                     (substring string (1+ start) (1- end)))
+               end))))
+
+;;;###autoload
+(defun std11-lexical-analyze (string &optional analyzer start)
+  "Analyze STRING as lexical tokens of STD 11.
+ANALYZER is a list of analyzer functions and defaults to the value of
+`std11-lexical-analyzer'.  START is the position at which analysis
+begins and defaults to 0.
+
+At each position the functions of ANALYZER are tried in order and the
+first non-nil result ((TYPE . TEXT) . END) is used.  When no function
+recognizes anything, the rest of STRING becomes an (error . TEXT)
+token and analysis stops.  Return the list of (TYPE . TEXT) tokens in
+order of appearance."
+  (or analyzer
+      (setq analyzer std11-lexical-analyzer))
+  (or start
+      (setq start 0))
+  (let ((limit (length string))
+        tokens candidates hit)
+    (while (< start limit)
+      (setq candidates analyzer
+            hit nil)
+      ;; Try each analyzer in turn until one of them recognizes a token.
+      (while (and (car candidates)
+                  (null (setq hit (funcall (car candidates) string start))))
+        (setq candidates (cdr candidates)))
+      (if hit
+          (setq tokens (cons (car hit) tokens)
+                start (cdr hit))
+        ;; Nothing matched: swallow the remainder and leave the loop.
+        (setq tokens (cons (cons 'error (substring string start)) tokens)
+              start (1+ limit))))
+    (nreverse tokens)))
+
+
+;;; @ parser
+;;;
+
+(defun std11-ignored-token-p (token)
+  "Return t if TOKEN is a `spaces' or `comment' token, nil otherwise.
+TOKEN is a cons cell whose car is the token type."
+  (if (memq (car token) '(spaces comment))
+      t))
+
+(defun std11-parse-token (lal)
+  "Parse one significant token from the token list LAL.
+Leading tokens for which `std11-ignored-token-p' returns non-nil are
+collected together with the first token that is not ignored.
+
+Return (TOKENS . REST), where TOKENS is the list of skipped tokens
+followed by the significant token and REST is the remainder of LAL.
+Return nil when LAL contains no significant token."
+  (let (token itl)
+    (while (and lal
+                (std11-ignored-token-p (setq token (car lal))))
+      (setq itl (cons token itl)
+            lal (cdr lal)))
+    ;; LAL is nil here exactly when every remaining token was ignorable.
+    ;; TOKEN then still holds the last ignored token, which is already
+    ;; in ITL, so it must not be appended a second time.
+    (if lal
+        (cons (nreverse (cons token itl))
+              (cdr lal)))))
+
+(defun std11-parse-ascii-token (lal)
+  "Parse one significant, ASCII-only token from the token list LAL.
+Leading tokens for which `std11-ignored-token-p' returns non-nil are
+collected together with the first token that is not ignored.
+
+Return (TOKENS . REST), where TOKENS is the list of skipped tokens
+followed by the significant token and REST is the remainder of LAL.
+Return nil when LAL contains no significant token, or when the text
+of the significant token contains characters of a charset other than
+`ascii'."
+  (let (token itl token-value)
+    (while (and lal
+                (std11-ignored-token-p (setq token (car lal))))
+      (setq itl (cons token itl)
+            lal (cdr lal)))
+    ;; LAL is nil here exactly when every remaining token was ignorable.
+    ;; TOKEN then still holds the last ignored token, so it must not be
+    ;; treated as the significant one.
+    (and lal
+         token
+         (not (and (setq token-value (cdr token))
+                   (delq 'ascii (find-charset-string token-value))))
+         (cons (nreverse (cons token itl))
+               (cdr lal)))))
+
+(defun std11-parse-token-or-comment (lal)
+  "Parse one token from the token list LAL, treating comments as tokens.
+Only leading `spaces' tokens are skipped; they are collected together
+with the first token of any other type.
+
+Return (TOKENS . REST), where TOKENS is the list of skipped `spaces'
+tokens followed by that token and REST is the remainder of LAL.
+Return nil when LAL contains nothing but `spaces' tokens."
+  (let (token itl)
+    (while (and lal
+                (eq (car (setq token (car lal))) 'spaces))
+      (setq itl (cons token itl)
+            lal (cdr lal)))
+    ;; LAL is nil here exactly when only `spaces' tokens were left.
+    ;; TOKEN then still holds the last of them, which is already in ITL,
+    ;; so it must not be appended a second time.
+    (if lal
+        (cons (nreverse (cons token itl))
+              (cdr lal)))))
+
+(defun std11-parse-word (lal)
+  "Parse a word from the token list LAL.
+A word is an `atom' or `quoted-string' token, optionally preceded by
+ignored tokens, as delivered by `std11-parse-ascii-token'.
+Return ((word . TOKENS) . REST), or nil when LAL does not start with
+a word."
+  (let* ((ret (std11-parse-ascii-token lal))
+         (tokens (car ret)))
+    (and ret
+         (or (assq 'atom tokens)
+             (assq 'quoted-string tokens))
+         (cons (cons 'word tokens)
+               (cdr ret)))))
+
+(defun std11-parse-word-or-comment (lal)
+  "Parse a word or a comment from the token list LAL.
+The tokens are obtained with `std11-parse-token-or-comment'.
+Return ((word . TOKENS) . REST) when they contain an `atom' or
+`quoted-string' token, ((comment-word . TOKENS) . REST) when they
+contain a `comment' token, and nil otherwise."
+  (let* ((ret (std11-parse-token-or-comment lal))
+         (tokens (car ret))
+         (kind (cond ((or (assq 'atom tokens)
+                          (assq 'quoted-string tokens))
+                      'word)
+                     ((assq 'comment tokens)
+                      'comment-word))))
+    (and ret
+         kind
+         (cons (cons kind tokens)
+               (cdr ret)))))
+
+(defun std11-parse-phrase (lal)
+  "Parse a phrase from the token list LAL.
+A phrase is one or more consecutive items accepted by
+`std11-parse-word-or-comment'.  Return ((phrase . TOKENS) . REST),
+where TOKENS is the concatenation of the tokens of all items, or nil
+when LAL does not start with such an item."
+  (let (ret chunks tokens)
+    (while (setq ret (std11-parse-word-or-comment lal))
+      (setq chunks (cons (cdr (car ret)) chunks)
+            lal (cdr ret)))
+    ;; Join the per-item token lists in their original order.
+    (setq tokens (apply 'append (nreverse chunks)))
+    (and tokens
+         (cons (cons 'phrase tokens) lal))))
+
+(defun std11-parse-local-part (lal)
+  "Parse a local-part from the token list LAL.
+A local-part is a word followed by any number of `.' word pairs.
+Return ((local-part . TOKENS) . REST), where TOKENS holds the tokens
+of all words and dots consumed, or nil when LAL does not start with a
+word."
+  (let ((ret (std11-parse-word lal))
+        tokens sep continue)
+    (if ret
+        (progn
+          (setq tokens (cdr (car ret))
+                lal (cdr ret)
+                continue t)
+          (while continue
+            (setq ret (std11-parse-ascii-token lal)
+                  sep (car ret))
+            ;; Consume `.' WORD only as a pair; a dot that is not
+            ;; followed by a word is left unconsumed.
+            (if (and sep
+                     (string-equal (cdr (assq 'specials sep)) ".")
+                     (setq ret (std11-parse-word (cdr ret))))
+                (setq tokens (append tokens sep (cdr (car ret)))
+                      lal (cdr ret))
+              (setq continue nil)))
+          (cons (cons 'local-part tokens) lal)))))
+
+(defun std11-parse-sub-domain (lal)
+  "Parse a sub-domain from the token list LAL.
+A sub-domain is an `atom' or `domain-literal' token, optionally
+preceded by ignored tokens, as delivered by `std11-parse-ascii-token'.
+Return ((sub-domain . TOKENS) . REST), or nil when LAL does not start
+with a sub-domain."
+  (let* ((ret (std11-parse-ascii-token lal))
+         (tokens (car ret)))
+    (and ret
+         (or (assq 'atom tokens)
+             (assq 'domain-literal tokens))
+         (cons (cons 'sub-domain tokens)
+               (cdr ret)))))
+
+(defun std11-parse-domain (lal)
+  "Parse a domain from the token list LAL.
+A domain is a sub-domain followed by any number of `.' sub-domain
+pairs.  Return ((domain . TOKENS) . REST), where TOKENS holds the
+tokens of all sub-domains and dots consumed, or nil when LAL does not
+start with a sub-domain."
+  (let ((ret (std11-parse-sub-domain lal))
+        tokens sep continue)
+    (if ret
+        (progn
+          (setq tokens (cdr (car ret))
+                lal (cdr ret)
+                continue t)
+          (while continue
+            (setq ret (std11-parse-ascii-token lal)
+                  sep (car ret))
+            ;; Consume `.' SUB-DOMAIN only as a pair; a dot that is not
+            ;; followed by a sub-domain is left unconsumed.
+            (if (and sep
+                     (string-equal (cdr (assq 'specials sep)) ".")
+                     (setq ret (std11-parse-sub-domain (cdr ret))))
+                (setq tokens (append tokens sep (cdr (car ret)))
+                      lal (cdr ret))
+              (setq continue nil)))
+          (cons (cons 'domain tokens) lal)))))
+
+(defun std11-parse-at-domain (lal)
+  "Parse `@' followed by a domain from the token list LAL.
+Return ((at-domain . TOKENS) . REST), where TOKENS holds the tokens of
+the `@' sign followed by those of the domain, or nil when LAL does not
+start with `@' and a domain."
+  (let* ((ret (std11-parse-ascii-token lal))
+         (at-sign (car ret))
+         (domain (and at-sign
+                      (string-equal (cdr (assq 'specials at-sign)) "@")
+                      (std11-parse-domain (cdr ret)))))
+    (and domain
+         (cons (cons 'at-domain (append at-sign (cdr (car domain))))
+               (cdr domain)))))
+
+(defun std11-parse-addr-spec (lal)
+  "Parse an addr-spec from the token list LAL.
+An addr-spec is a local-part optionally followed by `@' and a domain;
+a missing domain part is tolerated.  Return ((addr-spec . TOKENS) . REST),
+or nil when LAL does not start with a local-part."
+  (let* ((local (std11-parse-local-part lal))
+         (tokens (cdr (car local)))
+         (domain (and local
+                      (std11-parse-at-domain (cdr local)))))
+    (and tokens
+         (if domain
+             (cons (cons 'addr-spec (append tokens (cdr (car domain))))
+                   (cdr domain))
+           ;; No `@' DOMAIN follows: the local-part alone is the result.
+           (cons (cons 'addr-spec tokens)
+                 (cdr local))))))
+
+(defun std11-parse-route (lal)
+ "Parse a route from the token list LAL.
+A route is an at-domain, followed by any number of `,' at-domain
+pairs, followed by `:'.  Return ((route . TOKENS) . REST), where
+TOKENS holds every token consumed including the commas and the
+colon, or nil when LAL does not start with a complete route."
+ (let ((ret (std11-parse-at-domain lal))
+ route comma colon)
+ (if (and ret
+ (progn
+ (setq route (cdr (car ret)))
+ (setq lal (cdr ret))
+ ;; Collect further `,' at-domain pairs.  LAL only advances when
+ ;; both the comma and the at-domain after it were parsed.
+ (while (and (setq ret (std11-parse-ascii-token lal))
+ (setq comma (car ret))
+ (string-equal (cdr (assq 'specials comma)) ",")
+ (setq ret (std11-parse-at-domain (cdr ret)))
+ )
+ (setq route (append route comma (cdr (car ret))))
+ (setq lal (cdr ret))
+ )
+ ;; The route must be terminated by `:'.  The value of this form
+ ;; is the value of the `progn' and decides success; on success
+ ;; RET holds the parse result of the colon.
+ (and (setq ret (std11-parse-ascii-token lal))
+ (setq colon (car ret))
+ (string-equal (cdr (assq 'specials colon)) ":")
+ (setq route (append route colon))
+ )
+ ))
+ (cons (cons 'route route)
+ (cdr ret)
+ )
+ )))
+
+(defun std11-parse-route-addr (lal)
+ "Parse a route-addr from the token list LAL.
+A route-addr is `<', an optional route, an addr-spec and `>'.
+Return ((route-addr . TOKENS) . REST), where TOKENS holds the tokens
+of the route (if any) followed by those of the addr-spec; the tokens
+of the angle brackets are not included.  Return nil when LAL does not
+start with a complete route-addr."
+ ;; `<' and `>' are used below as ordinary local variable names holding
+ ;; the token lists of the opening and closing angle bracket.
+ (let ((ret (std11-parse-ascii-token lal))
+ < route addr-spec >)
+ (if (and ret
+ (setq < (car ret))
+ (string-equal (cdr (assq 'specials <)) "<")
+ (setq lal (cdr ret))
+ ;; The route is optional: the inner `and' only records it when
+ ;; present, and the value of the `progn' is that of the addr-spec
+ ;; parse, which is mandatory.
+ (progn (and (setq ret (std11-parse-route lal))
+ (setq route (cdr (car ret)))
+ (setq lal (cdr ret))
+ )
+ (setq ret (std11-parse-addr-spec lal))
+ )
+ (setq addr-spec (cdr (car ret)))
+ (setq lal (cdr ret))
+ (setq ret (std11-parse-ascii-token lal))
+ (setq > (car ret))
+ (string-equal (cdr (assq 'specials >)) ">")
+ )
+ (cons (cons 'route-addr (append route addr-spec))
+ (cdr ret)
+ )
+ )))
+
+(defun std11-parse-phrase-route-addr (lal)
+  "Parse an optional phrase followed by a route-addr from LAL.
+LAL is a token list.  Return
+((phrase-route-addr PHRASE ROUTE-ADDR) . REST), where PHRASE is the
+token list of the phrase (nil when there is none) and ROUTE-ADDR is
+the token list of the route-addr.  Return nil when no route-addr
+follows."
+  (let* ((leading (std11-parse-phrase lal))
+         (phrase (cdr (car leading)))
+         (route-addr (std11-parse-route-addr (if leading
+                                                 (cdr leading)
+                                               lal))))
+    (and route-addr
+         (cons (list 'phrase-route-addr
+                     phrase
+                     (cdr (car route-addr)))
+               (cdr route-addr)))))
+
+(defun std11-parse-mailbox (lal)
+  "Parse a mailbox from the token list LAL.
+A mailbox is either a phrase-route-addr or an addr-spec, optionally
+followed by a comment.  Return ((mailbox ADDRESS COMMENT) . REST),
+where ADDRESS is the parsed phrase-route-addr or addr-spec element
+and COMMENT is the text of the trailing comment or nil.  Return nil
+when LAL does not start with a mailbox."
+  (let ((ret (or (std11-parse-phrase-route-addr lal)
+                 (std11-parse-addr-spec lal)))
+        mbox comment)
+    (if ret
+        (progn
+          (setq mbox (car ret)
+                lal (cdr ret))
+          ;; A comment directly after the address belongs to the
+          ;; mailbox; it is consumed only when one is actually there.
+          (setq ret (std11-parse-token-or-comment lal))
+          (setq comment (and ret
+                             (cdr (assq 'comment (car ret)))))
+          (if comment
+              (setq lal (cdr ret)))
+          (if mbox
+              (cons (list 'mailbox mbox comment)
+                    lal))))))
+
+(defun std11-parse-group (lal)
+ "Parse a group from the token list LAL.
+A group is a phrase, `:', an optional comma-separated list of
+mailboxes, and `;'.  Return ((group PHRASE MAILBOXES) . REST), where
+PHRASE is the token list of the phrase and MAILBOXES is the list of
+parsed mailboxes in order of appearance.  Return nil when LAL does
+not start with a complete group."
+ (let ((ret (std11-parse-phrase lal))
+ phrase colon comma mbox semicolon)
+ (if (and ret
+ (setq phrase (cdr (car ret)))
+ (setq lal (cdr ret))
+ (setq ret (std11-parse-ascii-token lal))
+ (setq colon (car ret))
+ (string-equal (cdr (assq 'specials colon)) ":")
+ (setq lal (cdr ret))
+ (progn
+ ;; The mailbox list is optional; the value of this inner `and' is
+ ;; ignored.  MBOX accumulates the mailboxes in reverse order.
+ (and (setq ret (std11-parse-mailbox lal))
+ (setq mbox (list (car ret)))
+ (setq lal (cdr ret))
+ (progn
+ ;; This `while' has no body: all the work happens in its
+ ;; condition.  Note that LAL is advanced past a comma before
+ ;; the mailbox after it is parsed.
+ (while (and (setq ret (std11-parse-ascii-token lal))
+ (setq comma (car ret))
+ (string-equal
+ (cdr (assq 'specials comma)) ",")
+ (setq lal (cdr ret))
+ (setq ret (std11-parse-mailbox lal))
+ (setq mbox (cons (car ret) mbox))
+ (setq lal (cdr ret))
+ )
+ )))
+ ;; The group must be terminated by `;'.  On success RET holds the
+ ;; parse result of the semicolon.
+ (and (setq ret (std11-parse-ascii-token lal))
+ (setq semicolon (car ret))
+ (string-equal (cdr (assq 'specials semicolon)) ";")
+ )))
+ (cons (list 'group phrase (nreverse mbox))
+ (cdr ret)
+ )
+ )))
+
+(defun std11-parse-address (lal)
+  "Parse an address from the token list LAL.
+An address is a group or, failing that, a mailbox.  Return the result
+of `std11-parse-group' when it is non-nil, otherwise the result of
+`std11-parse-mailbox'."
+  (let ((group (std11-parse-group lal)))
+    (if group
+        group
+      (std11-parse-mailbox lal))))
+
+(defun std11-parse-addresses (lal)
+  "Parse a comma-separated list of addresses from the token list LAL.
+Return the list of parsed addresses in order of appearance, or nil
+when LAL does not start with an address.  Parsing stops at the first
+position that is not `,' followed by an address; the tokens left over
+are not returned."
+  (let ((ret (std11-parse-address lal))
+        result sep)
+    (while ret
+      (setq result (cons (car ret) result)
+            sep (std11-parse-ascii-token (cdr ret))
+            ;; Go on only when `,' and another address follow.
+            ret (and sep
+                     (string-equal (cdr (assq 'specials (car sep))) ",")
+                     (std11-parse-address (cdr sep)))))
+    (nreverse result)))
+
+(defun std11-parse-msg-id (lal)
+  "Parse a msg-id from the token list LAL.
+A msg-id is `<', an addr-spec and `>'.  Return ((msg-id . TOKENS) . REST),
+where TOKENS is the token list of the addr-spec (the angle brackets
+are not included), or nil when LAL does not start with a complete
+msg-id."
+  (let* ((lt (std11-parse-ascii-token lal))
+         (spec (and (car lt)
+                    (string-equal (cdr (assq 'specials (car lt))) "<")
+                    ;; Something must follow the `<'.
+                    (cdr lt)
+                    (std11-parse-addr-spec (cdr lt))))
+         (gt (and (car spec)
+                  ;; Something must follow the addr-spec.
+                  (cdr spec)
+                  (std11-parse-ascii-token (cdr spec)))))
+    (and (car gt)
+         (string-equal (cdr (assq 'specials (car gt))) ">")
+         (cons (cons 'msg-id (cdr (car spec)))
+               (cdr gt)))))
+
+(defun std11-parse-msg-ids (tokens)
+  "Parse lexical TOKENS as `*(phrase / msg-id)', and return the result.
+At each position a msg-id is tried first and a phrase second.  The
+result is the list of parsed elements in order of appearance, or nil
+when TOKENS starts with neither."
+  (let (result ret)
+    (while (setq ret (or (std11-parse-msg-id tokens)
+                         (std11-parse-phrase tokens)))
+      (setq result (cons (car ret) result)
+            tokens (cdr ret)))
+    (nreverse result)))
+
+;; `std11-parse-in-reply-to' is kept as an obsolete alias of
+;; `std11-parse-msg-ids'.
+(defalias 'std11-parse-in-reply-to 'std11-parse-msg-ids)
+;; NOTE(review): `make-obsolete' is called here without a WHEN argument.
+;; Emacs 28 and later require WHEN -- confirm which Emacs versions this
+;; file has to support and supply the obsolescence date if needed.
+(make-obsolete 'std11-parse-in-reply-to 'std11-parse-msg-ids)
+
+