1 ;;; ietf-drums.el --- Functions for parsing RFC822bis headers
3 ;; Copyright (C) 1998-2017 Free Software Foundation, Inc.
5 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
6 ;; This file is part of GNU Emacs.
8 ;; GNU Emacs is free software: you can redistribute it and/or modify
9 ;; it under the terms of the GNU General Public License as published by
10 ;; the Free Software Foundation, either version 3 of the License, or
11 ;; (at your option) any later version.
13 ;; GNU Emacs is distributed in the hope that it will be useful,
14 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
15 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 ;; GNU General Public License for more details.
18 ;; You should have received a copy of the GNU General Public License
19 ;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
23 ;; DRUMS is an IETF Working Group that works (or worked) on the
24 ;; successor to RFC822, "Standard For The Format Of Arpa Internet Text
25 ;; Messages". This library is based on
26 ;; draft-ietf-drums-msg-fmt-05.txt, released on 1998-08-05.
28 ;; Pending a real regression self test suite, Simon Josefsson added
29 ;; various self test expressions snipped from bug reports, and their
;; expected value, below.  If you believe it could be useful, please
31 ;; add your own test cases, or write a real self test suite, or just
34 ;; <m3oekvfd50.fsf@whitebox.m5r.de>
35 ;; (ietf-drums-parse-address "'foo' <foo@example.com>")
36 ;; => ("foo@example.com" . "'foo'")
40 (eval-when-compile (require 'cl
))
(defvar ietf-drums-no-ws-ctl-token
  ;; Octal ranges: ^A-^H, then ^K and ^L, then ^N-^_, and finally DEL.
  "\001-\010\013\014\016-\037\177"
  "Character ranges covering the US-ASCII control characters.
TAB, LF and CR are left out, so no white space or line terminator
is included.  The value is written in character-range notation.")
(defvar ietf-drums-text-token
  ;; Everything from ^A up to DEL, skipping only LF (\012) and CR (\015).
  "\001-\011\013\014\016-\177"
  "Character ranges covering US-ASCII text.
Every character from \\001 through \\177 is included except the
line terminators CR and LF.")
(defvar ietf-drums-specials-token
  ;; Parens, angle and square brackets, colon, semicolon, at-sign,
  ;; backslash, comma, full stop and double quote.
  "()<>[]:;@\\,.\""
  "String holding the characters that are special in header syntax.")
48 (defvar ietf-drums-quote-token
"\\"
50 (defvar ietf-drums-wsp-token
" \t"
(defvar ietf-drums-fws-regexp
  ;; Build the white-space bracket expression once and reuse it on both
  ;; sides of the newline.
  (let ((wsp-class (concat "[" ietf-drums-wsp-token "]")))
    (concat wsp-class "*" "\n" wsp-class "+"))
  "Regexp matching folding white space.
It matches optional white space, a newline, and then at least one
white space character, using `ietf-drums-wsp-token' as the set of
white space characters.")
55 (defvar ietf-drums-atext-token
"-^a-zA-Z0-9!#$%&'*+/=?_`{|}~"
(defvar ietf-drums-dot-atext-token
  ;; Same character set as the atext token, with a trailing "." added.
  "-^a-zA-Z0-9!#$%&'*+/=?_`{|}~."
  "Character ranges for textual tokens that may contain a full stop.")
(defvar ietf-drums-qtext-token
  (concat ietf-drums-no-ws-ctl-token
          "\041"                        ; `!'
          "\043-\133"                   ; `#' through `['
          "\135-\177")                  ; `]' through DEL
  "Character ranges allowed as plain text inside a quoted string.
This is `ietf-drums-no-ws-ctl-token' followed by the remaining
ASCII characters, leaving out the double quote (\\042) and the
backslash (\\134).")
63 (defvar ietf-drums-tspecials
"][()<>@,;:\\\"/?="
66 (defvar ietf-drums-syntax-table
67 (let ((table (copy-syntax-table emacs-lisp-mode-syntax-table
)))
68 (modify-syntax-entry ?
\\ "/" table
)
69 (modify-syntax-entry ?
< "(" table
)
70 (modify-syntax-entry ?
> ")" table
)
71 (modify-syntax-entry ?
@ "w" table
)
72 (modify-syntax-entry ?
/ "w" table
)
73 (modify-syntax-entry ?
* "_" table
)
74 (modify-syntax-entry ?\
; "_" table)
75 (modify-syntax-entry ?
\' "_" table
)
78 (defun ietf-drums-token-to-list (token)
79 "Translate TOKEN into a list of characters."
82 (while (< i
(length token
))
83 (setq c
(aref token i
))
92 (push (make-char 'ascii b
) out
)
96 (push (make-char 'ascii c
) out
))
99 (push (make-char 'ascii b
) out
))
(defsubst ietf-drums-init (string)
  "Set up the current buffer for parsing STRING.
Install `ietf-drums-syntax-table' as the buffer's syntax table,
insert STRING at point, unfold folding white space with
`ietf-drums-unfold-fws', and leave point at the beginning of the
accessible portion of the buffer."
  (set-syntax-table ietf-drums-syntax-table)
  ;; The parsers that call this work on buffer text, so STRING must be
  ;; in the buffer before unfolding; without this the argument is
  ;; silently ignored.
  (insert string)
  (ietf-drums-unfold-fws)
  (goto-char (point-min)))
109 (defun ietf-drums-remove-comments (string)
110 "Remove comments from STRING."
113 (ietf-drums-init string
)
115 (setq c
(char-after))
120 (error (goto-char (point-max)))))
125 (with-syntax-table (copy-syntax-table ietf-drums-syntax-table
)
126 (modify-syntax-entry ?
\" "w")
129 (error (point-max)))))
134 (defun ietf-drums-remove-whitespace (string)
135 "Remove whitespace from STRING."
137 (ietf-drums-init string
)
140 (setq c
(char-after))
146 ((memq c
'(?\ ?
\t ?
\n ?
\r))
152 (defun ietf-drums-get-comment (string)
153 "Return the first comment in STRING."
155 (ietf-drums-init string
)
158 (setq c
(char-after))
166 (progn (forward-sexp 1) (1- (point))))))
(defun ietf-drums-strip (string)
  "Return STRING with its comments and whitespace removed.
Comments are removed first, then whitespace is removed from what
is left."
  (let ((without-comments (ietf-drums-remove-comments string)))
    (ietf-drums-remove-whitespace without-comments)))
175 (defun ietf-drums-remove-garbage (string)
176 "Remove some garbage from STRING."
177 (while (string-match "[][()<>@,;:\\\"/?=]+" string
)
178 (setq string
(concat (substring string
0 (match-beginning 0))
179 (substring string
(match-end 0)))))
(defun ietf-drums-strip-cte (string)
  "Return STRING with comments, whitespace and garbage removed.
STRING is expected to be the value of a mail's
Content-Transfer-Encoding header."
  ;; `inline' is kept so the byte compiler may still open-code the
  ;; call to `ietf-drums-strip'.
  (let ((stripped (inline (ietf-drums-strip string))))
    (ietf-drums-remove-garbage stripped)))
188 (defun ietf-drums-parse-address (string)
189 "Parse STRING and return a MAILBOX / DISPLAY-NAME pair."
191 (let (display-name mailbox c display-string
)
192 (ietf-drums-init string
)
194 (setq c
(char-after))
195 ;; If we have an uneven number of quote characters,
196 ;; `forward-sexp' will fail. In these cases, just delete the
197 ;; final of these quote characters.
198 (when (and (eq c ?
\")
205 (setq c
(char-after)))
213 (push (buffer-substring
214 (1+ (point)) (progn (forward-sexp 1) (1- (point))))
216 ((looking-at (concat "[" ietf-drums-atext-token
"@" "]"))
217 (push (buffer-substring (point) (progn (forward-sexp 1) (point)))
221 (ietf-drums-remove-whitespace
222 (ietf-drums-remove-comments
225 (progn (forward-sexp 1) (1- (point))))))))
228 ;; If we found no display-name, then we look for comments.
231 (mapconcat 'identity
(reverse display-name
) " "))
232 (setq display-string
(ietf-drums-get-comment string
)))
234 (when (and display-string
235 (string-match "@" display-string
))
237 (mapconcat 'identity
(nreverse display-name
) "")
238 (ietf-drums-get-comment string
)))
239 (cons mailbox display-string
)))))
241 (defun ietf-drums-parse-addresses (string &optional rawp
)
242 "Parse STRING and return a list of MAILBOX / DISPLAY-NAME pairs.
243 If RAWP, don't actually parse the addresses, but instead return
244 a list of address strings."
248 (ietf-drums-init string
)
252 (setq c
(char-after))
254 ((memq c
'(?
\" ?
< ?\
())
258 (skip-chars-forward "^,"))))
262 (buffer-substring beg
(point))
264 (ietf-drums-parse-address
265 (buffer-substring beg
(point)))
267 (if address
(push address pairs
))
274 (buffer-substring beg
(point))
276 (ietf-drums-parse-address
277 (buffer-substring beg
(point)))
279 (if address
(push address pairs
))
(defun ietf-drums-unfold-fws ()
  "Replace each run of folding white space in the buffer with one space.
The search starts at the beginning of the accessible portion of
the current buffer and uses `ietf-drums-fws-regexp'.  Point is
left at the beginning of the buffer afterwards."
  (let ((start (point-min))
        (single-space " "))
    (goto-char start)
    ;; FIXEDCASE and LITERAL are both non-nil, so the replacement text
    ;; is inserted exactly as given.
    (while (re-search-forward ietf-drums-fws-regexp nil t)
      (replace-match single-space t t))
    (goto-char (point-min))))
(defun ietf-drums-parse-date (string)
  "Convert the date in STRING to an Emacs time value.
STRING is decoded with `parse-time-string' and the resulting
fields are handed to `encode-time'."
  (let ((fields (parse-time-string string)))
    (apply #'encode-time fields)))
293 (defun ietf-drums-narrow-to-header ()
294 "Narrow to the header section in the current buffer."
296 (goto-char (point-min))
297 (if (re-search-forward "^\r?$" nil
1)
300 (goto-char (point-min)))
302 (defun ietf-drums-quote-string (string)
303 "Quote string if it needs quoting to be displayed in a header."
304 (if (string-match (concat "[^" ietf-drums-atext-token
"]") string
)
305 (concat "\"" string
"\"")
308 (defun ietf-drums-make-address (name address
)
310 (concat (ietf-drums-quote-string name
) " <" address
">")
313 (provide 'ietf-drums
)
315 ;;; ietf-drums.el ends here