1 ;;; qp.el --- Quoted-Printable functions
3 ;; Copyright (C) 1998, 1999, 2000, 2001, 2002 Free Software Foundation, Inc.
5 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
6 ;; Keywords: mail, extensions
8 ;; This file is part of GNU Emacs.
10 ;; GNU Emacs is free software; you can redistribute it and/or modify
11 ;; it under the terms of the GNU General Public License as published by
12 ;; the Free Software Foundation; either version 2, or (at your option)
13 ;; any later version.
15 ;; GNU Emacs is distributed in the hope that it will be useful,
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 ;; GNU General Public License for more details.
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with GNU Emacs; see the file COPYING. If not, write to the
22 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330,
23 ;; Boston, MA 02111-1307, USA.
27 ;; Functions for encoding and decoding quoted-printable text as
28 ;; defined in RFC 2045.
;; Value-less `defvar', evaluated at compile time only: it declares
;; `mm-use-ultra-safe-encoding' as a special variable for the compiler
;; without giving it a value.  The encoder in this file tests `boundp'
;; on the variable before reading it.
33 (eval-when-compile (defvar mm-use-ultra-safe-encoding
))
;; Decode quoted-printable text between FROM and TO, working on the
;; current buffer narrowed to that region.  CODING-SYSTEM is optional
;; and is passed to `mm-encode-coding-region' before the scan and to
;; `mm-decode-coding-region' after it.
;; NOTE(review): the embedded line numbers skip inside this definition,
;; so some forms are not visible here; the comments below describe
;; only the visible forms.
35 (defun quoted-printable-decode-region (from to
&optional coding-system
)
36 "Decode quoted-printable in the region between FROM and TO, per RFC 2045.
37 If CODING-SYSTEM is non-nil, decode bytes into characters with that
40 Interactively, you can supply the CODING-SYSTEM argument
41 with \\[universal-coding-system-argument]."
43 ;; Let the user determine the coding system with "C-x RET c".
;; Argument list built from the region bounds and
;; `coding-system-for-read' (presumably the `interactive' spec; its
;; head is not visible here -- confirm).
44 (list (region-beginning) (region-end) coding-system-for-read
))
;; A CODING-SYSTEM rejected by `mm-coding-system-p' is reset to nil.
45 (unless (mm-coding-system-p coding-system
) ; e.g. `ascii' from Gnus
46 (setq coding-system nil
))
49 ;; RFC 2045: ``An "=" followed by two hexadecimal digits, one
50 ;; or both of which are lowercase letters in "abcdef", is
51 ;; formally illegal. A robust implementation might choose to
52 ;; recognize them as the corresponding uppercase letters.''
;; Binding `case-fold-search' to t makes the "=[0-9A-F][0-9A-F]"
;; match below accept lowercase hex digits as well.
53 (let ((case-fold-search t
))
54 (narrow-to-region from to
)
55 ;; Do this in case we're called from Gnus, say, in a buffer
56 ;; which already contains non-ASCII characters which would
57 ;; then get doubly-decoded below.
;; NOTE(review): any guard on CODING-SYSTEM being non-nil is not
;; visible here -- confirm.
59 (mm-encode-coding-region (point-min) (point-max) coding-system
))
60 (goto-char (point-min))
;; `skip-chars-forward' with "^=" moves point over every character
;; that is not "=", so each iteration starts at the next "=" (the
;; rest of the loop condition is not visible here).
61 (while (and (skip-chars-forward "^=")
;; First case: the character right after the "=" is a newline.
63 (cond ((eq (char-after (1+ (point))) ?
\n)
;; Second case: "=" followed by two hex digits.  The text after the
;; "=" is converted with `string-to-int' and the result is handed to
;; `mm-insert-byte'.
65 ((looking-at "=[0-9A-F][0-9A-F]")
66 (let ((byte (string-to-int (buffer-substring (1+ (point))
69 (mm-insert-byte byte
1)
;; NOTE(review): presumably the fallback branch for any other "="
;; sequence; the branch head is not visible here.
74 (error "Malformed quoted-printable text")
;; Final pass over the narrowed region with CODING-SYSTEM.
77 (mm-decode-coding-region (point-min) (point-max) coding-system
)))))
;; String front end for `quoted-printable-decode-region'.
;; NOTE(review): only the region call is visible; how STRING reaches a
;; buffer and how the result is returned are not shown here
;; (presumably a temporary buffer -- confirm).
79 (defun quoted-printable-decode-string (string &optional coding-system
)
80 "Decode the quoted-printable encoded STRING and return the result.
81 If CODING-SYSTEM is non-nil, decode the region with coding-system."
;; Decode the whole accessible portion of the current buffer, passing
;; CODING-SYSTEM through unchanged.
84 (quoted-printable-decode-region (point-min) (point-max) coding-system
)
;; Quoted-printable encode the text between FROM and TO in the current
;; buffer.  Visible stages: a check that signals an error on
;; characters outside the accepted range, a default for CLASS,
;; escaping of characters not matched by CLASS, escaping of trailing
;; whitespace, and line folding when FOLD or
;; `mm-use-ultra-safe-encoding' is non-nil.
;; NOTE(review): the embedded line numbers skip inside this definition,
;; so the insert/delete forms and some guards are not visible here;
;; the comments below describe only the visible forms.
87 (defun quoted-printable-encode-region (from to
&optional fold class
)
88 "Quoted-printable encode the region between FROM and TO per RFC 2045.
90 If FOLD, fold long lines at 76 characters (as required by the RFC).
91 If CLASS is non-nil, translate the characters not matched by that
92 regexp class, which is in the form expected by `skip-chars-forward'.
93 You should probably avoid non-ASCII characters in this arg.
95 If `mm-use-ultra-safe-encoding' is set, fold lines unconditionally and
96 encode lines starting with \"From\"."
;; The search regexp is built with `string-to-multibyte' when that
;; function exists, otherwise with `mm-string-as-multibyte'; a match
;; in either branch signals the same error.
100 (if (fboundp 'string-to-multibyte
) ; Emacs 22
101 (if (re-search-forward (string-to-multibyte "[^\x0-\x7f\x80-\xff]")
103 ;; Fixme: This is somewhat misleading.
104 (error "Multibyte character in QP encoding region"))
105 (if (re-search-forward (mm-string-as-multibyte "[^\0-\377]") to t
)
106 (error "Multibyte character in QP encoding region"))))
108 ;; Avoid using 8bit characters. = is \075.
109 ;; Equivalent to "^\000-\007\013\015-\037\200-\377="
;; Default character class in `skip-chars-forward' syntax.
;; NOTE(review): presumably applied only when CLASS is nil; the guard
;; is not visible here -- confirm.
110 (setq class
"\010-\012\014\040-\074\076-\177"))
113 (narrow-to-region from to
)
114 ;; Encode all the non-ascii and control characters.
115 (goto-char (point-min))
;; Skip the run of characters allowed by CLASS; the character then at
;; point is formatted as "=" plus at least two uppercase hex digits.
116 (while (and (skip-chars-forward class
)
120 ;; To unibyte in case of Emacs 22 eight-bit.
121 (format "=%02X" (mm-multibyte-char-to-unibyte (char-after)))
123 ;; Encode white space at the end of lines.
124 (goto-char (point-min))
;; Each match is a run of spaces/tabs at end of line; point moves to
;; the start of the run and the character there is formatted as "=XX".
125 (while (re-search-forward "[ \t]+$" nil t
)
126 (goto-char (match-beginning 0))
130 (format "=%02X" (char-after))
;; Local rebinding: the variable reads as nil here when it is unbound,
;; and as its current value otherwise.
132 (let ((mm-use-ultra-safe-encoding
133 (and (boundp 'mm-use-ultra-safe-encoding
)
134 mm-use-ultra-safe-encoding
)))
135 (when (or fold mm-use-ultra-safe-encoding
)
136 (let ((tab-width 1)) ; HTAB is one character.
137 (goto-char (point-min))
139 ;; In ultra-safe mode, encode "From " at the beginning
141 (when mm-use-ultra-safe-encoding
142 (if (looking-at "From ")
143 (replace-match "From=20" nil t
)
;; "=2D" is the escape for "-" (hex 2D); the pattern whose match is
;; replaced here is not visible -- confirm.
145 (replace-match "=2D" nil t
))))
;; Folding loop.  After moving forward 75 characters, point backs up
;; onto an "=" found within the two preceding characters, presumably
;; so a fold does not land inside an "=XX" escape (the form that
;; inserts the break is not visible here).
148 (while (> (current-column) 76) ; tab-width must be 1.
150 (forward-char 75) ; 75 chars plus an "="
151 (search-backward "=" (- (point) 2) t
)
154 (forward-line))))))))
;; String front end for `quoted-printable-encode-region'.
;; NOTE(review): only the binding and the region call are visible; how
;; STRING reaches a buffer and how the result is returned are not
;; shown here (presumably a temporary buffer -- confirm).
156 (defun quoted-printable-encode-string (string)
157 "Encode the STRING as quoted-printable and return the result."
;; `default-enable-multibyte-characters' is bound to whether STRING is
;; multibyte, as reported by `mm-multibyte-string-p'.
158 (let ((default-enable-multibyte-characters (mm-multibyte-string-p string
)))
;; Encode the whole accessible portion of the buffer; FOLD and CLASS
;; are left at their nil defaults.
161 (quoted-printable-encode-region (point-min) (point-max))