1 ;;; qp.el --- Quoted-Printable functions
3 ;; Copyright (C) 1998-2017 Free Software Foundation, Inc.
5 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org>
6 ;; Keywords: mail, extensions
8 ;; This file is part of GNU Emacs.
10 ;; GNU Emacs is free software: you can redistribute it and/or modify
11 ;; it under the terms of the GNU General Public License as published by
12 ;; the Free Software Foundation, either version 3 of the License, or
13 ;; (at your option) any later version.
15 ;; GNU Emacs is distributed in the hope that it will be useful,
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
18 ;; GNU General Public License for more details.
20 ;; You should have received a copy of the GNU General Public License
21 ;; along with GNU Emacs. If not, see <https://www.gnu.org/licenses/>.
25 ;; Functions for encoding and decoding quoted-printable text as
26 ;; defined in RFC 2045.
;; Decode the quoted-printable text between FROM and TO, modifying the
;; buffer.  CODING-SYSTEM is optional and is reset to nil below when it
;; is not a valid coding system.
;; NOTE(review): the line numbers embedded in this listing skip in
;; several places, so some forms of this definition are not visible
;; here.  The comments added below describe only what is shown.
31 (defun quoted-printable-decode-region (from to
&optional coding-system
)
32 "Decode quoted-printable in the region between FROM and TO, per RFC 2045.
33 If CODING-SYSTEM is non-nil, decode bytes into characters with that
36 Interactively, you can supply the CODING-SYSTEM argument
37 with \\[universal-coding-system-argument].
39 The CODING-SYSTEM argument is a historical hangover and is deprecated.
40 QP encodes raw bytes and should be decoded into raw bytes. Decoding
41 them into characters should be done separately."
;; NOTE(review): the list below (region bounds plus the value of
;; `coding-system-for-read') reads like the argument spec of an
;; `interactive' form whose opening line is not visible -- confirm.
43 ;; Let the user determine the coding system with "C-x RET c".
44 (list (region-beginning) (region-end) coding-system-for-read
))
;; Ignore a CODING-SYSTEM value for which `coding-system-p' returns nil.
45 (when (and coding-system
46 (not (coding-system-p coding-system
))) ; e.g. `ascii' from Gnus
47 (setq coding-system nil
))
50 ;; RFC 2045: ``An "=" followed by two hexadecimal digits, one
51 ;; or both of which are lowercase letters in "abcdef", is
52 ;; formally illegal. A robust implementation might choose to
53 ;; recognize them as the corresponding uppercase letters.''
;; Binding `case-fold-search' to t lets the [0-9A-F] regexp used below
;; also match lowercase hex digits.
54 (let ((case-fold-search t
))
;; Restrict all following work to the FROM..TO region.
;; NOTE(review): presumably wrapped in `save-restriction' on a line not
;; visible here -- confirm.
55 (narrow-to-region from to
)
56 ;; Do this in case we're called from Gnus, say, in a buffer
57 ;; which already contains non-ASCII characters which would
58 ;; then get doubly-decoded below.
;; NOTE(review): any guard on CODING-SYSTEM being non-nil around this
;; call is not visible in this excerpt -- confirm.
60 (encode-coding-region (point-min) (point-max) coding-system
))
61 (goto-char (point-min))
;; Main loop: move point forward to the next "=" character.
;; NOTE(review): the second condition of this `and' is not visible.
62 (while (and (skip-chars-forward "^=")
;; First clause: the character right after the "=" is a newline.
;; NOTE(review): the action taken for this clause is not visible.
64 (cond ((eq (char-after (1+ (point))) ?
\n)
;; Second clause: a run of one or more "=XX" hex escapes at point.
66 ((looking-at "\\(=[0-9A-F][0-9A-F]\\)+")
67 ;; Decode this sequence at once; i.e. by a single
68 ;; deletion and insertion.
;; N is the number of three-character "=XX" groups in the match; STR is
;; a string of N characters, initially all zero.
69 (let* ((n (/ (- (match-end 0) (point)) 3))
70 (str (make-string n
0)))
;; N1 and N2 are the two hex-digit characters following the "=".
72 (let ((n1 (char-after (1+ (point))))
73 (n2 (char-after (+ 2 (point)))))
;; Combine the two digits into one value: 16 * high + low.  Each digit
;; is converted by subtracting ?0 for "0"-"9" or (- ?A 10) for digits
;; up to "F".
;; NOTE(review): the final else-branch of each inner `if' (presumably
;; for lowercase digits) and the form that stores the value are not
;; visible here -- confirm.
75 (+ (* 16 (- n1
(if (<= n1 ?
9) ?
0
76 (if (<= n1 ?F
) (- ?A
10)
78 (- n2
(if (<= n2 ?
9) ?
0
79 (if (<= n2 ?F
) (- ?A
10)
;; Remove the whole matched run of escapes from the buffer.
82 (delete-region (match-beginning 0) (match-end 0))
;; NOTE(review): presumably the fallback clause for an "=" that is
;; followed by neither a newline nor two hex digits; its clause head is
;; not visible -- confirm.
85 (message "Malformed quoted-printable text")
;; Finally decode the (narrowed) region with CODING-SYSTEM.
;; NOTE(review): any guard on CODING-SYSTEM being non-nil is not
;; visible in this excerpt -- confirm.
88 (decode-coding-region (point-min) (point-max) coding-system
)))))
;; String front end for `quoted-printable-decode-region'.
;; NOTE(review): the embedded line numbers skip here, so the forms that
;; set up the working buffer, insert STRING and return the result are
;; not visible in this excerpt.
90 (defun quoted-printable-decode-string (string &optional coding-system
)
91 "Decode the quoted-printable encoded STRING and return the result.
92 If CODING-SYSTEM is non-nil, decode the string with coding-system.
93 Use of CODING-SYSTEM is deprecated; this function should deal with
94 raw bytes, and coding conversion should be done separately."
;; Make the current buffer unibyte before decoding.
96 (set-buffer-multibyte nil
)
;; Decode the whole accessible portion of the current buffer, passing
;; CODING-SYSTEM through unchanged.
98 (quoted-printable-decode-region (point-min) (point-max) coding-system
)
;; Quoted-printable encode the text between FROM and TO, modifying the
;; buffer.  FOLD and CLASS are optional.
;; NOTE(review): the line numbers embedded in this listing skip in
;; several places, so some forms of this definition are not visible
;; here.  The comments added below describe only what is shown.
101 (defun quoted-printable-encode-region (from to
&optional fold class
)
102 "Quoted-printable encode the region between FROM and TO per RFC 2045.
104 If FOLD, fold long lines at 76 characters (as required by the RFC).
105 If CLASS is non-nil, translate the characters not matched by that
106 regexp class, which is in the form expected by `skip-chars-forward'.
107 You should probably avoid non-ASCII characters in this arg.
109 If `mm-use-ultra-safe-encoding' is set, fold lines unconditionally and
110 encode lines starting with \"From\"."
;; Default character class of characters that are left unencoded.
;; NOTE(review): presumably this assignment only happens when CLASS is
;; nil; the guarding form is not visible here -- confirm.
113 ;; Avoid using 8bit characters. = is \075.
114 ;; Equivalent to "^\000-\007\013\015-\037\200-\377="
115 (setq class
"\010-\012\014\040-\074\076-\177"))
;; Signal an error if the search finds a character matching the
;; regexp below.
;; NOTE(review): the search bound and the rest of the argument list are
;; not visible in this excerpt.
118 (if (re-search-forward (string-to-multibyte "[^\x0-\x7f\x80-\xff]")
120 (error "Multibyte character in QP encoding region"))
;; Restrict all following work to the FROM..TO region.
122 (narrow-to-region from to
)
123 ;; Encode all the non-ascii and control characters.
124 (goto-char (point-min))
;; Skip forward over characters in CLASS.
;; NOTE(review): the second condition of this `and' is not visible.
125 (while (and (skip-chars-forward class
)
;; Format the character at point as "=" plus two uppercase hex digits.
;; NOTE(review): the forms that insert this text and remove the
;; original character are not visible here.
129 (format "=%02X" (char-after))
131 ;; Encode white space at the end of lines.
132 (goto-char (point-min))
;; For each run of spaces/tabs at end of line, move to its start.
133 (while (re-search-forward "[ \t]+$" nil t
)
134 (goto-char (match-beginning 0))
;; Same "=XX" formatting as above, applied to the character at point.
138 (format "=%02X" (char-after))
;; Value of `mm-use-ultra-safe-encoding', or nil when that variable is
;; unbound.  NOTE(review): presumably the binding for `ultra', which is
;; tested below; the binding form itself is not visible -- confirm.
141 (and (boundp 'mm-use-ultra-safe-encoding
)
142 mm-use-ultra-safe-encoding
)))
;; The processing below runs when FOLD is non-nil or in ultra-safe mode.
143 (when (or fold ultra
)
;; `case-fold-search' is nil so that the "From " match below is
;; case-sensitive.
144 (let ((tab-width 1) ; HTAB is one character.
145 (case-fold-search nil
))
146 (goto-char (point-min))
148 ;; In ultra-safe mode, encode "From " at the beginning
;; Replace "From " at point with "From=20"; otherwise replace the
;; current match with "=2D".
;; NOTE(review): the test that selects the "=2D" replacement is not
;; visible in this excerpt.
151 (if (looking-at "From ")
152 (replace-match "From=20" nil t
)
154 (replace-match "=2D" nil t
))))
;; Fold while the current column exceeds 76.
157 (while (> (current-column) 76) ; tab-width must be 1.
159 (forward-char 75) ; 75 chars plus an "="
;; Look for an "=" within the two characters before point, without
;; signalling an error if none is found -- presumably to avoid breaking
;; the line in the middle of an "=XX" escape; confirm.
160 (search-backward "=" (- (point) 2) t
)
163 (forward-line))))))))
;; String front end for `quoted-printable-encode-region'.
;; NOTE(review): the embedded line numbers skip here, so the forms that
;; set up the working buffer, insert STRING and return the result are
;; not visible in this excerpt.
165 (defun quoted-printable-encode-string (string)
166 "Encode the STRING as quoted-printable and return the result."
;; Match the current buffer's multibyteness to STRING: multibyte
;; (argument `to') for a multibyte string, unibyte otherwise.
168 (if (multibyte-string-p string
)
169 (set-buffer-multibyte 'to
)
170 (set-buffer-multibyte nil
))
;; Encode the whole accessible portion of the current buffer, with no
;; FOLD or CLASS argument.
172 (quoted-printable-encode-region (point-min) (point-max))