Mercurial > emacs
annotate lisp/gnus/qp.el @ 86444:49cdf6b61ecb
*** empty log message ***
author | Glenn Morris <rgm@gnu.org> |
---|---|
date | Mon, 26 Nov 2007 03:49:23 +0000 |
parents | 1cdfc94602cb |
children | 107ccd98fa12 53108e6cea98 |
rev | line source |
---|---|
31717 | 1 ;;; qp.el --- Quoted-Printable functions |
32103 | 2 |
64754
fafd692d1e40
Update years in copyright notice; nfc.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
64085
diff
changeset
|
3 ;; Copyright (C) 1998, 1999, 2000, 2001, 2002, 2003, 2004, |
75347 | 4 ;; 2005, 2006, 2007 Free Software Foundation, Inc. |
31717 | 5 |
6 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org> | |
32103 | 7 ;; Keywords: mail, extensions |
8 | |
31717 | 9 ;; This file is part of GNU Emacs. |
10 | |
11 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
12 ;; it under the terms of the GNU General Public License as published by | |
78224
24202b793a08
Switch license to GPLv3 or later.
Glenn Morris <rgm@gnu.org>
parents:
75347
diff
changeset
|
13 ;; the Free Software Foundation; either version 3, or (at your option) |
31717 | 14 ;; any later version. |
15 | |
16 ;; GNU Emacs is distributed in the hope that it will be useful, | |
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
19 ;; GNU General Public License for more details. | |
20 | |
21 ;; You should have received a copy of the GNU General Public License | |
22 ;; along with GNU Emacs; see the file COPYING. If not, write to the | |
64085 | 23 ;; Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, |
24 ;; Boston, MA 02110-1301, USA. | |
31717 | 25 |
26 ;;; Commentary: | |
27 | |
32103 | 28 ;; Functions for encoding and decoding quoted-printable text as |
29 ;; defined in RFC 2045. | |
30 | |
31717 | 31 ;;; Code: |
32 | |
32504 | 33 (require 'mm-util) |
86154 | 34 (defvar mm-use-ultra-safe-encoding) |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
35 |
56927
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
36 ;;;###autoload |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
37 (defun quoted-printable-decode-region (from to &optional coding-system) |
32103 | 38 "Decode quoted-printable in the region between FROM and TO, per RFC 2045. |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
39 If CODING-SYSTEM is non-nil, decode bytes into characters with that |
43737
4f7c660e6029
* qp.el (quoted-printable-decode-region): Doc addition.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
38103
diff
changeset
|
40 coding-system. |
4f7c660e6029
* qp.el (quoted-printable-decode-region): Doc addition.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
38103
diff
changeset
|
41 |
4f7c660e6029
* qp.el (quoted-printable-decode-region): Doc addition.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
38103
diff
changeset
|
42 Interactively, you can supply the CODING-SYSTEM argument |
56927
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
43 with \\[universal-coding-system-argument]. |
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
44 |
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
45 The CODING-SYSTEM argument is a historical hangover and is deprecated. |
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
46 QP encodes raw bytes and should be decoded into raw bytes. Decoding |
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
47 them into characters should be done separately." |
38103
282970d20daa
(quoted-printable-decode-region): If called interactively,
Eli Zaretskii <eliz@gnu.org>
parents:
35931
diff
changeset
|
48 (interactive |
282970d20daa
(quoted-printable-decode-region): If called interactively,
Eli Zaretskii <eliz@gnu.org>
parents:
35931
diff
changeset
|
49 ;; Let the user determine the coding system with "C-x RET c". |
282970d20daa
(quoted-printable-decode-region): If called interactively,
Eli Zaretskii <eliz@gnu.org>
parents:
35931
diff
changeset
|
50 (list (region-beginning) (region-end) coding-system-for-read)) |
32462
7a39fdec7aac
(quoted-printable-decode-region): Avoid invalid
Dave Love <fx@gnu.org>
parents:
32211
diff
changeset
|
51 (unless (mm-coding-system-p coding-system) ; e.g. `ascii' from Gnus |
7a39fdec7aac
(quoted-printable-decode-region): Avoid invalid
Dave Love <fx@gnu.org>
parents:
32211
diff
changeset
|
52 (setq coding-system nil)) |
31717 | 53 (save-excursion |
54 (save-restriction | |
32462
7a39fdec7aac
(quoted-printable-decode-region): Avoid invalid
Dave Love <fx@gnu.org>
parents:
32211
diff
changeset
|
55 ;; RFC 2045: ``An "=" followed by two hexadecimal digits, one |
7a39fdec7aac
(quoted-printable-decode-region): Avoid invalid
Dave Love <fx@gnu.org>
parents:
32211
diff
changeset
|
56 ;; or both of which are lowercase letters in "abcdef", is |
7a39fdec7aac
(quoted-printable-decode-region): Avoid invalid
Dave Love <fx@gnu.org>
parents:
32211
diff
changeset
|
57 ;; formally illegal. A robust implementation might choose to |
7a39fdec7aac
(quoted-printable-decode-region): Avoid invalid
Dave Love <fx@gnu.org>
parents:
32211
diff
changeset
|
58 ;; recognize them as the corresponding uppercase letters.'' |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
59 (let ((case-fold-search t)) |
31717 | 60 (narrow-to-region from to) |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
61 ;; Do this in case we're called from Gnus, say, in a buffer |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
62 ;; which already contains non-ASCII characters which would |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
63 ;; then get doubly-decoded below. |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
64 (if coding-system |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
65 (mm-encode-coding-region (point-min) (point-max) coding-system)) |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
66 (goto-char (point-min)) |
35619
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
67 (while (and (skip-chars-forward "^=") |
32103 | 68 (not (eobp))) |
69 (cond ((eq (char-after (1+ (point))) ?\n) | |
70 (delete-char 2)) | |
71 ((looking-at "=[0-9A-F][0-9A-F]") | |
62907
88db2adda4b7
Revision: miles@gnu.org--gnu-2005/emacs--cvs-trunk--0--patch-339
Miles Bader <miles@gnu.org>
parents:
61644
diff
changeset
|
72 (let ((byte (string-to-number (buffer-substring (1+ (point)) |
85712
a3c27999decb
Update Gnus to No Gnus 0.7 from the Gnus CVS trunk
Miles Bader <miles@gnu.org>
parents:
78224
diff
changeset
|
73 (+ 3 (point))) |
a3c27999decb
Update Gnus to No Gnus 0.7 from the Gnus CVS trunk
Miles Bader <miles@gnu.org>
parents:
78224
diff
changeset
|
74 16))) |
47944
03cfc305a0fa
(quoted-printable-encode-region): Use mm-insert-byte.
Dave Love <fx@gnu.org>
parents:
43737
diff
changeset
|
75 (mm-insert-byte byte 1) |
56927
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
76 (delete-char 3))) |
32103 | 77 (t |
56927
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
78 (message "Malformed quoted-printable text") |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
79 (forward-char))))) |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
80 (if coding-system |
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
81 (mm-decode-coding-region (point-min) (point-max) coding-system))))) |
31717 | 82 |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
83 (defun quoted-printable-decode-string (string &optional coding-system) |
32103 | 84 "Decode the quoted-printable encoded STRING and return the result. |
79313 | 85 If CODING-SYSTEM is non-nil, decode the string with coding-system. |
56927
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
86 Use of CODING-SYSTEM is deprecated; this function should deal with |
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
87 raw bytes, and coding conversion should be done separately." |
55fd4f77387a
Revision: miles@gnu.org--gnu-2004/emacs--cvs-trunk--0--patch-523
Miles Bader <miles@gnu.org>
parents:
52401
diff
changeset
|
88 (mm-with-unibyte-buffer |
31717 | 89 (insert string) |
32211
5b42e5f7e809
(mm-decode-coding-region, mm-encode-coding-region):
Dave Love <fx@gnu.org>
parents:
32107
diff
changeset
|
90 (quoted-printable-decode-region (point-min) (point-max) coding-system) |
31717 | 91 (buffer-string))) |
92 | |
93 (defun quoted-printable-encode-region (from to &optional fold class) | |
32103 | 94 "Quoted-printable encode the region between FROM and TO per RFC 2045. |
31717 | 95 |
32103 | 96 If FOLD, fold long lines at 76 characters (as required by the RFC). |
35619
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
97 If CLASS is non-nil, translate the characters not matched by that |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
98 regexp class, which is in the form expected by `skip-chars-forward'. |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
99 You should probably avoid non-ASCII characters in this arg. |
31717 | 100 |
32103 | 101 If `mm-use-ultra-safe-encoding' is set, fold lines unconditionally and |
31717 | 102 encode lines starting with \"From\"." |
103 (interactive "r") | |
32103 | 104 (unless class |
34752
f04f551e94ce
* message.el (message-narrow-to-head-1): New function.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
34025
diff
changeset
|
105 ;; Avoid using 8bit characters. = is \075. |
f04f551e94ce
* message.el (message-narrow-to-head-1): New function.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
34025
diff
changeset
|
106 ;; Equivalent to "^\000-\007\013\015-\037\200-\377=" |
f04f551e94ce
* message.el (message-narrow-to-head-1): New function.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
34025
diff
changeset
|
107 (setq class "\010-\012\014\040-\074\076-\177")) |
31717 | 108 (save-excursion |
61644
aff89865e27c
Revision: miles@gnu.org--gnu-2005/emacs--cvs-trunk--0--patch-268
Miles Bader <miles@gnu.org>
parents:
61537
diff
changeset
|
109 (goto-char from) |
aff89865e27c
Revision: miles@gnu.org--gnu-2005/emacs--cvs-trunk--0--patch-268
Miles Bader <miles@gnu.org>
parents:
61537
diff
changeset
|
110 (if (re-search-forward (mm-string-to-multibyte "[^\x0-\x7f\x80-\xff]") |
aff89865e27c
Revision: miles@gnu.org--gnu-2005/emacs--cvs-trunk--0--patch-268
Miles Bader <miles@gnu.org>
parents:
61537
diff
changeset
|
111 to t) |
aff89865e27c
Revision: miles@gnu.org--gnu-2005/emacs--cvs-trunk--0--patch-268
Miles Bader <miles@gnu.org>
parents:
61537
diff
changeset
|
112 (error "Multibyte character in QP encoding region")) |
31717 | 113 (save-restriction |
114 (narrow-to-region from to) | |
35619
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
115 ;; Encode all the non-ascii and control characters. |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
116 (goto-char (point-min)) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
117 (while (and (skip-chars-forward class) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
118 (not (eobp))) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
119 (insert |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
120 (prog1 |
69135
12d289b6e5de
Revision: emacs@sv.gnu.org/emacs--devo--0--patch-118
Miles Bader <miles@gnu.org>
parents:
68633
diff
changeset
|
121 ;; To unibyte in case of Emacs 23 (unicode) eight-bit. |
47944
03cfc305a0fa
(quoted-printable-encode-region): Use mm-insert-byte.
Dave Love <fx@gnu.org>
parents:
43737
diff
changeset
|
122 (format "=%02X" (mm-multibyte-char-to-unibyte (char-after))) |
35619
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
123 (delete-char 1)))) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
124 ;; Encode white space at the end of lines. |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
125 (goto-char (point-min)) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
126 (while (re-search-forward "[ \t]+$" nil t) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
127 (goto-char (match-beginning 0)) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
128 (while (not (eolp)) |
31717 | 129 (insert |
130 (prog1 | |
34752
f04f551e94ce
* message.el (message-narrow-to-head-1): New function.
ShengHuo ZHU <zsh@cs.rochester.edu>
parents:
34025
diff
changeset
|
131 (format "=%02X" (char-after)) |
35931
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
132 (delete-char 1))))) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
133 (let ((mm-use-ultra-safe-encoding |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
134 (and (boundp 'mm-use-ultra-safe-encoding) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
135 mm-use-ultra-safe-encoding))) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
136 (when (or fold mm-use-ultra-safe-encoding) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
137 (let ((tab-width 1)) ; HTAB is one character. |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
138 (goto-char (point-min)) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
139 (while (not (eobp)) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
140 ;; In ultra-safe mode, encode "From " at the beginning |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
141 ;; of a line. |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
142 (when mm-use-ultra-safe-encoding |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
143 (if (looking-at "From ") |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
144 (replace-match "From=20" nil t) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
145 (if (looking-at "-") |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
146 (replace-match "=2D" nil t)))) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
147 (end-of-line) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
148 ;; Fold long lines. |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
149 (while (> (current-column) 76) ; tab-width must be 1. |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
150 (beginning-of-line) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
151 (forward-char 75) ; 75 chars plus an "=" |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
152 (search-backward "=" (- (point) 2) t) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
153 (insert "=\n") |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
154 (end-of-line)) |
ccc41398da84
(quoted-printable-encode-region): Remove redundant code
Dave Love <fx@gnu.org>
parents:
35619
diff
changeset
|
155 (forward-line)))))))) |
31717 | 156 |
157 (defun quoted-printable-encode-string (string) | |
32103 | 158 "Encode the STRING as quoted-printable and return the result." |
35619
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
159 (let ((default-enable-multibyte-characters (mm-multibyte-string-p string))) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
160 (with-temp-buffer |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
161 (insert string) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
162 (quoted-printable-encode-region (point-min) (point-max)) |
a670d2680870
Remove un-logged bogus changes from 2000-12-20.
Dave Love <fx@gnu.org>
parents:
34752
diff
changeset
|
163 (buffer-string)))) |
31717 | 164 |
165 (provide 'qp) | |
166 | |
52401 | 167 ;;; arch-tag: db89e52a-e4a1-4b69-926f-f434f04216ba |
32103 | 168 ;;; qp.el ends here |