Mercurial > emacs
annotate lisp/gnus/mm-util.el @ 40292:b040e198106d
*** empty log message ***
author | Stefan Monnier <monnier@iro.umontreal.ca> |
---|---|
date | Thu, 25 Oct 2001 05:54:03 +0000 |
parents | b7c0bc16b250 |
children | 93f6c74a2f60 |
rev | line source |
---|---|
38413
a26d9b55abb6
Some fixes to follow coding conventions in files from Gnus.
Pavel Janík <Pavel@Janik.cz>
parents:
36557
diff
changeset
|
1 ;;; mm-util.el --- utility functions for MIME things |
35793 | 2 ;; Copyright (C) 1998, 1999, 2000, 2001 Free Software Foundation, Inc. |
31717 | 3 |
4 ;; Author: Lars Magne Ingebrigtsen <larsi@gnus.org> | |
5 ;; MORIOKA Tomohiko <morioka@jaist.ac.jp> | |
6 ;; This file is part of GNU Emacs. | |
7 | |
8 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
9 ;; it under the terms of the GNU General Public License as published by | |
10 ;; the Free Software Foundation; either version 2, or (at your option) | |
11 ;; any later version. | |
12 | |
13 ;; GNU Emacs is distributed in the hope that it will be useful, | |
14 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
15 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
16 ;; GNU General Public License for more details. | |
17 | |
18 ;; You should have received a copy of the GNU General Public License | |
19 ;; along with GNU Emacs; see the file COPYING. If not, write to the | |
20 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
21 ;; Boston, MA 02111-1307, USA. | |
22 | |
23 ;;; Commentary: | |
24 | |
25 ;;; Code: | |
26 | |
32976
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
27 (eval-when-compile (require 'cl)) |
31717 | 28 (require 'mail-prsvr) |
29 | |
(defun mm-coding-system-p (sym)
  "Return non-nil if SYM names a coding system.
The native `coding-system-p' is consulted first when this Emacs
provides it; otherwise SYM is looked up in the list returned by
`mm-get-coding-system-list'."
  (cond
   ;; A clause with only a test returns the test's value when non-nil.
   ((and (fboundp 'coding-system-p) (coding-system-p sym)))
   ((memq sym (mm-get-coding-system-list)))))
36556
8af75e618534
(mm-mime-mule-charset-alist): Move it after definition of
Dave Love <fx@gnu.org>
parents:
36539
diff
changeset
|
34 |
(defvar mm-mime-mule-charset-alist
  `((us-ascii ascii)
    (iso-8859-1 latin-iso8859-1)
    (iso-8859-2 latin-iso8859-2)
    (iso-8859-3 latin-iso8859-3)
    (iso-8859-4 latin-iso8859-4)
    (iso-8859-5 cyrillic-iso8859-5)
    ;; Non-mule (X)Emacs uses the last mule-charset for 8bit characters.
    ;; The fake mule-charset, gnus-koi8-r, tells Gnus that the default
    ;; charset is koi8-r, not iso-8859-5.
    (koi8-r cyrillic-iso8859-5 gnus-koi8-r)
    (iso-8859-6 arabic-iso8859-6)
    (iso-8859-7 greek-iso8859-7)
    (iso-8859-8 hebrew-iso8859-8)
    (iso-8859-9 latin-iso8859-9)
    (iso-8859-14 latin-iso8859-14)
    (iso-8859-15 latin-iso8859-15)
    (viscii vietnamese-viscii-lower)
    (iso-2022-jp latin-jisx0201 japanese-jisx0208 japanese-jisx0208-1978)
    (euc-kr korean-ksc5601)
    (gb2312 chinese-gb2312)
    (big5 chinese-big5-1 chinese-big5-2)
    (tibetan tibetan)
    (thai-tis620 thai-tis620)
    (iso-2022-7bit ethiopic arabic-1-column arabic-2-column)
    (iso-2022-jp-2 latin-iso8859-1 greek-iso8859-7
                   latin-jisx0201 japanese-jisx0208-1978
                   chinese-gb2312 japanese-jisx0208
                   korean-ksc5601 japanese-jisx0212
                   katakana-jisx0201)
    (iso-2022-int-1 latin-iso8859-1 greek-iso8859-7
                    latin-jisx0201 japanese-jisx0208-1978
                    chinese-gb2312 japanese-jisx0208
                    korean-ksc5601 japanese-jisx0212
                    chinese-cns11643-1 chinese-cns11643-2)
    ;; NOTE(review): this key duplicates the previous entry's key, so
    ;; `assq' on `iso-2022-int-1' never reaches this entry; it is only
    ;; visible to reverse (Mule charset -> MIME charset) lookups.  The
    ;; intended MIME name is not evident from this file -- confirm.
    (iso-2022-int-1 latin-iso8859-1 latin-iso8859-2
                    cyrillic-iso8859-5 greek-iso8859-7
                    latin-jisx0201 japanese-jisx0208-1978
                    chinese-gb2312 japanese-jisx0208
                    korean-ksc5601 japanese-jisx0212
                    chinese-cns11643-1 chinese-cns11643-2
                    chinese-cns11643-3 chinese-cns11643-4
                    chinese-cns11643-5 chinese-cns11643-6
                    chinese-cns11643-7)
    ;; utf-8 comes either from Mule-UCS or Mule 5+.
    ;; The charset list is read from `mule-utf-8', so require that
    ;; coding system too before asking for its properties.
    ,@(if (and (mm-coding-system-p 'utf-8)
               (mm-coding-system-p 'mule-utf-8))
          (list (cons 'utf-8
                      ;; `delete' is destructive: work on a copy so the
                      ;; coding system's own `safe-charsets' list is
                      ;; left untouched.
                      (delete 'ascii
                              (copy-sequence
                               (coding-system-get 'mule-utf-8
                                                  'safe-charsets)))))))
  "Alist of MIME-charset/MULE-charsets.
Each element has the form (MIME-CHARSET MULE-CHARSET...).")
86 | |
(eval-and-compile
  ;; For every (FUNCTION . FALLBACK) pair in the table, define
  ;; `mm-FUNCTION' as an alias of FUNCTION when this Emacs provides it,
  ;; and of FALLBACK otherwise.
  (mapcar
   (lambda (pair)
     (let* ((native (car pair))
            (alias (intern (format "mm-%s" native))))
       (defalias alias
         (if (fboundp native)
             native
           (cdr pair)))))
   '((decode-coding-string . (lambda (s a) s))
     (encode-coding-string . (lambda (s a) s))
     (encode-coding-region . ignore)
     (coding-system-list . ignore)
     (decode-coding-region . ignore)
     (char-int . identity)
     (device-type . ignore)
     (coding-system-equal . equal)
     (annotationp . ignore)
     (set-buffer-file-coding-system . ignore)
     (make-char
      . (lambda (charset int)
          (int-to-char int)))
     (read-coding-system
      . (lambda (prompt)
          "Prompt the user for a coding system."
          (completing-read
           prompt (mapcar (lambda (s) (list (symbol-name (car s))))
                          mm-mime-mule-charset-alist))))
     (read-charset
      . (lambda (prompt)
          "Return a charset."
          (intern
           (completing-read
            prompt
            (mapcar (lambda (e) (list (symbol-name (car e))))
                    mm-mime-mule-charset-alist)
            nil t))))
     (string-as-unibyte . identity)
     (multibyte-string-p . ignore)
     )))
125 | |
(eval-and-compile
  ;; Alias to the first character predicate this Emacs provides,
  ;; falling back to `identity' when neither is available.
  (defalias 'mm-char-or-char-int-p
    (if (fboundp 'char-or-char-int-p)
        'char-or-char-int-p
      (if (fboundp 'char-valid-p)
          'char-valid-p
        'identity))))
132 | |
(defvar mm-coding-system-list nil
  "Cached result of `mm-coding-system-list', or nil if not yet computed.")

(defun mm-get-coding-system-list ()
  "Return the list of coding systems, computing and caching it on first use."
  (if mm-coding-system-list
      mm-coding-system-list
    (setq mm-coding-system-list (mm-coding-system-list))))
138 | |
(defvar mm-charset-synonym-alist
  `((big5 . cn-big5)
    (gb2312 . cn-gb-2312)
    ;; Windows-1252 is actually a superset of Latin-1.  See also
    ;; `gnus-article-dumbquotes-map'.
    ;; The conditional entries are spliced with `,@' so that nothing at
    ;; all (rather than a bare nil element) is added when the coding
    ;; system already exists.
    ,@(unless (mm-coding-system-p 'windows-1252) ; should be defined eventually
        '((windows-1252 . iso-8859-1)))
    ;; Windows-1250 is a variant of Latin-2 heavily used by Microsoft
    ;; Outlook users in Czech republic.  Use this to allow reading of their
    ;; e-mails.  cp1250 should be defined by M-x codepage-setup.
    ,@(unless (mm-coding-system-p 'windows-1250) ; should be defined eventually
        '((windows-1250 . cp1250)))
    (x-ctext . ctext))
  "A mapping from invalid charset names to the real charset names.
Each element has the form (SYNONYM . REAL-NAME).")
153 | |
(defvar mm-binary-coding-system
  ;; Prefer `binary', then `no-conversion'; nil when neither exists.
  (or (and (mm-coding-system-p 'binary) 'binary)
      (and (mm-coding-system-p 'no-conversion) 'no-conversion))
  "100% binary coding system.")
160 | |
(defvar mm-text-coding-system
  ;; Pick the raw-text variant for this platform; if it is not a known
  ;; coding system, fall back to `mm-binary-coding-system'.
  (let ((candidate (if (memq system-type '(windows-nt ms-dos ms-windows))
                       'raw-text-dos
                     'raw-text)))
    (if (mm-coding-system-p candidate)
        candidate
      mm-binary-coding-system))
  "Text-safe coding system (For removing ^M).")

(defvar mm-text-coding-system-for-write nil
  "Text coding system for write.")
170 | |
(defvar mm-auto-save-coding-system
  (if (mm-coding-system-p 'emacs-mule)
      (cond
       ;; Non-DOS platforms use `emacs-mule' directly.
       ((not (memq system-type '(windows-nt ms-dos ms-windows)))
        'emacs-mule)
       ;; DOS-like platforms want the -dos variant when it exists.
       ((mm-coding-system-p 'emacs-mule-dos)
        'emacs-mule-dos)
       (t mm-binary-coding-system))
    (if (mm-coding-system-p 'escape-quoted)
        'escape-quoted
      mm-binary-coding-system))
  "Coding system of auto save file.")
181 | |
182 ;;; Internal variables: | |
183 | |
184 ;;; Functions: | |
185 | |
(defun mm-mule-charset-to-mime-charset (charset)
  "Return the MIME charset corresponding to the given Mule CHARSET.
The answer is the key of the first `mm-mime-mule-charset-alist'
entry that lists CHARSET, or nil when no entry does."
  (let ((rest mm-mime-mule-charset-alist)
        entry found)
    ;; Stop at the first entry whose Mule charset list contains CHARSET.
    (while (and rest (not found))
      (setq entry (car rest)
            rest (cdr rest))
      (if (memq charset (cdr entry))
          (setq found entry)))
    (car found)))
196 | |
(defun mm-charset-to-coding-system (charset &optional lbt)
  "Return the coding system corresponding to CHARSET.
CHARSET is a symbol (or a string, which is downcased and interned)
naming a MIME charset.  Synonyms listed in
`mm-charset-synonym-alist' are resolved first.
If optional argument LBT (`unix', `dos' or `mac') is specified, it is
appended to the name as the line break code type of the coding system.
Return nil if the resulting name is not a known coding system."
  (let* ((name (if (stringp charset)
                   (intern (downcase charset))
                 charset))
         (real (or (cdr (assq name mm-charset-synonym-alist))
                   name))
         (cs (if lbt
                 (intern (format "%s-%s" real lbt))
               real)))
    (cond
     ;; Running in a non-MULE environment.
     ((null (mm-get-coding-system-list))
      cs)
     ;; ascii
     ((eq cs 'us-ascii)
      'ascii)
     ;; Check to see whether we can handle this charset.  (This depends
     ;; on there being some coding system matching each `mime-charset'
     ;; coding system property defined, as there should be.)
     ((memq cs (mm-get-coding-system-list))
      cs))))
224 | |
(if (fboundp 'subst-char-in-string)
    (defsubst mm-replace-chars-in-string (string from to)
      "Return a copy of STRING with each character FROM replaced by TO."
      (subst-char-in-string from to string))
  (defun mm-replace-chars-in-string (string from to)
    "Return a copy of STRING with each character FROM replaced by TO."
    (let* ((copy (substring string 0))  ; never touch the caller's string
           (i (length copy)))
      ;; Walk the copy from the end, patching matches in place.
      (while (> i 0)
        (setq i (1- i))
        (if (= (aref copy i) from)
            (aset copy i to)))
      copy)))
239 | |
(defsubst mm-enable-multibyte ()
  "Make the current buffer multibyte.
This happens only when `set-buffer-multibyte' is available and the
default value of `enable-multibyte-characters' is non-nil; otherwise
nothing is done and nil is returned.  This is a no-op in XEmacs."
  (and (fboundp 'set-buffer-multibyte)
       (boundp 'enable-multibyte-characters)
       (default-value 'enable-multibyte-characters)
       (set-buffer-multibyte t)))
248 | |
(defsubst mm-disable-multibyte ()
  "Make the current buffer unibyte.
Nothing is done when `set-buffer-multibyte' is not available.
This is a no-op in XEmacs."
  (and (fboundp 'set-buffer-multibyte)
       (set-buffer-multibyte nil)))
254 | |
32976
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
(defsubst mm-enable-multibyte-mule4 ()
  "Enable multibyte in the current buffer.
Only used in Emacs Mule 4: nothing is done when the
`eight-bit-control' charset exists, when `set-buffer-multibyte' is
unavailable, or when the default value of
`enable-multibyte-characters' is nil."
  (and (fboundp 'set-buffer-multibyte)
       (boundp 'enable-multibyte-characters)
       (default-value 'enable-multibyte-characters)
       (not (charsetp 'eight-bit-control))
       (set-buffer-multibyte t)))
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
263 |
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
(defsubst mm-disable-multibyte-mule4 ()
  "Disable multibyte in the current buffer.
Only used in Emacs Mule 4: nothing is done when the
`eight-bit-control' charset exists or when `set-buffer-multibyte'
is unavailable."
  (and (fboundp 'set-buffer-multibyte)
       (not (charsetp 'eight-bit-control))
       (set-buffer-multibyte nil)))
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
270 |
(defun mm-preferred-coding-system (charset)
  "Return the preferred coding system property of Mule CHARSET.
Both the misspelled `prefered-coding-system' property (a typo in
some Emacs versions) and the correct `preferred-coding-system'
property are consulted, in that order."
  (let ((cs (get-charset-property charset 'prefered-coding-system)))
    (if cs
        cs
      (get-charset-property charset 'preferred-coding-system))))
275 | |
(defun mm-charset-after (&optional pos)
  "Return charset of a character in current buffer at position POS.
If POS is nil, it defaults to the current point.
If POS is out of range, the value is nil.
If the charset is `composition', return the actual one."
  (let ((char (char-after pos)) charset)
    ;; `char-after' returns nil when POS is out of range; return nil
    ;; right away instead of handing nil to the numeric comparison below.
    (when char
      (if (< (mm-char-int char) 128)
          (setq charset 'ascii)
        ;; charset-after is fake in some Emacsen.
        (setq charset (and (fboundp 'char-charset) (char-charset char)))
        (if (eq charset 'composition)
            (let ((p (or pos (point))))
              (cadr (find-charset-region p (1+ p))))
          (if (and charset (not (memq charset '(ascii eight-bit-control
                                                      eight-bit-graphic))))
              charset
            ;; No usable charset for this 8-bit character: fall back to
            ;; a guess, which is cached in `mail-parse-mule-charset'.
            (or
             mail-parse-mule-charset    ;; cached mule-charset
             (progn
               ;; First guess: last charset of the language environment.
               (setq mail-parse-mule-charset
                     (and (boundp 'current-language-environment)
                          (car (last
                                (assq 'charset
                                      (assoc current-language-environment
                                             language-info-alist))))))
               ;; Second guess: last Mule charset of `mail-parse-charset'.
               (if (or (not mail-parse-mule-charset)
                       (eq mail-parse-mule-charset 'ascii))
                   (setq mail-parse-mule-charset
                         (or (car (last (assq mail-parse-charset
                                              mm-mime-mule-charset-alist)))
                             ;; Fixme: don't fix that!
                             'latin-iso8859-1)))
               mail-parse-mule-charset))))))))
31717 | 309 |
(defun mm-mime-charset (charset)
  "Return the MIME charset corresponding to the given Mule CHARSET.
When coding-system and charset properties are available, the
`mime-charset' property of CHARSET's preferred coding system is
tried first and `ascii' maps to `us-ascii'; otherwise, or when
those give nothing, `mm-mule-charset-to-mime-charset' decides."
  (or
   ;; This exists in Emacs 20.
   (and (fboundp 'coding-system-get)
        (fboundp 'get-charset-property)
        (or (and (mm-preferred-coding-system charset)
                 (coding-system-get
                  (mm-preferred-coding-system charset) 'mime-charset))
            (and (eq charset 'ascii)
                 'us-ascii)))
   ;; Table lookup: the only route in XEmacs, the last resort elsewhere.
   (mm-mule-charset-to-mime-charset charset)))
323 | |
(defun mm-delete-duplicates (list)
  "Simple substitute for CL `delete-duplicates', testing with `equal'.
The first occurrence of each element is kept, in original order.
LIST may be destructively modified."
  (let (uniq item)
    (while list
      ;; Take the head, then strip every `equal' copy of it (the head
      ;; included) from what remains to be scanned.
      (setq item (car list)
            list (delete item list))
      (push item uniq))
    (nreverse uniq)))
332 | |
(defun mm-find-mime-charset-region (b e)
  "Return the MIME charsets needed to encode the region between B and E.
When more than one charset would be needed and the region can be
encoded as UTF-8, the result is (utf-8)."
  (let* ((mule (delq 'ascii (mm-find-charset-region b e)))
         (mime (mapcar 'mm-mime-charset mule)))
    ;; iso-2022-jp-2 makes a separate iso-2022-jp entry redundant.
    (if (memq 'iso-2022-jp-2 mime)
        (setq mime (delq 'iso-2022-jp mime)))
    (setq mime (mm-delete-duplicates mime))
    (cond
     ((and (cdr mime)                   ; more than one charset left
           (fboundp 'find-coding-systems-region)
           (let ((cs (find-coding-systems-region b e)))
             (or (memq 'utf-8 cs) (memq 'mule-utf-8 cs))))
      '(utf-8))
     (t mime))))
347 | |
(defsubst mm-multibyte-p ()
  "Say whether multibyte is enabled.
In XEmacs, or when `enable-multibyte-characters' is unbound, this
is whether the `mule' feature is present; otherwise it is the
value of `enable-multibyte-characters'."
  (cond
   ((featurep 'xemacs) (featurep 'mule))
   ((boundp 'enable-multibyte-characters) enable-multibyte-characters)
   (t (featurep 'mule))))
31717 | 354 |
(defmacro mm-with-unibyte-buffer (&rest forms)
  "Create a temporary buffer, and evaluate FORMS there like `progn'.
`default-enable-multibyte-characters' is bound to nil around the
creation of the buffer, so that unibyte mode is used for it."
  (list 'let '(default-enable-multibyte-characters)
        (cons 'with-temp-buffer forms)))
(put 'mm-with-unibyte-buffer 'lisp-indent-function 0)
(put 'mm-with-unibyte-buffer 'edebug-form-spec '(body))
362 | |
(defmacro mm-with-unibyte-current-buffer (&rest forms)
  "Evaluate FORMS with the current buffer temporarily made unibyte.
Also bind `default-enable-multibyte-characters' to nil.
The previous multibyte setting is restored afterwards, even on
non-local exit.  Equivalent to `progn' in XEmacs."
  (let ((saved (make-symbol "multibyte")))
    `(if (not (fboundp 'set-buffer-multibyte))
         (progn
           ,@forms)
       ;; Remember the buffer's setting so it can be put back on exit.
       (let ((,saved enable-multibyte-characters))
         (unwind-protect
             (let ((default-enable-multibyte-characters nil))
               (set-buffer-multibyte nil)
               ,@forms)
           (set-buffer-multibyte ,saved))))))
(put 'mm-with-unibyte-current-buffer 'lisp-indent-function 0)
(put 'mm-with-unibyte-current-buffer 'edebug-form-spec '(body))
379 | |
32976
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
(defmacro mm-with-unibyte-current-buffer-mule4 (&rest forms)
  "Evaluate FORMS like `progn' with the current buffer made unibyte.
Mule4 only: in XEmacs, when `set-buffer-multibyte' is unavailable,
or when the `eight-bit-control' charset exists, FORMS are simply
evaluated as by `progn'.  Otherwise the buffer and the default value
of `enable-multibyte-characters' are made unibyte, the coding system
variables are bound to `mm-binary-coding-system' while FORMS run, and
both multibyte settings are then reset to the saved default value."
  (let ((saved (make-symbol "multibyte")))
    `(if (not (or (featurep 'xemacs)
                  (not (fboundp 'set-buffer-multibyte))
                  (charsetp 'eight-bit-control))) ;; For Emacs Mule 4 only.
         ;; What is saved here is the default value, not the buffer's own.
         (let ((,saved (default-value 'enable-multibyte-characters)))
           (unwind-protect
               (let ((buffer-file-coding-system mm-binary-coding-system)
                     (coding-system-for-read mm-binary-coding-system)
                     (coding-system-for-write mm-binary-coding-system))
                 (set-buffer-multibyte nil)
                 (setq-default enable-multibyte-characters nil)
                 ,@forms)
             (setq-default enable-multibyte-characters ,saved)
             (set-buffer-multibyte ,saved)))
       ,@forms)))
(put 'mm-with-unibyte-current-buffer-mule4 'lisp-indent-function 0)
(put 'mm-with-unibyte-current-buffer-mule4 'edebug-form-spec '(body))
aa9dc4e7c5ac
2000-10-27 ShengHuo ZHU <zsh@cs.rochester.edu>
Dave Love <fx@gnu.org>
parents:
32414
diff
changeset
|
401 |
(defmacro mm-with-unibyte (&rest forms)
  "Eval the FORMS with `default-enable-multibyte-characters' bound to nil."
  (cons 'let
        (cons '(default-enable-multibyte-characters)
              forms)))
(put 'mm-with-unibyte 'lisp-indent-function 0)
(put 'mm-with-unibyte 'edebug-form-spec '(body))
408 | |
(defun mm-find-charset-region (b e)
  "Return a list of Emacs charsets in the region B to E.
In a unibyte buffer (or XEmacs without Mule) the result is (ascii)
for pure 7-bit text, and otherwise `ascii' plus one guessed charset."
  (if (and (mm-multibyte-p)
           (fboundp 'find-charset-region))
      ;; Remove composition since the base charsets have been included.
      (delq 'composition (find-charset-region b e))
    ;; We are in a unibyte buffer or XEmacs non-mule, so we futz around a bit.
    (save-excursion
      (save-restriction
        (narrow-to-region b e)
        (goto-char (point-min))
        (skip-chars-forward "\0-\177")
        (if (eobp)
            '(ascii)
          ;; There is 8-bit text: guess its charset from the language
          ;; environment, then from `mail-parse-charset', then Latin-1.
          (let ((guess (and (boundp 'current-language-environment)
                            (car (last (assq 'charset
                                             (assoc current-language-environment
                                                    language-info-alist)))))))
            (when (or (null guess) (eq guess 'ascii))
              (setq guess
                    (car (last (assq mail-parse-charset
                                     mm-mime-mule-charset-alist)))))
            (list 'ascii (or guess 'latin-iso8859-1))))))))
31717 | 437 |
(if (fboundp 'shell-quote-argument)
    (defalias 'mm-quote-arg 'shell-quote-argument)
  (defun mm-quote-arg (arg)
    "Return a version of ARG that is safe to evaluate in a shell.
Each shell-special character is preceded by a backslash; ARG itself
is returned when it contains none."
    (let ((start 0) pieces hit)
      ;; *** bug: we don't handle newline characters properly
      (while (setq hit (string-match "[]*[;!'`\"$\\& \t{} |()<>]" arg start))
        ;; PIECES is built in reverse: text before the match, a
        ;; backslash, then the matched character itself.
        (setq pieces (cons (list (aref arg hit))
                           (cons "\\"
                                 (cons (substring arg start hit)
                                       pieces)))
              start (1+ hit)))
      (if (= start 0)
          arg
        (apply 'concat
               (nconc (nreverse pieces)
                      (list (substring arg start))))))))
452 | |
(defun mm-auto-mode-alist ()
  "Return an `auto-mode-alist' with only the .gz (etc) thingies.
Those are the entries whose cdr is a list rather than a bare mode
symbol; their relative order is preserved."
  (let (kept)
    (dolist (entry auto-mode-alist)
      (if (listp (cdr entry))
          (setq kept (cons entry kept))))
    (nreverse kept)))
462 | |
(defvar mm-inhibit-file-name-handlers
  (list 'jka-compr-handler 'image-file-handler)
  "A list of handlers doing (un)compression (etc) thingies.
The mm file functions in this file disable these handlers when
called with a non-nil INHIBIT argument.")
466 | |
(defun mm-insert-file-contents (filename &optional visit beg end replace
                                         inhibit)
  "Like `insert-file-contents', q.v., but only reads in the file.
A buffer may be modified in several ways after reading into the buffer due
to advanced Emacs features, such as file-name-handlers, format decoding,
find-file-hooks, etc.
This function ensures that none of these modifications will take place.
If INHIBIT is non-nil, the handlers in `mm-inhibit-file-name-handlers'
are inhibited as well."
  (let ((format-alist nil)
        (after-insert-file-functions nil)
        (find-file-hooks nil)
        (enable-local-variables nil)
        (enable-local-eval nil)
        (default-major-mode 'fundamental-mode)
        ;; Keep only the (un)compression entries, and none when inhibiting.
        (auto-mode-alist (and (not inhibit) (mm-auto-mode-alist)))
        (inhibit-file-name-operation (if inhibit
                                         'insert-file-contents
                                       inhibit-file-name-operation))
        ;; With INHIBIT nil this is the current handler list itself.
        (inhibit-file-name-handlers
         (append (and inhibit mm-inhibit-file-name-handlers)
                 inhibit-file-name-handlers)))
    (insert-file-contents filename visit beg end replace)))
491 | |
(defun mm-append-to-file (start end filename &optional codesys inhibit)
  "Append the contents of the region to the end of file FILENAME.
START and END are buffer positions saying what text to write.
Optional fourth argument CODESYS specifies the coding system to use
when encoding the file; it defaults to
`mm-text-coding-system-for-write', then `mm-text-coding-system'.
If INHIBIT is non-nil, the handlers in `mm-inhibit-file-name-handlers'
are inhibited."
  (let ((coding-system-for-write
         (cond (codesys)
               (mm-text-coding-system-for-write)
               (t mm-text-coding-system)))
        (inhibit-file-name-operation (if inhibit
                                         'append-to-file
                                       inhibit-file-name-operation))
        ;; With INHIBIT nil this is the current handler list itself.
        (inhibit-file-name-handlers
         (append (and inhibit mm-inhibit-file-name-handlers)
                 inhibit-file-name-handlers)))
    (append-to-file start end filename)))
512 | |
(defun mm-write-region (start end filename &optional append visit lockname
                              coding-system inhibit)
  "Like `write-region'.
The text is encoded with CODING-SYSTEM, defaulting to
`mm-text-coding-system-for-write', then `mm-text-coding-system'.
If INHIBIT is non-nil, the handlers in `mm-inhibit-file-name-handlers'
are inhibited."
  (let ((coding-system-for-write
         (cond (coding-system)
               (mm-text-coding-system-for-write)
               (t mm-text-coding-system)))
        (inhibit-file-name-operation (if inhibit
                                         'write-region
                                       inhibit-file-name-operation))
        ;; With INHIBIT nil this is the current handler list itself.
        (inhibit-file-name-handlers
         (append (and inhibit mm-inhibit-file-name-handlers)
                 inhibit-file-name-handlers)))
    (write-region start end filename append visit lockname)))
530 | |
531 (provide 'mm-util) | |
532 | |
533 ;;; mm-util.el ends here |