Mercurial > emacs
annotate lisp/url/url-util.el @ 105916:1f553b32ab4f
* compilation.txt: Add one more error message for msft (Bug#4100).
author | Chong Yidong <cyd@stupidchicken.com> |
---|---|
date | Sun, 08 Nov 2009 16:30:52 +0000 |
parents | 328150f0cf76 |
children | 1d1d5d9bd884 |
rev | line source |
---|---|
54695 | 1 ;;; url-util.el --- Miscellaneous helper routines for URL library |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
2 |
101912
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
3 ;; Copyright (C) 1996, 1997, 1998, 1999, 2001, 2004, 2005, 2006, 2007, |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
4 ;; 2008, 2009 Free Software Foundation, Inc. |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
5 |
54695 | 6 ;; Author: Bill Perry <wmperry@gnu.org> |
7 ;; Keywords: comm, data, processes | |
8 | |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
9 ;; This file is part of GNU Emacs. |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
10 ;; |
94668
8259d0d8e107
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
92401
diff
changeset
|
11 ;; GNU Emacs is free software: you can redistribute it and/or modify |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
12 ;; it under the terms of the GNU General Public License as published by |
94668
8259d0d8e107
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
92401
diff
changeset
|
13 ;; the Free Software Foundation, either version 3 of the License, or |
8259d0d8e107
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
92401
diff
changeset
|
14 ;; (at your option) any later version. |
8259d0d8e107
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
92401
diff
changeset
|
15 |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
16 ;; GNU Emacs is distributed in the hope that it will be useful, |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
17 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
18 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
19 ;; GNU General Public License for more details. |
94668
8259d0d8e107
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
92401
diff
changeset
|
20 |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
21 ;; You should have received a copy of the GNU General Public License |
94668
8259d0d8e107
Switch to recommended form of GPLv3 permissions notice.
Glenn Morris <rgm@gnu.org>
parents:
92401
diff
changeset
|
22 ;; along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
23 |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
24 ;;; Commentary: |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
25 |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
26 ;;; Code: |
54695 | 27 |
28 (require 'url-parse) | |
92401
b7d3823f3c26
Require cl when compiling.
Andreas Schwab <schwab@suse.de>
parents:
92305
diff
changeset
|
29 (eval-when-compile (require 'cl)) |
54695 | 30 (autoload 'timezone-parse-date "timezone") |
31 (autoload 'timezone-make-date-arpa-standard "timezone") | |
54803
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
32 (autoload 'mail-header-extract "mailheader") |
54695 | 33 |
34 (defvar url-parse-args-syntax-table | |
35 (copy-syntax-table emacs-lisp-mode-syntax-table) | |
36 "A syntax table for parsing sgml attributes.") | |
37 | |
38 (modify-syntax-entry ?' "\"" url-parse-args-syntax-table) | |
39 (modify-syntax-entry ?` "\"" url-parse-args-syntax-table) | |
40 (modify-syntax-entry ?{ "(" url-parse-args-syntax-table) | |
41 (modify-syntax-entry ?} ")" url-parse-args-syntax-table) | |
42 | |
43 ;;;###autoload | |
44 (defcustom url-debug nil | |
45 "*What types of debug messages from the URL library to show. | |
46 Debug messages are logged to the *URL-DEBUG* buffer. | |
47 | |
48 If t, all messages will be logged. | |
49 If a number, all messages will be logged, as well shown via `message'. | |
50 If a list, it is a list of the types of messages to be logged." | |
51 :type '(choice (const :tag "none" nil) | |
52 (const :tag "all" t) | |
53 (checklist :tag "custom" | |
54 (const :tag "HTTP" :value http) | |
55 (const :tag "DAV" :value dav) | |
56 (const :tag "General" :value retrieval) | |
57 (const :tag "Filename handlers" :value handlers) | |
58 (symbol :tag "Other"))) | |
59 :group 'url-hairy) | |
60 | |
61 ;;;###autoload | |
62 (defun url-debug (tag &rest args) | |
63 (if quit-flag | |
64 (error "Interrupted!")) | |
65 (if (or (eq url-debug t) | |
66 (numberp url-debug) | |
67 (and (listp url-debug) (memq tag url-debug))) | |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
68 (with-current-buffer (get-buffer-create "*URL-DEBUG*") |
54695 | 69 (goto-char (point-max)) |
70 (insert (symbol-name tag) " -> " (apply 'format args) "\n") | |
71 (if (numberp url-debug) | |
72 (apply 'message args))))) | |
73 | |
74 ;;;###autoload | |
75 (defun url-parse-args (str &optional nodowncase) | |
76 ;; Return an assoc list of attribute/value pairs from an RFC822-type string | |
77 (let ( | |
78 name ; From name= | |
79 value ; its value | |
80 results ; Assoc list of results | |
81 name-pos ; Start of XXXX= position | |
82 val-pos ; Start of value position | |
83 st | |
84 nd | |
85 ) | |
86 (save-excursion | |
87 (save-restriction | |
88 (set-buffer (get-buffer-create " *urlparse-temp*")) | |
89 (set-syntax-table url-parse-args-syntax-table) | |
90 (erase-buffer) | |
91 (insert str) | |
92 (setq st (point-min) | |
93 nd (point-max)) | |
94 (set-syntax-table url-parse-args-syntax-table) | |
95 (narrow-to-region st nd) | |
96 (goto-char (point-min)) | |
97 (while (not (eobp)) | |
98 (skip-chars-forward "; \n\t") | |
99 (setq name-pos (point)) | |
100 (skip-chars-forward "^ \n\t=;") | |
101 (if (not nodowncase) | |
102 (downcase-region name-pos (point))) | |
103 (setq name (buffer-substring name-pos (point))) | |
104 (skip-chars-forward " \t\n") | |
105 (if (/= (or (char-after (point)) 0) ?=) ; There is no value | |
106 (setq value nil) | |
107 (skip-chars-forward " \t\n=") | |
108 (setq val-pos (point) | |
109 value | |
110 (cond | |
111 ((or (= (or (char-after val-pos) 0) ?\") | |
112 (= (or (char-after val-pos) 0) ?')) | |
113 (buffer-substring (1+ val-pos) | |
114 (condition-case () | |
115 (prog2 | |
116 (forward-sexp 1) | |
117 (1- (point)) | |
118 (skip-chars-forward "\"")) | |
119 (error | |
120 (skip-chars-forward "^ \t\n") | |
121 (point))))) | |
122 (t | |
123 (buffer-substring val-pos | |
124 (progn | |
125 (skip-chars-forward "^;") | |
126 (skip-chars-backward " \t") | |
127 (point))))))) | |
128 (setq results (cons (cons name value) results)) | |
129 (skip-chars-forward "; \n\t")) | |
130 results)))) | |
131 | |
132 ;;;###autoload | |
133 (defun url-insert-entities-in-string (string) | |
134 "Convert HTML markup-start characters to entity references in STRING. | |
135 Also replaces the \" character, so that the result may be safely used as | |
136 an attribute value in a tag. Returns a new string with the result of the | |
137 conversion. Replaces these characters as follows: | |
138 & ==> & | |
139 < ==> < | |
140 > ==> > | |
141 \" ==> "" | |
142 (if (string-match "[&<>\"]" string) | |
105829
328150f0cf76
* url-util.el (url-insert-entities-in-string):
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
101912
diff
changeset
|
143 (with-current-buffer (get-buffer-create " *entity*") |
54695 | 144 (erase-buffer) |
145 (buffer-disable-undo (current-buffer)) | |
146 (insert string) | |
147 (goto-char (point-min)) | |
148 (while (progn | |
149 (skip-chars-forward "^&<>\"") | |
150 (not (eobp))) | |
151 (insert (cdr (assq (char-after (point)) | |
152 '((?\" . """) | |
153 (?& . "&") | |
154 (?< . "<") | |
155 (?> . ">"))))) | |
156 (delete-char 1)) | |
157 (buffer-string)) | |
158 string)) | |
159 | |
160 ;;;###autoload | |
161 (defun url-normalize-url (url) | |
162 "Return a 'normalized' version of URL. | |
163 Strips out default port numbers, etc." | |
72218
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
164 (let (type data retval) |
54695 | 165 (setq data (url-generic-parse-url url) |
166 type (url-type data)) | |
167 (if (member type '("www" "about" "mailto" "info")) | |
168 (setq retval url) | |
98338 | 169 ;; FIXME all this does, and all this function seems to do in |
170 ;; most cases, is remove any trailing "#anchor" part of a url. | |
83823
dd2bcc6758a0
* url-parse.el (url): Use defstruct rather than macros. Update all callers.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
78222
diff
changeset
|
171 (setf (url-target data) nil) |
54695 | 172 (setq retval (url-recreate-url data))) |
173 retval)) | |
174 | |
175 ;;;###autoload | |
176 (defun url-lazy-message (&rest args) | |
177 "Just like `message', but is a no-op if called more than once a second. | |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
178 Will not do anything if `url-show-status' is nil." |
54695 | 179 (if (or (null url-show-status) |
180 (active-minibuffer-window) | |
181 (= url-lazy-message-time | |
182 (setq url-lazy-message-time (nth 1 (current-time))))) | |
183 nil | |
184 (apply 'message args))) | |
185 | |
186 ;;;###autoload | |
187 (defun url-get-normalized-date (&optional specified-time) | |
92305
76175fc0a2f9
(url-get-normalized-date): Simplify
Teodor Zlatanov <tzz@lifelogs.com>
parents:
87649
diff
changeset
|
188 "Return a 'real' date string that most HTTP servers can understand." |
76175fc0a2f9
(url-get-normalized-date): Simplify
Teodor Zlatanov <tzz@lifelogs.com>
parents:
87649
diff
changeset
|
189 (let ((system-time-locale "C")) |
76175fc0a2f9
(url-get-normalized-date): Simplify
Teodor Zlatanov <tzz@lifelogs.com>
parents:
87649
diff
changeset
|
190 (format-time-string "%a, %d %b %Y %T GMT" |
76175fc0a2f9
(url-get-normalized-date): Simplify
Teodor Zlatanov <tzz@lifelogs.com>
parents:
87649
diff
changeset
|
191 (or specified-time (current-time)) t))) |
54695 | 192 |
193 ;;;###autoload | |
194 (defun url-eat-trailing-space (x) | |
195 "Remove spaces/tabs at the end of a string." | |
196 (let ((y (1- (length x))) | |
197 (skip-chars (list ? ?\t ?\n))) | |
198 (while (and (>= y 0) (memq (aref x y) skip-chars)) | |
199 (setq y (1- y))) | |
200 (substring x 0 (1+ y)))) | |
201 | |
202 ;;;###autoload | |
203 (defun url-strip-leading-spaces (x) | |
204 "Remove spaces at the front of a string." | |
205 (let ((y (1- (length x))) | |
206 (z 0) | |
207 (skip-chars (list ? ?\t ?\n))) | |
208 (while (and (<= z y) (memq (aref x z) skip-chars)) | |
209 (setq z (1+ z))) | |
210 (substring x z nil))) | |
211 | |
212 ;;;###autoload | |
213 (defun url-pretty-length (n) | |
214 (cond | |
215 ((< n 1024) | |
216 (format "%d bytes" n)) | |
217 ((< n (* 1024 1024)) | |
218 (format "%dk" (/ n 1024.0))) | |
219 (t | |
220 (format "%2.2fM" (/ n (* 1024 1024.0)))))) | |
221 | |
222 ;;;###autoload | |
223 (defun url-display-percentage (fmt perc &rest args) | |
74135
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
224 (when url-show-status |
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
225 (if (null fmt) |
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
226 (if (fboundp 'clear-progress-display) |
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
227 (clear-progress-display)) |
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
228 (if (and (fboundp 'progress-display) perc) |
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
229 (apply 'progress-display fmt perc args) |
e125bce98ce9
(url-display-percentage): Only show a message if `url-show-status' is non-nil.
Magnus Henoch <mange@freemail.hu>
parents:
72218
diff
changeset
|
230 (apply 'message fmt args))))) |
54695 | 231 |
232 ;;;###autoload | |
233 (defun url-percentage (x y) | |
234 (if (fboundp 'float) | |
235 (round (* 100 (/ x (float y)))) | |
236 (/ (* x 100) y))) | |
237 | |
238 ;;;###autoload | |
99385
7b5dc2894014
(url-basepath): Add url-basepath as an alias for url-file-directory.
Chong Yidong <cyd@stupidchicken.com>
parents:
98338
diff
changeset
|
239 (defalias 'url-basepath 'url-file-directory) |
7b5dc2894014
(url-basepath): Add url-basepath as an alias for url-file-directory.
Chong Yidong <cyd@stupidchicken.com>
parents:
98338
diff
changeset
|
240 |
7b5dc2894014
(url-basepath): Add url-basepath as an alias for url-file-directory.
Chong Yidong <cyd@stupidchicken.com>
parents:
98338
diff
changeset
|
241 ;;;###autoload |
79064
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
242 (defun url-file-directory (file) |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
243 "Return the directory part of FILE, for a URL." |
54695 | 244 (cond |
245 ((null file) "") | |
246 ((string-match (eval-when-compile (regexp-quote "?")) file) | |
79064
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
247 (file-name-directory (substring file 0 (match-beginning 0)))) |
54695 | 248 (t (file-name-directory file)))) |
249 | |
250 ;;;###autoload | |
79064
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
251 (defun url-file-nondirectory (file) |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
252 "Return the nondirectory part of FILE, for a URL." |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
253 (cond |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
254 ((null file) "") |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
255 ((string-match (eval-when-compile (regexp-quote "?")) file) |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
256 (file-name-nondirectory (substring file 0 (match-beginning 0)))) |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
257 (t (file-name-nondirectory file)))) |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
258 |
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
259 ;;;###autoload |
65312
915d671fef52
*** empty log message ***
Chong Yidong <cyd@stupidchicken.com>
parents:
64748
diff
changeset
|
260 (defun url-parse-query-string (query &optional downcase allow-newlines) |
54695 | 261 (let (retval pairs cur key val) |
262 (setq pairs (split-string query "&")) | |
263 (while pairs | |
264 (setq cur (car pairs) | |
265 pairs (cdr pairs)) | |
266 (if (not (string-match "=" cur)) | |
267 nil ; Grace | |
65312
915d671fef52
*** empty log message ***
Chong Yidong <cyd@stupidchicken.com>
parents:
64748
diff
changeset
|
268 (setq key (url-unhex-string (substring cur 0 (match-beginning 0)) |
915d671fef52
*** empty log message ***
Chong Yidong <cyd@stupidchicken.com>
parents:
64748
diff
changeset
|
269 allow-newlines)) |
915d671fef52
*** empty log message ***
Chong Yidong <cyd@stupidchicken.com>
parents:
64748
diff
changeset
|
270 (setq val (url-unhex-string (substring cur (match-end 0) nil) |
915d671fef52
*** empty log message ***
Chong Yidong <cyd@stupidchicken.com>
parents:
64748
diff
changeset
|
271 allow-newlines)) |
54695 | 272 (if downcase |
273 (setq key (downcase key))) | |
274 (setq cur (assoc key retval)) | |
275 (if cur | |
276 (setcdr cur (cons val (cdr cur))) | |
277 (setq retval (cons (list key val) retval))))) | |
278 retval)) | |
279 | |
280 (defun url-unhex (x) | |
281 (if (> x ?9) | |
282 (if (>= x ?a) | |
283 (+ 10 (- x ?a)) | |
284 (+ 10 (- x ?A))) | |
285 (- x ?0))) | |
286 | |
54803
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
287 ;; Fixme: Is this definition better, and does it ever matter? |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
288 |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
289 ;; (defun url-unhex-string (str &optional allow-newlines) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
290 ;; "Remove %XX, embedded spaces, etc in a url. |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
291 ;; If optional second argument ALLOW-NEWLINES is non-nil, then allow the |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
292 ;; decoding of carriage returns and line feeds in the string, which is normally |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
293 ;; forbidden in URL encoding." |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
294 ;; (setq str (or str "")) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
295 ;; (setq str (replace-regexp-in-string "%[[:xdigit:]]\\{2\\}" |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
296 ;; (lambda (match) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
297 ;; (string (string-to-number |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
298 ;; (substring match 1) 16))) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
299 ;; str t t)) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
300 ;; (if allow-newlines |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
301 ;; (replace-regexp-in-string "[\n\r]" (lambda (match) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
302 ;; (format "%%%.2X" (aref match 0))) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
303 ;; str t t) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
304 ;; str)) |
a78c94aa182d
(url-hexify-string): Don't give multibyte error for char <16.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54770
diff
changeset
|
305 |
54695 | 306 ;;;###autoload |
307 (defun url-unhex-string (str &optional allow-newlines) | |
96486
7369ded3b436
Typo and docstring fixes.
Juanma Barranquero <lekktu@gmail.com>
parents:
94668
diff
changeset
|
308 "Remove %XX embedded spaces, etc in a URL. |
54695 | 309 If optional second argument ALLOW-NEWLINES is non-nil, then allow the |
310 decoding of carriage returns and line feeds in the string, which is normally | |
311 forbidden in URL encoding." | |
312 (setq str (or str "")) | |
313 (let ((tmp "") | |
314 (case-fold-search t)) | |
315 (while (string-match "%[0-9a-f][0-9a-f]" str) | |
316 (let* ((start (match-beginning 0)) | |
317 (ch1 (url-unhex (elt str (+ start 1)))) | |
318 (code (+ (* 16 ch1) | |
319 (url-unhex (elt str (+ start 2)))))) | |
320 (setq tmp (concat | |
321 tmp (substring str 0 start) | |
322 (cond | |
323 (allow-newlines | |
324 (char-to-string code)) | |
325 ((or (= code ?\n) (= code ?\r)) | |
326 " ") | |
327 (t (char-to-string code)))) | |
328 str (substring str (match-end 0))))) | |
329 (setq tmp (concat tmp str)) | |
330 tmp)) | |
331 | |
332 (defconst url-unreserved-chars | |
333 '( | |
334 ?a ?b ?c ?d ?e ?f ?g ?h ?i ?j ?k ?l ?m ?n ?o ?p ?q ?r ?s ?t ?u ?v ?w ?x ?y ?z | |
335 ?A ?B ?C ?D ?E ?F ?G ?H ?I ?J ?K ?L ?M ?N ?O ?P ?Q ?R ?S ?T ?U ?V ?W ?X ?Y ?Z | |
336 ?0 ?1 ?2 ?3 ?4 ?5 ?6 ?7 ?8 ?9 | |
337 ?- ?_ ?. ?! ?~ ?* ?' ?\( ?\)) | |
338 "A list of characters that are _NOT_ reserved in the URL spec. | |
339 This is taken from RFC 2396.") | |
340 | |
341 ;;;###autoload | |
72196
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
342 (defun url-hexify-string (string) |
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
343 "Return a new string that is STRING URI-encoded. |
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
344 First, STRING is converted to utf-8, if necessary. Then, for each |
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
345 character in the utf-8 string, those found in `url-unreserved-chars' |
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
346 are left as-is, all others are represented as a three-character |
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
347 string: \"%\" followed by two lowercase hex digits." |
72218
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
348 ;; To go faster and avoid a lot of consing, we could do: |
96486
7369ded3b436
Typo and docstring fixes.
Juanma Barranquero <lekktu@gmail.com>
parents:
94668
diff
changeset
|
349 ;; |
72218
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
350 ;; (defconst url-hexify-table |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
351 ;; (let ((map (make-vector 256 nil))) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
352 ;; (dotimes (byte 256) (aset map byte |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
353 ;; (if (memq byte url-unreserved-chars) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
354 ;; (char-to-string byte) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
355 ;; (format "%%%02x" byte)))) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
356 ;; map)) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
357 ;; |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
358 ;; (mapconcat (curry 'aref url-hexify-table) ...) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
359 (mapconcat (lambda (byte) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
360 (if (memq byte url-unreserved-chars) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
361 (char-to-string byte) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
362 (format "%%%02x" byte))) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
363 (if (multibyte-string-p string) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
364 (encode-coding-string string 'utf-8) |
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
365 string) |
72196
5b336ff592bb
(url-hexify-string): Rewrite.
Thien-Thi Nguyen <ttn@gnuvola.org>
parents:
68640
diff
changeset
|
366 "")) |
54695 | 367 |
368 ;;;###autoload | |
369 (defun url-file-extension (fname &optional x) | |
370 "Return the filename extension of FNAME. | |
96486
7369ded3b436
Typo and docstring fixes.
Juanma Barranquero <lekktu@gmail.com>
parents:
94668
diff
changeset
|
371 If optional argument X is t, then return the basename |
7369ded3b436
Typo and docstring fixes.
Juanma Barranquero <lekktu@gmail.com>
parents:
94668
diff
changeset
|
372 of the file with the extension stripped off." |
54695 | 373 (if (and fname |
79064
5299839279f5
(url-basepath): Function deleted.
Richard M. Stallman <rms@gnu.org>
parents:
78850
diff
changeset
|
374 (setq fname (url-file-nondirectory fname)) |
54695 | 375 (string-match "\\.[^./]+$" fname)) |
376 (if x (substring fname 0 (match-beginning 0)) | |
377 (substring fname (match-beginning 0) nil)) | |
378 ;; | |
379 ;; If fname has no extension, and x then return fname itself instead of | |
380 ;; nothing. When caching it allows the correct .hdr file to be produced | |
381 ;; for filenames without extension. | |
382 ;; | |
383 (if x | |
384 fname | |
385 ""))) | |
386 | |
387 ;;;###autoload | |
388 (defun url-truncate-url-for-viewing (url &optional width) | |
101145
b375012e7a7a
* url-util.el (url-truncate-url-for-viewing): Doc fix.
Juanma Barranquero <lekktu@gmail.com>
parents:
100908
diff
changeset
|
389 "Return a shortened version of URL that is WIDTH characters wide or less. |
54695 | 390 WIDTH defaults to the current frame width." |
391 (let* ((fr-width (or width (frame-width))) | |
392 (str-width (length url)) | |
393 (fname nil) | |
394 (modified 0) | |
395 (urlobj nil)) | |
396 ;; The first thing that can go are the search strings | |
397 (if (and (>= str-width fr-width) | |
398 (string-match "?" url)) | |
399 (setq url (concat (substring url 0 (match-beginning 0)) "?...") | |
72218
23d71f51857b
(url-hexify-string): Only utf-8 encode if it's a multibyte string.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
72196
diff
changeset
|
400 str-width (length url))) |
54695 | 401 (if (< str-width fr-width) |
402 nil ; Hey, we are done! | |
403 (setq urlobj (url-generic-parse-url url) | |
404 fname (url-filename urlobj) | |
405 fr-width (- fr-width 4)) | |
406 (while (and (>= str-width fr-width) | |
407 (string-match "/" fname)) | |
408 (setq fname (substring fname (match-end 0) nil) | |
409 modified (1+ modified)) | |
83823
dd2bcc6758a0
* url-parse.el (url): Use defstruct rather than macros. Update all callers.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
78222
diff
changeset
|
410 (setf (url-filename urlobj) fname) |
54695 | 411 (setq url (url-recreate-url urlobj) |
412 str-width (length url))) | |
413 (if (> modified 1) | |
414 (setq fname (concat "/.../" fname)) | |
415 (setq fname (concat "/" fname))) | |
83823
dd2bcc6758a0
* url-parse.el (url): Use defstruct rather than macros. Update all callers.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
78222
diff
changeset
|
416 (setf (url-filename urlobj) fname) |
54695 | 417 (setq url (url-recreate-url urlobj))) |
418 url)) | |
419 | |
420 ;;;###autoload | |
421 (defun url-view-url (&optional no-show) | |
422 "View the current document's URL. | |
423 Optional argument NO-SHOW means just return the URL, don't show it in | |
424 the minibuffer. | |
425 | |
426 This uses `url-current-object', set locally to the buffer." | |
427 (interactive) | |
428 (if (not url-current-object) | |
429 nil | |
430 (if no-show | |
431 (url-recreate-url url-current-object) | |
432 (message "%s" (url-recreate-url url-current-object))))) | |
433 | |
434 (eval-and-compile | |
435 (defvar url-get-url-filename-chars "-%.?@a-zA-Z0-9()_/:~=&" | |
96486
7369ded3b436
Typo and docstring fixes.
Juanma Barranquero <lekktu@gmail.com>
parents:
94668
diff
changeset
|
436 "Valid characters in a URL.") |
54695 | 437 ) |
438 | |
439 (defun url-get-url-at-point (&optional pt) | |
440 "Get the URL closest to point, but don't change position. | |
441 Has a preference for looking backward when not directly on a symbol." | |
442 ;; Not at all perfect - point must be right in the name. | |
443 (save-excursion | |
444 (if pt (goto-char pt)) | |
445 (let (start url) | |
446 (save-excursion | |
447 ;; first see if you're just past a filename | |
448 (if (not (eobp)) | |
449 (if (looking-at "[] \t\n[{}()]") ; whitespace or some parens | |
450 (progn | |
451 (skip-chars-backward " \n\t\r({[]})") | |
452 (if (not (bobp)) | |
453 (backward-char 1))))) | |
454 (if (and (char-after (point)) | |
455 (string-match (eval-when-compile | |
456 (concat "[" url-get-url-filename-chars "]")) | |
457 (char-to-string (char-after (point))))) | |
458 (progn | |
459 (skip-chars-backward url-get-url-filename-chars) | |
460 (setq start (point)) | |
461 (skip-chars-forward url-get-url-filename-chars)) | |
462 (setq start (point))) | |
463 (setq url (buffer-substring-no-properties start (point)))) | |
464 (if (and url (string-match "^(.*)\\.?$" url)) | |
465 (setq url (match-string 1 url))) | |
466 (if (and url (string-match "^URL:" url)) | |
467 (setq url (substring url 4 nil))) | |
468 (if (and url (string-match "\\.$" url)) | |
469 (setq url (substring url 0 -1))) | |
470 (if (and url (string-match "^www\\." url)) | |
471 (setq url (concat "http://" url))) | |
472 (if (and url (not (string-match url-nonrelative-link url))) | |
473 (setq url nil)) | |
474 url))) | |
475 | |
476 (defun url-generate-unique-filename (&optional fmt) | |
477 "Generate a unique filename in `url-temporary-directory'." | |
101912
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
478 ;; This variable is obsolete, but so is this function. |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
479 (let ((tempdir (with-no-warnings url-temporary-directory))) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
480 (if (not fmt) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
481 (let ((base (format "url-tmp.%d" (user-real-uid))) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
482 (fname "") |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
483 (x 0)) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
484 (setq fname (format "%s%d" base x)) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
485 (while (file-exists-p |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
486 (expand-file-name fname tempdir)) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
487 (setq x (1+ x) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
488 fname (concat base (int-to-string x)))) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
489 (expand-file-name fname tempdir)) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
490 (let ((base (concat "url" (int-to-string (user-real-uid)))) |
54695 | 491 (fname "") |
492 (x 0)) | |
101912
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
493 (setq fname (format fmt (concat base (int-to-string x)))) |
54695 | 494 (while (file-exists-p |
101912
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
495 (expand-file-name fname tempdir)) |
54695 | 496 (setq x (1+ x) |
101912
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
497 fname (format fmt (concat base (int-to-string x))))) |
c28ecc931e8c
(url-generate-unique-filename): Silence compiler.
Glenn Morris <rgm@gnu.org>
parents:
101887
diff
changeset
|
498 (expand-file-name fname tempdir))))) |
101887
3a192c2f3ada
(url-generate-unique-filename): Mark as obsolete.
Chong Yidong <cyd@stupidchicken.com>
parents:
101145
diff
changeset
|
499 (make-obsolete 'url-generate-unique-filename 'make-temp-file "23.1") |
54695 | 500 |
501 (defun url-extract-mime-headers () | |
502 "Set `url-current-mime-headers' in current buffer." | |
503 (save-excursion | |
504 (goto-char (point-min)) | |
505 (unless url-current-mime-headers | |
506 (set (make-local-variable 'url-current-mime-headers) | |
507 (mail-header-extract))))) | |
508 | |
79558
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
509 (defun url-make-private-file (file) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
510 "Make FILE only readable and writable by the current user. |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
511 Creates FILE and its parent directories if they do not exist." |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
512 (let ((dir (file-name-directory file))) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
513 (when dir |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
514 ;; For historical reasons. |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
515 (make-directory dir t))) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
516 ;; Based on doc-view-make-safe-dir. |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
517 (condition-case nil |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
518 (let ((umask (default-file-modes))) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
519 (unwind-protect |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
520 (progn |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
521 (set-default-file-modes #o0600) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
522 (with-temp-buffer |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
523 (write-region (point-min) (point-max) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
524 file nil 'silent nil 'excl))) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
525 (set-default-file-modes umask))) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
526 (file-already-exists |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
527 (if (file-symlink-p file) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
528 (error "Danger: `%s' is a symbolic link" file)) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
529 (set-file-modes file #o0600)))) |
ba4da6f08090
(url-make-private-file): New function.
Glenn Morris <rgm@gnu.org>
parents:
79064
diff
changeset
|
530 |
54695 | 531 (provide 'url-util) |
54699 | 532 |
54935
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
533 ;; arch-tag: 24352abc-5a5a-412e-90cd-313b26bed5c9 |
efddc239393d
(url-debug): Use with-current-buffer.
Stefan Monnier <monnier@iro.umontreal.ca>
parents:
54803
diff
changeset
|
534 ;;; url-util.el ends here |