Mercurial > emacs
annotate lisp/international/mule-util.el @ 19688:854a46c2aac5
(detect_coding_mask): Add in CODING_CATEGORY_MASK_RAW_TEXT
in the detect_coding_iso2022 case.
author | Richard M. Stallman <rms@gnu.org> |
---|---|
date | Tue, 02 Sep 1997 20:56:02 +0000 |
parents | 7cf3d42a6fd7 |
children | 356bc22e88f6 |
rev | line source |
---|---|
17052 | 1 ;;; mule-util.el --- Utility functions for multilingual environment (mule) |
2 | |
3 ;; Copyright (C) 1995 Electrotechnical Laboratory, JAPAN. | |
18377
8b4a66c66dd6
Change copyright notice.
Richard M. Stallman <rms@gnu.org>
parents:
18313
diff
changeset
|
4 ;; Licensed to the Free Software Foundation. |
17052 | 5 |
6 ;; Keywords: mule, multilingual | |
7 | |
8 ;; This file is part of GNU Emacs. | |
9 | |
10 ;; GNU Emacs is free software; you can redistribute it and/or modify | |
11 ;; it under the terms of the GNU General Public License as published by | |
12 ;; the Free Software Foundation; either version 2, or (at your option) | |
13 ;; any later version. | |
14 | |
15 ;; GNU Emacs is distributed in the hope that it will be useful, | |
16 ;; but WITHOUT ANY WARRANTY; without even the implied warranty of | |
17 ;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
18 ;; GNU General Public License for more details. | |
19 | |
20 ;; You should have received a copy of the GNU General Public License | |
17071 | 21 ;; along with GNU Emacs; see the file COPYING. If not, write to the |
22 ;; Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
23 ;; Boston, MA 02111-1307, USA. | |
17052 | 24 |
25 ;;; Code: | |
26 | |
27 ;;; String manipulations while paying attention to multibyte | |
28 ;;; characters. | |
29 | |
30 ;;;###autoload | |
(defun string-to-sequence (string type)
  "Return the characters of STRING as a sequence of TYPE.
TYPE must be the symbol `list' or `vector'; any other value signals
an error.  STRING is scanned with `sref', stepping forward by the
`char-bytes' of each character found, so a multibyte character
contributes exactly one element."
  (if (not (memq type '(list vector)))
      (error "Invalid type: %s" type))
  (let ((nbytes (length string))
        (pos 0)
        (chars nil)
        c)
    ;; Collect in reverse, then flip once at the end.
    (while (< pos nbytes)
      (setq c (sref string pos)
            chars (cons c chars)
            pos (+ pos (char-bytes c))))
    (setq chars (nreverse chars))
    (cond ((eq type 'list) chars)
          (t (vconcat chars)))))
47 | |
48 ;;;###autoload | |
(defsubst string-to-list (string)
  "Convert STRING into a list holding its characters in order.
This is `string-to-sequence' with TYPE fixed to `list'."
  (let ((type 'list))
    (string-to-sequence string type)))
52 | |
53 ;;;###autoload | |
(defsubst string-to-vector (string)
  "Convert STRING into a vector holding its characters in order.
This is `string-to-sequence' with TYPE fixed to `vector'."
  (let ((type 'vector))
    (string-to-sequence string type)))
57 | |
58 ;;;###autoload | |
(defun store-substring (string idx obj)
  "Overwrite part of STRING, starting at index IDX, with OBJ.
OBJ is a string or a character; a character is first converted with
`char-to-string'.  Copying stops at the end of OBJ or at the end of
STRING, whichever comes first.  STRING is modified in place and is
also the return value.  Signal an error if OBJ is neither a string
nor an integer."
  (let (src src-len dst-len (k 0))
    (if (stringp obj)
        (setq src obj)
      (if (integerp obj)
          (setq src (char-to-string obj))
        (error "Invalid argument (should be string or character): %s"
               obj)))
    (setq src-len (length src)
          dst-len (length string))
    ;; Element-wise copy, clipped to the room left in STRING.
    (while (and (< k src-len) (< idx dst-len))
      (aset string idx (aref src k))
      (setq k (1+ k)
            idx (1+ idx)))
    string))
73 | |
74 ;;;###autoload | |
(defun truncate-string-to-width (str width &optional start-column padding)
  "Truncate string STR to fit in WIDTH columns.
Optional 1st arg START-COLUMN if non-nil specifies the starting column.
Optional 2nd arg PADDING if non-nil is a padding character to be padded at
the head and tail of the resulting string to fit in WIDTH if necessary.
If PADDING is nil, the resulting string may be narrower than WIDTH.

Head padding is added when the character scan overshoots START-COLUMN
\(a wide character straddles it).  Tail padding is added when the kept
text ends before column WIDTH.  If STR ends before START-COLUMN is
reached, the result is WIDTH copies of PADDING, or the empty string
when PADDING is nil."
  (or start-column
      (setq start-column 0))
  (let ((len (length str))
        (idx 0)
        (column 0)
        (head-padding "") (tail-padding "")
        ch last-column last-idx from-idx)
    ;; Skip the characters lying before START-COLUMN.  Running off the
    ;; end of STR makes `sref' signal args-out-of-range, which simply
    ;; ends the scan.
    (condition-case nil
        (while (< column start-column)
          (setq ch (sref str idx)
                column (+ column (char-width ch))
                idx (+ idx (char-bytes ch))))
      (args-out-of-range (setq idx len)))
    (if (< column start-column)
        ;; STR is exhausted before START-COLUMN.
        (if padding (make-string width padding) "")
      ;; The scan overshot START-COLUMN: fill the gap with PADDING
      ;; (this used to be a hard-coded space, ignoring PADDING).
      (if (and padding (> column start-column))
          (setq head-padding (make-string (- column start-column) padding)))
      (setq from-idx idx)
      ;; Take characters until WIDTH is reached, remembering the state
      ;; before the last character so that an overshoot can be undone.
      (condition-case nil
          (while (< column width)
            (setq last-column column
                  last-idx idx
                  ch (sref str idx)
                  column (+ column (char-width ch))
                  idx (+ idx (char-bytes ch))))
        (args-out-of-range (setq idx len)))
      (if (> column width)
          (setq column last-column idx last-idx))
      (if (and padding (< column width))
          (setq tail-padding (make-string (- width column) padding)))
      (setq str (substring str from-idx idx))
      (if padding
          (concat head-padding str tail-padding)
        str))))
115 | |
116 ;;; For backward compatibility ... | |
117 ;;;###autoload | |
118 (defalias 'truncate-string 'truncate-string-to-width) | |
119 (make-obsolete 'truncate-string 'truncate-string-to-width) | |
120 | |
121 ;;; Nested alist handler. A nested alist is an alist whose elements | |
122 ;;; are also nested alists. | |
123 | |
124 ;;;###autoload | |
(defsubst nested-alist-p (obj)
  "Return t if OBJ has the shape of a nested alist, else nil.

A nested alist is a list of the form (ENTRY . BRANCHES), where ENTRY
is any Lisp object and BRANCHES is a list of cons cells of the form
\(KEY-ELEMENT . NESTED-ALIST).

A nested alist stores a Lisp object (ENTRY) for a key sequence
KEYSEQ, where KEYSEQ is a sequence of KEY-ELEMENTs given as a string,
a vector, or a list.

Only the outermost cell is inspected: OBJ must be a cons whose cdr
is a list."
  (and (consp obj)
       (listp (cdr obj))))
136 | |
137 ;;;###autoload | |
(defun set-nested-alist (keyseq entry alist &optional len branches)
  "Set ENTRY for KEYSEQ in a nested alist ALIST.
Optional 4th arg LEN non-nil means only the first LEN elements of
KEYSEQ are considered.
Optional argument BRANCHES if non-nil is branches for a keyseq
longer than KEYSEQ.
See the documentation of `nested-alist-p' for more detail.

ALIST is modified destructively; missing intermediate levels are
created with a placeholder entry of t.  Signal an error if ALIST is
not a nested alist, if an intermediate level is not a nested alist,
or if BRANCHES is given but the target level already has branches."
  (or (nested-alist-p alist)
      (error "Invalid argument %s" alist))
  (let ((islist (listp keyseq))
        (len (or len (length keyseq)))
        (i 0)
        key-elt slot)
    ;; Walk down one level per key element, creating levels on demand.
    (while (< i len)
      (if (null (nested-alist-p alist))
          (error "Keyseq %s is too long for this nested alist" keyseq))
      (setq key-elt (if islist (nth i keyseq) (aref keyseq i)))
      (setq slot (assoc key-elt (cdr alist)))
      (if (null slot)
          (progn
            ;; New level: (KEY-ELT t), pushed onto this level's branches.
            (setq slot (cons key-elt (list t)))
            (setcdr alist (cons slot (cdr alist)))))
      (setq alist (cdr slot))
      (setq i (1+ i)))
    ;; ALIST is now the level reached by KEYSEQ.
    (setcar alist entry)
    (if branches
        (if (cdr alist)
            (error "Can't set branches for keyseq %s" keyseq)
          (setcdr alist branches)))))
167 | |
168 ;;;###autoload | |
(defun lookup-nested-alist (keyseq alist &optional len start nil-for-too-long)
  "Look up key sequence KEYSEQ in nested alist ALIST.  Return the definition.
Optional 1st argument LEN specifies the length of KEYSEQ.
Optional 2nd argument START specifies index of the starting key.
The returned value is normally a nested alist of which
car part is the entry for KEYSEQ.
If ALIST is not deep enough for KEYSEQ, return the number of key
elements at the front of KEYSEQ that were matched before the lookup
failed.
Optional 3rd argument NIL-FOR-TOO-LONG non-nil means return nil
instead of that number when ALIST is not deep enough.
Signal an error if ALIST is not a nested alist."
  (or (nested-alist-p alist)
      (error "Invalid argument %s" alist))
  (or len
      (setq len (length keyseq)))
  (let ((i (or start 0))
        (islist (listp keyseq))
        (too-long nil))
    ;; Descend one level per key element; stop at the first element
    ;; that has no branch at the current level.
    (while (and (not too-long) (< i len))
      (if (setq alist (cdr (assoc (if islist (nth i keyseq) (aref keyseq i))
                                  (cdr alist))))
          (setq i (1+ i))
        (setq too-long t)))
    (if too-long
        ;; KEYSEQ is too long.
        (if nil-for-too-long nil i)
      alist)))
198 | |
18299
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
199 |
17052 | 200 ;; Coding system related functions. |
201 | |
202 ;;;###autoload | |
18200
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
(defun coding-system-base (coding-system)
  "Return a base of CODING-SYSTEM.
The base is a coding system of which coding-system property is a
coding-spec (see the function `make-coding-system').

A `coding-system' property that is a vector marks a base; a property
that is a symbol is followed as a link to another coding system.
Signal an error if the chain reaches a symbol whose `coding-system'
property is neither a vector nor a non-nil symbol."
  (let ((coding-spec (get coding-system 'coding-system)))
    (cond ((vectorp coding-spec)
           coding-system)
          ((and coding-spec (symbolp coding-spec))
           (coding-system-base coding-spec))
          ;; Without this clause a missing property made the function
          ;; recurse on nil until the eval depth limit was hit.
          (t
           (error "Invalid coding system: %s" coding-system)))))
17052 | 211 |
212 ;;;###autoload | |
18200
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
(defun coding-system-eol-type-mnemonic (coding-system)
  "Return mnemonic letter of eol-type of CODING-SYSTEM.
The eol-type is obtained from `coding-system-eol-type'.  A vector
yields `eol-mnemonic-undecided'; the integers 0, 1 and 2 yield
`eol-mnemonic-unix', `eol-mnemonic-dos' and `eol-mnemonic-mac'
respectively; anything else yields the character `-'."
  (let ((eol-type (coding-system-eol-type coding-system)))
    (cond ((vectorp eol-type) eol-mnemonic-undecided)
          ((eq eol-type 0) eol-mnemonic-unix)
          ;; Types 1 and 2 used to return the Unix mnemonic as well.
          ((eq eol-type 1) eol-mnemonic-dos)
          ((eq eol-type 2) eol-mnemonic-mac)
          (t ?-))))
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
221 |
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
222 ;;;###autoload |
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
(defun coding-system-post-read-conversion (coding-system)
  "Return the `post-read-conversion' property in effect for CODING-SYSTEM.
If CODING-SYSTEM itself has no such property, the coding system named
by its `coding-system' property is consulted, and so on.  Return nil
if CODING-SYSTEM is nil or not a symbol, or if no coding system in
the chain has the property."
  (if (and coding-system (symbolp coding-system))
      (let ((own (get coding-system 'post-read-conversion)))
        (if own
            own
          ;; Nothing set here; ask whatever this coding system is
          ;; defined in terms of.
          (coding-system-post-read-conversion
           (get coding-system 'coding-system))))
    nil))
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
230 |
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
231 ;;;###autoload |
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
(defun coding-system-pre-write-conversion (coding-system)
  "Return the `pre-write-conversion' property in effect for CODING-SYSTEM.
If CODING-SYSTEM itself has no such property, the coding system named
by its `coding-system' property is consulted, and so on.  Return nil
if CODING-SYSTEM is nil or not a symbol, or if no coding system in
the chain has the property."
  (if (and coding-system (symbolp coding-system))
      (let ((own (get coding-system 'pre-write-conversion)))
        (if own
            own
          ;; Nothing set here; ask whatever this coding system is
          ;; defined in terms of.
          (coding-system-pre-write-conversion
           (get coding-system 'coding-system))))
    nil))
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
239 |
c913160e34a7
(set-coding-system-alist): Deleted.
Kenichi Handa <handa@m17n.org>
parents:
17092
diff
changeset
|
240 ;;;###autoload |
19455
7cf3d42a6fd7
(coding-system-unification-table):
Kenichi Handa <handa@m17n.org>
parents:
19264
diff
changeset
|
(defun coding-system-unification-table-for-decode (coding-system)
  "Return unification-table-for-decode property of CODING-SYSTEM.
If CODING-SYSTEM itself has no such property, the coding system named
by its `coding-system' property is consulted, and so on.  Return nil
if CODING-SYSTEM is nil or not a symbol, or if no coding system in
the chain has the property."
  (and coding-system
       (symbolp coding-system)
       (or (get coding-system 'unification-table-for-decode)
           ;; Recurse on this function; the fallback used to call
           ;; `coding-system-unification-table', which this file does
           ;; not define.
           (coding-system-unification-table-for-decode
            (get coding-system 'coding-system)))))
7cf3d42a6fd7
(coding-system-unification-table):
Kenichi Handa <handa@m17n.org>
parents:
19264
diff
changeset
|
248 |
7cf3d42a6fd7
(coding-system-unification-table):
Kenichi Handa <handa@m17n.org>
parents:
19264
diff
changeset
|
249 ;;;###autoload |
7cf3d42a6fd7
(coding-system-unification-table):
Kenichi Handa <handa@m17n.org>
parents:
19264
diff
changeset
|
(defun coding-system-unification-table-for-encode (coding-system)
  "Return unification-table-for-encode property of CODING-SYSTEM.
If CODING-SYSTEM itself has no such property, the coding system named
by its `coding-system' property is consulted, and so on.  Return nil
if CODING-SYSTEM is nil or not a symbol, or if no coding system in
the chain has the property."
  (and coding-system
       (symbolp coding-system)
       (or (get coding-system 'unification-table-for-encode)
           ;; Recurse on this function; the fallback used to call
           ;; `coding-system-unification-table', which this file does
           ;; not define.
           (coding-system-unification-table-for-encode
            (get coding-system 'coding-system)))))
17052 | 257 |
18299
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
(defun coding-system-lessp (x y)
  "Return non-nil if coding system X should be listed before Y.
The symbols `no-conversion', `emacs-mule' and `undecided' come first,
in that order of precedence; X is tested before Y at each step, so
the result is t when both are the same one of these.  Any other pair
is ordered by `coding-system-mnemonic': first by the downcased
mnemonic character, then, on a tie, by the raw character code."
  (let ((leaders '(no-conversion emacs-mule undecided))
        (decided nil)
        (result nil))
    ;; The first leader that matches X or Y settles the comparison.
    (while (and leaders (not decided))
      (cond ((eq x (car leaders)) (setq decided t result t))
            ((eq y (car leaders)) (setq decided t result nil)))
      (setq leaders (cdr leaders)))
    (if decided
        result
      (let* ((m1 (coding-system-mnemonic x))
             (m2 (coding-system-mnemonic y))
             (low1 (downcase m1))
             (low2 (downcase m2)))
        (if (= low1 low2)
            (< m1 m2)
          (< low1 low2))))))
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
270 |
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
271 ;;;###autoload |
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
(defun coding-system-list (&optional base-only)
  "Return a list of all existing coding systems.
If optional arg BASE-ONLY is non-nil, only base coding systems are listed.

A coding system here is any interned symbol with a non-nil
`coding-system' property.  The list is sorted with
`coding-system-lessp'.  Symbols with a non-nil `eol-variant' property
are always left out; when BASE-ONLY is non-nil, symbols for which
`coding-system-parent' returns non-nil are left out as well."
  (let (l)
    (mapatoms (lambda (x) (if (get x 'coding-system) (setq l (cons x l)))))
    ;; HEAD is a dummy cell in front of the sorted list, so that the
    ;; first real element can be unlinked like any other.  The result
    ;; must be read back through HEAD: returning the original list
    ;; pointer would keep a removed first element.
    (let* ((head (cons nil (sort l 'coding-system-lessp)))
           (tail head)
           coding)
      ;; At first, remove subsidiary coding systems (eol variants) and
      ;; alias coding systems (if necessary).
      (while (cdr tail)
        (setq coding (car (cdr tail)))
        (if (or (get coding 'eol-variant)
                (and base-only (coding-system-parent coding)))
            (setcdr tail (cdr (cdr tail)))
          (setq tail (cdr tail))))
      (cdr head))))
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
289 |
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
290 ;;;###autoload |
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
(defun coding-system-plist (coding-system)
  "Return a property list describing CODING-SYSTEM.
The result has the keys `coding-spec', `eol-type',
`post-read-conversion', `pre-write-conversion' and
`unification-table', in that order.  Starting at CODING-SYSTEM, the
chain of symbols linked through the `coding-system' property is
followed; for each key other than `coding-spec', the first non-nil
value met along the chain is used.  `coding-spec' is the
`coding-system' property of the last symbol in the chain.  Signal an
error if that property is nil."
  ;; NOTE(review): this reads the `unification-table' property, while
  ;; the accessor functions in this file read
  ;; `unification-table-for-decode' and `unification-table-for-encode'
  ;; -- confirm which property names are actually set.
  (let ((cs coding-system)
        (walking t)
        spec eol post pre unif)
    (while walking
      (if (null eol)
          (setq eol (get cs 'eol-type)))
      (if (null post)
          (setq post (get cs 'post-read-conversion)))
      (if (null pre)
          (setq pre (get cs 'pre-write-conversion)))
      (if (null unif)
          (setq unif (get cs 'unification-table)))
      (setq spec (get cs 'coding-system))
      ;; A symbol is a link to follow; anything else ends the walk.
      (if (and spec (symbolp spec))
          (setq cs spec)
        (setq walking nil)))
    (or spec
        (error "Invalid coding system: %s" cs))
    (list 'coding-spec spec
          'eol-type eol
          'post-read-conversion post
          'pre-write-conversion pre
          'unification-table unif)))
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
320 |
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
321 ;;;###autoload |
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
(defun coding-system-equal (coding-system-1 coding-system-2)
  "Return t if and only if CODING-SYSTEM-1 and CODING-SYSTEM-2 are identical.
They count as identical when they are the same symbol, or when
`coding-system-plist' returns `equal' property lists for both, as
happens when one is an alias of the other."
  (cond ((eq coding-system-1 coding-system-2)
         t)
        (t
         (let ((plist-1 (coding-system-plist coding-system-1))
               (plist-2 (coding-system-plist coding-system-2)))
           (equal plist-1 plist-2)))))
c6f35cac24b4
(coding-system-parent): New function.
Kenichi Handa <handa@m17n.org>
parents:
18200
diff
changeset
|
329 |
17052 | 330 |
331 ;;; Composite character manipulations. | |
332 | |
333 ;;;###autoload | |
(defun compose-region (start end)
  "Compose all characters in the current region into one composite character.
When called from a program, expects two arguments,
positions (integers or markers) specifying the region.

The region text is replaced by the result of `compose-string'.  Point
is preserved by `save-excursion'."
  (interactive "r")
  (save-excursion
    ;; Compose before touching the buffer, so that an error signaled
    ;; by `compose-string' leaves the original text in place.
    (let ((composed (compose-string (buffer-substring start end))))
      (goto-char start)
      (delete-region start end)
      (insert composed))))
344 | |
345 ;;;###autoload | |
(defun decompose-region (start end)
  "Decompose all composite characters in the current region.
Composite characters are broken up into individual components.
When called from a program, expects two arguments,
positions (integers or markers) specifying the region.

The buffer is narrowed to the region while the replacement runs and
the previous restriction is restored afterwards.  Point is not
restored."
  (interactive "r")
  (save-restriction
    (narrow-to-region start end)
    (goto-char (point-min))
    ;; The search and replacement run with multibyte handling bound
    ;; off, so the regexp is matched against individual bytes.
    (let ((enable-multibyte-characters nil)
          ;; This matches the whole bytes of single composite character.
          (re-cmpchar "\200[\240-\377]+")
          str)
      (while (re-search-forward re-cmpchar nil t)
        (setq str (buffer-substring (match-beginning 0) (match-end 0)))
        (delete-region (match-beginning 0) (match-end 0))
        (insert (decompose-composite-char (string-to-char str)))))))
363 | |
364 ;;;###autoload | |
19264
6122dbba797f
(prefer-coding-system): Moved to mule-util.el.
Kenichi Handa <handa@m17n.org>
parents:
19056
diff
changeset
|
(defun decompose-string (string)
  "Return a copy of STRING with every composite character decomposed.
Each character for which `cmpcharp' returns non-nil is replaced by
the result of `decompose-composite-char'; every other character is
kept as is.  The pieces are concatenated in their original order."
  (mapconcat (function
              (lambda (ch)
                (if (cmpcharp ch)
                    (decompose-composite-char ch)
                  (char-to-string ch))))
             (string-to-list string)
             ""))
6122dbba797f
(prefer-coding-system): Moved to mule-util.el.
Kenichi Handa <handa@m17n.org>
parents:
19056
diff
changeset
|
376 |
6122dbba797f
(prefer-coding-system): Moved to mule-util.el.
Kenichi Handa <handa@m17n.org>
parents:
19056
diff
changeset
|
377 ;;;###autoload |
(defconst reference-point-alist
  '(;; Two-letter abbreviations.
    (tl . 0) (tc . 1) (tr . 2)
    (ml . 3) (mc . 4) (mr . 5)
    (bl . 6) (bc . 7) (br . 8)
    ;; Spelled-out names.
    (top-left . 0) (top-center . 1) (top-right . 2)
    (mid-left . 3) (mid-center . 4) (mid-right . 5)
    (bottom-left . 6) (bottom-center . 7) (bottom-right . 8)
    ;; The codes themselves.
    (0 . 0) (1 . 1) (2 . 2)
    (3 . 3) (4 . 4) (5 . 5)
    (6 . 6) (7 . 7) (8 . 8))
  "Alist of reference point symbols vs reference point codes.
A reference point symbol is to be used to specify a composition rule
while making a composite character by the function `compose-chars'
\(which see).

Meanings of reference point codes are as follows:

    0----1----2 <-- ascent      0:tl or top-left
    |         |                 1:tc or top-center
    |         |                 2:tr or top-right
    |         |                 3:ml or mid-left
    |    4 <--+---- center      4:mc or mid-center
    |         |                 5:mr or mid-right
--- 3         5 <-- baseline    6:bl or bottom-left
    |         |                 7:bc or bottom-center
    6----7----8 <-- descent     8:br or bottom-right

Reference point symbols are to be used to specify composition rule of
the form \(GLOBAL-REF-POINT . NEW-REF-POINT), where GLOBAL-REF-POINT
is a reference point in the overall glyphs already composed, and
NEW-REF-POINT is a reference point in the new glyph to be added.

For instance, if GLOBAL-REF-POINT is 8 and NEW-REF-POINT is 1, the
overall glyph is updated as follows:

        +-------+--+ <--- new ascent
        |       |  |
        | global|  |
        | glyph |  |
    --- |       |  | <--- baseline (doesn't change)
        +----+--+--+
        |    | new |
        |    |glyph|
        +----+-----+ <--- new descent
")
423 | |
;; Return the string that represents character CH inside the multibyte
;; form of a composite character.
;;   - CH below 128: the byte \240 followed by CH + 128.
;;   - CH itself composite: its own string form with the first byte
;;     dropped, and the second byte too when that byte is ?\xFF.
;;   - any other CH: its string form with ?\x20 added to the first byte.
(defun compose-chars-component (ch)
  (cond ((< ch 128)
         (format "\240%c" (+ ch 128)))
        ((cmpcharp ch)
         (let ((bytes (char-to-string ch)))
           ;; Skip one byte, or two when the second one is ?\xFF.
           (substring bytes (if (= (aref bytes 1) ?\xFF) 2 1))))
        (t
         (let ((bytes (char-to-string ch)))
           (aset bytes 0 (+ (aref bytes 0) ?\x20))
           bytes))))
;; Return the one-character string that represents composition rule
;; RULE inside the multibyte form of a composite character.  RULE is a
;; cons (GLOBAL-REF-POINT . NEW-REF-POINT); both halves are looked up
;; in `reference-point-alist' and packed as ?\xA0 + GLOBAL * 9 + NEW.
(defsubst compose-chars-rule (rule)
  (let* ((global-code (cdr (assq (car rule) reference-point-alist)))
         (new-code (cdr (assq (cdr rule) reference-point-alist))))
    (char-to-string (+ ?\xA0 (* global-code 9) new-code))))
441 | |
442 ;;;###autoload | |
(defun compose-chars (first-component &rest args)
  "Return one char string composed from the arguments.
Each argument is a character (including a composite character)
or a composition rule.
A composition rule has the form \(GLOBAL-REF-POINT . NEW-REF-POINT).
See the documentation of `reference-point-alist' for more detail.

If the first element of ARGS is a composition rule, ARGS must
alternate between a rule and the character that rule applies to;
an error is signaled for a non-rule in a rule position or for a
rule that is not followed by a character.  Otherwise every element
of ARGS is treated as a character.
With no ARGS, the result is just FIRST-COMPONENT as a string."
  (if (null args)
      (char-to-string first-component)
    (let* ((with-rule (consp (car args)))
           ;; The header is the composition leading code, followed by
           ;; ?\xFF when composition rules are embedded.
           (header (if with-rule
                       (concat (vector leading-code-composition ?\xFF))
                     (char-to-string leading-code-composition)))
           ;; Pieces of the result, kept in reverse order so that the
           ;; whole string is built by a single `concat' at the end.
           (parts (list (compose-chars-component first-component) header)))
      (while args
        (if with-rule
            (progn
              (if (not (consp (car args)))
                  (error "Invalid composition rule: %s" (car args)))
              ;; A rule must always be followed by the character it
              ;; positions; report that clearly instead of failing
              ;; later with a type error on nil.
              (if (null (cdr args))
                  (error "Composition rule not followed by a character: %s"
                         (car args)))
              (setq parts (cons (compose-chars-rule (car args)) parts))
              (setq parts (cons (compose-chars-component (car (cdr args)))
                                parts)
                    args (cdr (cdr args))))
          (setq parts (cons (compose-chars-component (car args)) parts)
                args (cdr args))))
      (apply 'concat (nreverse parts)))))
466 | |
467 ;;;###autoload | |
(defun decompose-composite-char (char &optional type with-composition-rule)
  "Break composite character CHAR into a sequence of its components.
Optional 1st arg TYPE selects the kind of sequence returned: `string'
\(the default when TYPE is nil), `list', or `vector'.
Optional 2nd arg WITH-COMPOSITION-RULE non-nil asks for the embedded
composition rules, if CHAR has any, to be included as well.  The
elements then appear in the same order as the arguments that
`compose-chars' would take to create CHAR.
For a string result the composition rules are always left out,
whatever the value of WITH-COMPOSITION-RULE."
  (let* ((result-type (or type 'string))
         ;; Index of the last component; the loop walks down to 1 and
         ;; component 0 is added afterwards.
         (index (1- (composite-char-component-count char)))
         (emit-rules (and with-composition-rule
                          (not (eq result-type 'string))
                          (composite-char-composition-rule-p char)))
         (elements nil)
         code)
    (while (> index 0)
      (setq elements (cons (composite-char-component char index) elements))
      (if emit-rules
          ;; Unpack the rule code into (GLOBAL-REF-POINT . NEW-REF-POINT)
          ;; and place it in front of the component it belongs to.
          (setq code (- (composite-char-composition-rule char index) ?\xA0)
                elements (cons (cons (/ code 9) (% code 9)) elements)))
      (setq index (1- index)))
    (setq elements (cons (composite-char-component char 0) elements))
    (cond ((eq result-type 'list)
           elements)
          ((eq result-type 'string)
           (apply 'concat-chars elements))
          (t                            ; any other TYPE yields a vector
           (vconcat elements)))))
499 | |
500 ;;; mule-util.el ends here |