Mercurial > emacs
annotate src/category.c @ 25507:b9b4581adf36
(Fsubst_char_in_region): Adjust the way to check byte-combining
possibility for the new handling of multibyte sequence.
author | Kenichi Handa <handa@m17n.org> |
---|---|
date | Fri, 03 Sep 1999 01:28:42 +0000 |
parents | 63628f8fe648 |
children | 0a7261c1d487 |
rev | line source |
---|---|
17052 | 1 /* GNU Emacs routines to deal with category tables. |
18341
33e78cc7f058
Change copyright notices.
Richard M. Stallman <rms@gnu.org>
parents:
17787
diff
changeset
|
2 Copyright (C) 1995, 1997 Electrotechnical Laboratory, JAPAN. |
33e78cc7f058
Change copyright notices.
Richard M. Stallman <rms@gnu.org>
parents:
17787
diff
changeset
|
3 Licensed to the Free Software Foundation. |
17052 | 4 |
5 This file is part of GNU Emacs. | |
6 | |
7 GNU Emacs is free software; you can redistribute it and/or modify | |
8 it under the terms of the GNU General Public License as published by | |
9 the Free Software Foundation; either version 2, or (at your option) | |
10 any later version. | |
11 | |
12 GNU Emacs is distributed in the hope that it will be useful, | |
13 but WITHOUT ANY WARRANTY; without even the implied warranty of | |
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
15 GNU General Public License for more details. | |
16 | |
17 You should have received a copy of the GNU General Public License | |
18 along with GNU Emacs; see the file COPYING. If not, write to | |
17071 | 19 the Free Software Foundation, Inc., 59 Temple Place - Suite 330, |
20 Boston, MA 02111-1307, USA. */ | |
17052 | 21 |
22 | |
23 /* Here we handle three objects: category, category set, and category | |
24 table. Read comments in the file category.h to understand them. */ | |
25 | |
26 #include <config.h> | |
27 #include <ctype.h> | |
28 #include "lisp.h" | |
29 #include "buffer.h" | |
30 #include "charset.h" | |
31 #include "category.h" | |
32 | |
33 /* The version number of the latest category table. Each category | |
34 table has a unique version number. It is assigned a new number | |
35 also when it is modified. When a regular expression is compiled | |
36 into the struct re_pattern_buffer, the version number of the | |
37 category table (of the current buffer) at that moment is also | |
38 embedded in the structure. | |
39 | |
40 For the moment, we are not using this feature. */ | |
41 static int category_table_version; | |
42 | |
43 Lisp_Object Qcategory_table, Qcategoryp, Qcategorysetp, Qcategory_table_p; | |
44 | |
45 /* Variables to determine word boundary. */ | |
46 Lisp_Object Vword_combining_categories, Vword_separating_categories; | |
47 | |
48 /* Temporary internal variable used in macro CHAR_HAS_CATEGORY. */ | |
49 Lisp_Object _temp_category_set; | |
50 | |
51 | |
52 /* Category set staff. */ | |
53 | |
54 DEFUN ("make-category-set", Fmake_category_set, Smake_category_set, 1, 1, 0, | |
55 "Return a newly created category-set which contains CATEGORIES.\n\ | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
56 CATEGORIES is a string of category mnemonics.\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
57 The value is a bool-vector which has t at the indices corresponding to\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
58 those categories.") |
17052 | 59 (categories) |
60 Lisp_Object categories; | |
61 { | |
62 Lisp_Object val; | |
63 int len; | |
64 | |
65 CHECK_STRING (categories, 0); | |
66 val = MAKE_CATEGORY_SET; | |
67 | |
20612
5a0922f8c841
(Fmake_category_set): Don't allow multibyte string.
Richard M. Stallman <rms@gnu.org>
parents:
20189
diff
changeset
|
68 if (STRING_MULTIBYTE (categories)) |
5a0922f8c841
(Fmake_category_set): Don't allow multibyte string.
Richard M. Stallman <rms@gnu.org>
parents:
20189
diff
changeset
|
69 error ("Multibyte string in make-category-set"); |
5a0922f8c841
(Fmake_category_set): Don't allow multibyte string.
Richard M. Stallman <rms@gnu.org>
parents:
20189
diff
changeset
|
70 |
17052 | 71 len = XSTRING (categories)->size; |
72 while (--len >= 0) | |
73 { | |
17369
566b26e1930e
(Fmake_category_set): Use XSETFASTINT.
Karl Heuer <kwzh@gnu.org>
parents:
17324
diff
changeset
|
74 Lisp_Object category; |
17052 | 75 |
17369
566b26e1930e
(Fmake_category_set): Use XSETFASTINT.
Karl Heuer <kwzh@gnu.org>
parents:
17324
diff
changeset
|
76 XSETFASTINT (category, XSTRING (categories)->data[len]); |
17052 | 77 CHECK_CATEGORY (category, 0); |
78 SET_CATEGORY_SET (val, category, Qt); | |
79 } | |
80 return val; | |
81 } | |
82 | |
83 | |
84 /* Category staff. */ | |
85 | |
86 Lisp_Object check_category_table (); | |
87 | |
88 DEFUN ("define-category", Fdefine_category, Sdefine_category, 2, 3, 0, | |
89 "Define CHAR as a category which is described by DOCSTRING.\n\ | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
90 CHAR should be an ASCII printing character in the range ` ' to `~'.\n\ |
17052 | 91 DOCSTRING is a documentation string of the category.\n\ |
92 The category is defined only in category table TABLE, which defaults to\n\ | |
93 the current buffer's category table.") | |
94 (category, docstring, table) | |
95 Lisp_Object category, docstring, table; | |
96 { | |
97 CHECK_CATEGORY (category, 0); | |
98 CHECK_STRING (docstring, 1); | |
99 table = check_category_table (table); | |
100 | |
101 if (!NILP (CATEGORY_DOCSTRING (table, XFASTINT (category)))) | |
102 error ("Category `%c' is already defined", XFASTINT (category)); | |
103 CATEGORY_DOCSTRING (table, XFASTINT (category)) = docstring; | |
104 | |
105 return Qnil; | |
106 } | |
107 | |
108 DEFUN ("category-docstring", Fcategory_docstring, Scategory_docstring, 1, 2, 0, | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
109 "Return the documentation string of CATEGORY, as defined in CATEGORY-TABLE.") |
17052 | 110 (category, table) |
111 Lisp_Object category, table; | |
112 { | |
113 Lisp_Object doc; | |
114 | |
115 CHECK_CATEGORY (category, 0); | |
116 table = check_category_table (table); | |
117 | |
118 return CATEGORY_DOCSTRING (table, XFASTINT (category)); | |
119 } | |
120 | |
121 DEFUN ("get-unused-category", Fget_unused_category, Sget_unused_category, | |
122 0, 1, 0, | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
123 "Return a category which is not yet defined in CATEGORY-TABLE.\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
124 If no category remains available, return nil.\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
125 The optional argument CATEGORY-TABLE specifies which category table\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
126 to modify; it defaults to the current buffer's category table.") |
17052 | 127 (table) |
128 Lisp_Object table; | |
129 { | |
130 int i; | |
131 Lisp_Object docstring_vector; | |
132 | |
133 table = check_category_table (table); | |
134 | |
135 for (i = ' '; i <= '~'; i++) | |
136 if (NILP (CATEGORY_DOCSTRING (table, i))) | |
137 return make_number (i); | |
138 | |
139 return Qnil; | |
140 } | |
141 | |
142 | |
143 /* Category-table staff. */ | |
144 | |
145 DEFUN ("category-table-p", Fcategory_table_p, Scategory_table_p, 1, 1, 0, | |
146 "Return t if ARG is a category table.") | |
147 (arg) | |
148 Lisp_Object arg; | |
149 { | |
150 if (CHAR_TABLE_P (arg) | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
151 && EQ (XCHAR_TABLE (arg)->purpose, Qcategory_table)) |
17052 | 152 return Qt; |
153 return Qnil; | |
154 } | |
155 | |
156 /* If TABLE is nil, return the current category table. If TABLE is | |
157 not nil, check the validity of TABLE as a category table. If | |
158 valid, return TABLE itself, but if not valid, signal an error of | |
159 wrong-type-argument. */ | |
160 | |
161 Lisp_Object | |
162 check_category_table (table) | |
163 Lisp_Object table; | |
164 { | |
165 register Lisp_Object tem; | |
166 if (NILP (table)) | |
167 return current_buffer->category_table; | |
168 while (tem = Fcategory_table_p (table), NILP (tem)) | |
169 table = wrong_type_argument (Qcategory_table_p, table); | |
170 return table; | |
171 } | |
172 | |
173 DEFUN ("category-table", Fcategory_table, Scategory_table, 0, 0, 0, | |
174 "Return the current category table.\n\ | |
175 This is the one specified by the current buffer.") | |
176 () | |
177 { | |
178 return current_buffer->category_table; | |
179 } | |
180 | |
181 DEFUN ("standard-category-table", Fstandard_category_table, | |
182 Sstandard_category_table, 0, 0, 0, | |
183 "Return the standard category table.\n\ | |
184 This is the one used for new buffers.") | |
185 () | |
186 { | |
187 return Vstandard_category_table; | |
188 } | |
189 | |
190 /* Return a copy of category table TABLE. We can't simply use the | |
191 function copy-sequence because no contents should be shared between | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
192 the original and the copy. This function is called recursively by |
20189
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
193 binding TABLE to a sub char table. */ |
17052 | 194 |
195 Lisp_Object | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
196 copy_category_table (table) |
17052 | 197 Lisp_Object table; |
198 { | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
199 Lisp_Object tmp; |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
200 int i, to; |
17052 | 201 |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
202 if (!NILP (XCHAR_TABLE (table)->top)) |
17052 | 203 { |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
204 /* TABLE is a top level char table. |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
205 At first, make a copy of tree structure of the table. */ |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
206 table = Fcopy_sequence (table); |
17052 | 207 |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
208 /* Then, copy elements for single byte characters one by one. */ |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
209 for (i = 0; i < CHAR_TABLE_SINGLE_BYTE_SLOTS; i++) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
210 if (!NILP (tmp = XCHAR_TABLE (table)->contents[i])) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
211 XCHAR_TABLE (table)->contents[i] = Fcopy_sequence (tmp); |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
212 to = CHAR_TABLE_ORDINARY_SLOTS; |
20189
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
213 |
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
214 /* Also copy the first (and sole) extra slot. It is a vector |
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
215 containing docstring of each category. */ |
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
216 Fset_char_table_extra_slot |
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
217 (table, make_number (0), |
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
218 Fcopy_sequence (Fchar_table_extra_slot (table, make_number (0)))); |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
219 } |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
220 else |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
221 { |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
222 i = 32; |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
223 to = SUB_CHAR_TABLE_ORDINARY_SLOTS; |
17052 | 224 } |
225 | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
226 /* If the table has non-nil default value, copy it. */ |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
227 if (!NILP (tmp = XCHAR_TABLE (table)->defalt)) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
228 XCHAR_TABLE (table)->defalt = Fcopy_sequence (tmp); |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
229 |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
230 /* At last, copy the remaining elements while paying attention to a |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
231 sub char table. */ |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
232 for (; i < to; i++) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
233 if (!NILP (tmp = XCHAR_TABLE (table)->contents[i])) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
234 XCHAR_TABLE (table)->contents[i] |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
235 = (SUB_CHAR_TABLE_P (tmp) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
236 ? copy_category_table (tmp) : Fcopy_sequence (tmp)); |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
237 |
17052 | 238 return table; |
239 } | |
240 | |
241 DEFUN ("copy-category-table", Fcopy_category_table, Scopy_category_table, | |
242 0, 1, 0, | |
243 "Construct a new category table and return it.\n\ | |
244 It is a copy of the TABLE, which defaults to the standard category table.") | |
245 (table) | |
246 Lisp_Object table; | |
247 { | |
248 if (!NILP (table)) | |
249 check_category_table (table); | |
250 else | |
251 table = Vstandard_category_table; | |
252 | |
20189
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
253 return copy_category_table (table); |
17052 | 254 } |
255 | |
256 DEFUN ("set-category-table", Fset_category_table, Sset_category_table, 1, 1, 0, | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
257 "Specify TABLE as the category table for the current buffer.") |
17052 | 258 (table) |
259 Lisp_Object table; | |
260 { | |
261 table = check_category_table (table); | |
262 current_buffer->category_table = table; | |
263 /* Indicate that this buffer now has a specified category table. */ | |
264 current_buffer->local_var_flags | |
265 |= XFASTINT (buffer_local_flags.category_table); | |
266 return table; | |
267 } | |
268 | |
269 | |
270 DEFUN ("char-category-set", Fchar_category_set, Schar_category_set, 1, 1, 0, | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
271 "Return the category set of CHAR.") |
17052 | 272 (ch) |
273 Lisp_Object ch; | |
274 { | |
275 Lisp_Object val; | |
276 int charset; | |
277 unsigned char c1, c2; | |
278 | |
279 CHECK_NUMBER (ch, 0); | |
280 return CATEGORY_SET (XFASTINT (ch)); | |
281 } | |
282 | |
283 DEFUN ("category-set-mnemonics", Fcategory_set_mnemonics, | |
284 Scategory_set_mnemonics, 1, 1, 0, | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
285 "Return a string containing mnemonics of the categories in CATEGORY-SET.\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
286 CATEGORY-SET is a bool-vector, and the categories \"in\" it are those\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
287 that are indexes where t occurs the bool-vector.\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
288 The return value is a string containing those same categories.") |
17052 | 289 (category_set) |
290 Lisp_Object category_set; | |
291 { | |
292 int i, j; | |
293 char str[96]; | |
294 | |
295 CHECK_CATEGORY_SET (category_set, 0); | |
296 | |
297 j = 0; | |
298 for (i = 32; i < 127; i++) | |
299 if (CATEGORY_MEMBER (i, category_set)) | |
300 str[j++] = i; | |
301 str[j] = '\0'; | |
302 | |
303 return build_string (str); | |
304 } | |
305 | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
306 /* Modify all category sets stored under sub char-table TABLE so that |
17052 | 307 they contain (SET_VALUE is t) or don't contain (SET_VALUE is nil) |
308 CATEGORY. */ | |
309 | |
310 void | |
311 modify_lower_category_set (table, category, set_value) | |
312 Lisp_Object table, category, set_value; | |
313 { | |
314 Lisp_Object val; | |
315 int i; | |
316 | |
317 if (NILP (XCHAR_TABLE (table)->defalt)) | |
318 { | |
319 val = MAKE_CATEGORY_SET; | |
320 SET_CATEGORY_SET (val, category, set_value); | |
321 XCHAR_TABLE (table)->defalt = val; | |
322 } | |
323 | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
324 for (i = 32; i < SUB_CHAR_TABLE_ORDINARY_SLOTS; i++) |
17052 | 325 { |
326 val = XCHAR_TABLE (table)->contents[i]; | |
327 | |
328 if (CATEGORY_SET_P (val)) | |
329 SET_CATEGORY_SET (val, category, set_value); | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
330 else if (SUB_CHAR_TABLE_P (val)) |
17052 | 331 modify_lower_category_set (val, category, set_value); |
332 } | |
333 } | |
334 | |
335 void | |
336 set_category_set (category_set, category, val) | |
337 Lisp_Object category_set, category, val; | |
338 { | |
339 do { | |
340 int idx = XINT (category) / 8; | |
341 unsigned char bits = 1 << (XINT (category) % 8); | |
342 | |
343 if (NILP (val)) | |
344 XCATEGORY_SET (category_set)->data[idx] &= ~bits; | |
345 else | |
346 XCATEGORY_SET (category_set)->data[idx] |= bits; | |
347 } while (0); | |
348 } | |
349 | |
350 DEFUN ("modify-category-entry", Fmodify_category_entry, | |
351 Smodify_category_entry, 2, 4, 0, | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
352 "Modify the category set of CHARACTER by adding CATEGORY to it.\n\ |
17052 | 353 The category is changed only for table TABLE, which defaults to\n\ |
354 the current buffer's category table.\n\ | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
355 If optional fourth argument RESET is non-nil,\n\ |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
356 then delete CATEGORY from the category set instead of adding it.") |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
357 (character, category, table, reset) |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
358 Lisp_Object character, category, table, reset; |
17052 | 359 { |
360 int c, charset, c1, c2; | |
361 Lisp_Object set_value; /* Actual value to be set in category sets. */ | |
362 Lisp_Object val, category_set; | |
363 | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
364 CHECK_NUMBER (character, 0); |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
365 c = XINT (character); |
17052 | 366 CHECK_CATEGORY (category, 1); |
367 table = check_category_table (table); | |
368 | |
369 if (NILP (CATEGORY_DOCSTRING (table, XFASTINT (category)))) | |
370 error ("Undefined category: %c", XFASTINT (category)); | |
371 | |
372 set_value = NILP (reset) ? Qt : Qnil; | |
373 | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
374 if (c < CHAR_TABLE_SINGLE_BYTE_SLOTS) |
17052 | 375 { |
376 val = XCHAR_TABLE (table)->contents[c]; | |
377 if (!CATEGORY_SET_P (val)) | |
378 XCHAR_TABLE (table)->contents[c] = (val = MAKE_CATEGORY_SET); | |
379 SET_CATEGORY_SET (val, category, set_value); | |
380 return Qnil; | |
381 } | |
382 | |
383 SPLIT_NON_ASCII_CHAR (c, charset, c1, c2); | |
384 | |
385 /* The top level table. */ | |
17187
9ab0c08a3359
Adjusted for the change of CHAR_TABLE_ORDINARY_SLOTS.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
386 val = XCHAR_TABLE (table)->contents[charset + 128]; |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
387 if (CATEGORY_SET_P (val)) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
388 category_set = val; |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
389 else if (!SUB_CHAR_TABLE_P (val)) |
17052 | 390 { |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
391 category_set = val = MAKE_CATEGORY_SET; |
17187
9ab0c08a3359
Adjusted for the change of CHAR_TABLE_ORDINARY_SLOTS.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
392 XCHAR_TABLE (table)->contents[charset + 128] = category_set; |
17052 | 393 } |
394 | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
395 if (c1 <= 0) |
17052 | 396 { |
397 /* Only a charset is specified. */ | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
398 if (SUB_CHAR_TABLE_P (val)) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
399 /* All characters in CHARSET should be the same as for having |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
400 CATEGORY or not. */ |
17052 | 401 modify_lower_category_set (val, category, set_value); |
402 else | |
403 SET_CATEGORY_SET (category_set, category, set_value); | |
404 return Qnil; | |
405 } | |
406 | |
407 /* The second level table. */ | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
408 if (!SUB_CHAR_TABLE_P (val)) |
17052 | 409 { |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
410 val = make_sub_char_table (Qnil); |
17187
9ab0c08a3359
Adjusted for the change of CHAR_TABLE_ORDINARY_SLOTS.
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
411 XCHAR_TABLE (table)->contents[charset + 128] = val; |
17052 | 412 /* We must set default category set of CHARSET in `defalt' slot. */ |
413 XCHAR_TABLE (val)->defalt = category_set; | |
414 } | |
415 table = val; | |
416 | |
417 val = XCHAR_TABLE (table)->contents[c1]; | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
418 if (CATEGORY_SET_P (val)) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
419 category_set = val; |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
420 else if (!SUB_CHAR_TABLE_P (val)) |
17052 | 421 { |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
422 category_set = val = Fcopy_sequence (XCHAR_TABLE (table)->defalt); |
17052 | 423 XCHAR_TABLE (table)->contents[c1] = category_set; |
424 } | |
425 | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
426 if (c2 <= 0) |
17052 | 427 { |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
428 if (SUB_CHAR_TABLE_P (val)) |
17052 | 429 /* All characters in C1 group of CHARSET should be the same as |
430 for CATEGORY. */ | |
431 modify_lower_category_set (val, category, set_value); | |
432 else | |
433 SET_CATEGORY_SET (category_set, category, set_value); | |
434 return Qnil; | |
435 } | |
436 | |
437 /* The third (bottom) level table. */ | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
438 if (!SUB_CHAR_TABLE_P (val)) |
17052 | 439 { |
17459
22fc94ab9e79
(Fmodify_category_entry): Delete second arg in call to make_sub_char_table.
Karl Heuer <kwzh@gnu.org>
parents:
17369
diff
changeset
|
440 val = make_sub_char_table (Qnil); |
17052 | 441 XCHAR_TABLE (table)->contents[c1] = val; |
442 /* We must set default category set of CHARSET and C1 in | |
443 `defalt' slot. */ | |
444 XCHAR_TABLE (val)->defalt = category_set; | |
445 } | |
446 table = val; | |
447 | |
448 val = XCHAR_TABLE (table)->contents[c2]; | |
17324
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
449 if (CATEGORY_SET_P (val)) |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
450 category_set = val; |
ed53084a1655
(category-table-p): Check only type and purpose.
Kenichi Handa <handa@m17n.org>
parents:
17187
diff
changeset
|
451 else if (!SUB_CHAR_TABLE_P (val)) |
17052 | 452 { |
453 category_set = Fcopy_sequence (XCHAR_TABLE (table)->defalt); | |
454 XCHAR_TABLE (table)->contents[c2] = category_set; | |
455 } | |
456 else | |
457 /* This should never happen. */ | |
458 error ("Invalid category table"); | |
459 | |
460 SET_CATEGORY_SET (category_set, category, set_value); | |
461 | |
462 return Qnil; | |
463 } | |
464 | |
465 /* Dump category table to buffer in human-readable format */ | |
466 | |
467 static void | |
468 describe_category (value) | |
469 Lisp_Object value; | |
470 { | |
471 Lisp_Object mnemonics; | |
472 | |
473 Findent_to (make_number (16), make_number (1)); | |
474 | |
475 if (NILP (value)) | |
476 { | |
477 insert_string ("default\n"); | |
478 return; | |
479 } | |
480 | |
19659
315acc2627fe
(describe_category): Handle a sub-chartable.
Richard M. Stallman <rms@gnu.org>
parents:
18613
diff
changeset
|
481 if (CHAR_TABLE_P (value)) |
315acc2627fe
(describe_category): Handle a sub-chartable.
Richard M. Stallman <rms@gnu.org>
parents:
18613
diff
changeset
|
482 { |
315acc2627fe
(describe_category): Handle a sub-chartable.
Richard M. Stallman <rms@gnu.org>
parents:
18613
diff
changeset
|
483 insert_string ("deeper char-table ...\n"); |
315acc2627fe
(describe_category): Handle a sub-chartable.
Richard M. Stallman <rms@gnu.org>
parents:
18613
diff
changeset
|
484 return; |
315acc2627fe
(describe_category): Handle a sub-chartable.
Richard M. Stallman <rms@gnu.org>
parents:
18613
diff
changeset
|
485 } |
315acc2627fe
(describe_category): Handle a sub-chartable.
Richard M. Stallman <rms@gnu.org>
parents:
18613
diff
changeset
|
486 |
17052 | 487 if (!CATEGORY_SET_P (value)) |
488 { | |
489 insert_string ("invalid\n"); | |
490 return; | |
491 } | |
492 | |
493 mnemonics = Fcategory_set_mnemonics (value); | |
20612
5a0922f8c841
(Fmake_category_set): Don't allow multibyte string.
Richard M. Stallman <rms@gnu.org>
parents:
20189
diff
changeset
|
494 insert_from_string (mnemonics, 0, 0, XSTRING (mnemonics)->size, |
21244
50929073a0ba
Use STRING_BYTES and SET_STRING_BYTES.
Richard M. Stallman <rms@gnu.org>
parents:
20825
diff
changeset
|
495 STRING_BYTES (XSTRING (mnemonics)), 0); |
17052 | 496 insert_string ("\n"); |
497 return; | |
498 } | |
499 | |
500 static Lisp_Object | |
501 describe_category_1 (vector) | |
502 Lisp_Object vector; | |
503 { | |
504 struct buffer *old = current_buffer; | |
505 set_buffer_internal (XBUFFER (Vstandard_output)); | |
17787
eacf563a6d0d
(describe_category_1): Pass new args to describe_vector.
Richard M. Stallman <rms@gnu.org>
parents:
17459
diff
changeset
|
506 describe_vector (vector, Qnil, describe_category, 0, Qnil, Qnil, |
eacf563a6d0d
(describe_category_1): Pass new args to describe_vector.
Richard M. Stallman <rms@gnu.org>
parents:
17459
diff
changeset
|
507 (int *)0, 0); |
17052 | 508 { |
509 int i; | |
510 Lisp_Object docs = XCHAR_TABLE (vector)->extras[0]; | |
511 Lisp_Object elt; | |
512 | |
513 if (!VECTORP (docs) || XVECTOR (docs)->size != 95) | |
514 { | |
515 insert_string ("Invalid first extra slot in this char table\n"); | |
516 return Qnil; | |
517 } | |
518 | |
519 insert_string ("Meanings of mnemonice characters are:\n"); | |
520 for (i = 0; i < 95; i++) | |
521 { | |
522 elt = XVECTOR (docs)->contents[i]; | |
523 if (NILP (elt)) | |
524 continue; | |
525 | |
526 insert_char (i + 32); | |
527 insert (": ", 2); | |
20612
5a0922f8c841
(Fmake_category_set): Don't allow multibyte string.
Richard M. Stallman <rms@gnu.org>
parents:
20189
diff
changeset
|
528 insert_from_string (elt, 0, 0, XSTRING (elt)->size, |
21244
50929073a0ba
Use STRING_BYTES and SET_STRING_BYTES.
Richard M. Stallman <rms@gnu.org>
parents:
20825
diff
changeset
|
529 STRING_BYTES (XSTRING (elt)), 0); |
17052 | 530 insert ("\n", 1); |
531 } | |
532 } | |
533 | |
534 while (! NILP (XCHAR_TABLE (vector)->parent)) | |
535 { | |
536 vector = XCHAR_TABLE (vector)->parent; | |
537 insert_string ("\nThe parent category table is:"); | |
17787
eacf563a6d0d
(describe_category_1): Pass new args to describe_vector.
Richard M. Stallman <rms@gnu.org>
parents:
17459
diff
changeset
|
538 describe_vector (vector, Qnil, describe_category, 0, Qnil, Qnil, |
eacf563a6d0d
(describe_category_1): Pass new args to describe_vector.
Richard M. Stallman <rms@gnu.org>
parents:
17459
diff
changeset
|
539 (int *) 0, 0); |
17052 | 540 } |
541 | |
542 call0 (intern ("help-mode")); | |
543 set_buffer_internal (old); | |
544 return Qnil; | |
545 } | |
546 | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
547 DEFUN ("describe-categories", Fdescribe_categories, Sdescribe_categories, 0, 0, "", |
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
548 "Describe the category specifications in the current category table.\n\ |
17052 | 549 The descriptions are inserted in a buffer, which is then displayed.") |
550 () | |
551 { | |
552 internal_with_output_to_temp_buffer | |
553 ("*Help*", describe_category_1, current_buffer->category_table); | |
554 | |
555 return Qnil; | |
556 } | |
557 | |
558 /* Return 1 if there is a word boundary between two word-constituent | |
559 characters C1 and C2 if they appear in this order, else return 0. | |
560 Use the macro WORD_BOUNDARY_P instead of calling this function | |
561 directly. */ | |
562 | |
563 int | |
564 word_boundary_p (c1, c2) | |
565 int c1, c2; | |
566 { | |
567 Lisp_Object category_set1, category_set2; | |
568 Lisp_Object tail; | |
569 int default_result; | |
570 | |
23755
63628f8fe648
(word_boundary_p): If C1 or C2 are composite
Kenichi Handa <handa@m17n.org>
parents:
23543
diff
changeset
|
571 if (COMPOSITE_CHAR_P (c1)) |
63628f8fe648
(word_boundary_p): If C1 or C2 are composite
Kenichi Handa <handa@m17n.org>
parents:
23543
diff
changeset
|
572 c1 = cmpchar_component (c1, 0, 1); |
63628f8fe648
(word_boundary_p): If C1 or C2 are composite
Kenichi Handa <handa@m17n.org>
parents:
23543
diff
changeset
|
573 if (COMPOSITE_CHAR_P (c2)) |
63628f8fe648
(word_boundary_p): If C1 or C2 are composite
Kenichi Handa <handa@m17n.org>
parents:
23543
diff
changeset
|
574 c2 = cmpchar_component (c2, 0, 1); |
63628f8fe648
(word_boundary_p): If C1 or C2 are composite
Kenichi Handa <handa@m17n.org>
parents:
23543
diff
changeset
|
575 |
17052 | 576 if (CHAR_CHARSET (c1) == CHAR_CHARSET (c2)) |
577 { | |
578 tail = Vword_separating_categories; | |
579 default_result = 0; | |
580 } | |
581 else | |
582 { | |
583 tail = Vword_combining_categories; | |
584 default_result = 1; | |
585 } | |
586 | |
587 category_set1 = CATEGORY_SET (c1); | |
588 if (NILP (category_set1)) | |
589 return default_result; | |
590 category_set2 = CATEGORY_SET (c2); | |
591 if (NILP (category_set2)) | |
592 return default_result; | |
593 | |
594 for (; CONSP (tail); tail = XCONS (tail)->cdr) | |
595 { | |
596 Lisp_Object elt = XCONS(tail)->car; | |
597 | |
598 if (CONSP (elt) | |
599 && CATEGORYP (XCONS (elt)->car) | |
600 && CATEGORYP (XCONS (elt)->cdr) | |
18613
614b916ff5bf
Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents:
18341
diff
changeset
|
601 && CATEGORY_MEMBER (XFASTINT (XCONS (elt)->car), category_set1) |
614b916ff5bf
Fix bugs with inappropriate mixing of Lisp_Object with int.
Richard M. Stallman <rms@gnu.org>
parents:
18341
diff
changeset
|
602 && CATEGORY_MEMBER (XFASTINT (XCONS (elt)->cdr), category_set2)) |
17052 | 603 return !default_result; |
604 } | |
605 return default_result; | |
606 } | |
607 | |
608 | |
21514 | 609 void |
17052 | 610 init_category_once () |
611 { | |
612 /* This has to be done here, before we call Fmake_char_table. */ | |
613 Qcategory_table = intern ("category-table"); | |
614 staticpro (&Qcategory_table); | |
615 | |
616 /* Intern this now in case it isn't already done. | |
617 Setting this variable twice is harmless. | |
618 But don't staticpro it here--that is done in alloc.c. */ | |
619 Qchar_table_extra_slots = intern ("char-table-extra-slots"); | |
620 | |
621 /* Now we are ready to set up this property, so we can | |
622 create category tables. */ | |
623 Fput (Qcategory_table, Qchar_table_extra_slots, make_number (2)); | |
624 | |
625 Vstandard_category_table = Fmake_char_table (Qcategory_table, Qnil); | |
626 /* Set a category set which contains nothing to the default. */ | |
627 XCHAR_TABLE (Vstandard_category_table)->defalt = MAKE_CATEGORY_SET; | |
20189
16f5b56c2f68
(copy_category_table): Copy also the first extra slot
Kenichi Handa <handa@m17n.org>
parents:
19659
diff
changeset
|
628 Fset_char_table_extra_slot (Vstandard_category_table, make_number (0), |
17052 | 629 Fmake_vector (make_number (95), Qnil)); |
630 } | |
631 | |
21514 | 632 void |
17052 | 633 syms_of_category () |
634 { | |
635 Qcategoryp = intern ("categoryp"); | |
636 staticpro (&Qcategoryp); | |
637 Qcategorysetp = intern ("categorysetp"); | |
638 staticpro (&Qcategorysetp); | |
639 Qcategory_table_p = intern ("category-table-p"); | |
640 staticpro (&Qcategory_table_p); | |
641 | |
642 DEFVAR_LISP ("word-combining-categories", &Vword_combining_categories, | |
643 "List of pair (cons) of categories to determine word boundary.\n\ | |
644 \n\ | |
645 Emacs treats a sequence of word constituent characters as a single\n\ | |
646 word (i.e. finds no word boundary between them) iff they belongs to\n\ | |
647 the same charset. But, exceptions are allowed in the following cases.\n\ | |
648 \n\ | |
23543
6f3b920860e5
(syms_of_category): Doc-string modified.
Kenichi Handa <handa@m17n.org>
parents:
21514
diff
changeset
|
649 \(1) The case that characters are in different charsets is controlled\n\ |
17052 | 650 by the variable `word-combining-categories'.\n\ |
651 \n\ | |
652 Emacs finds no word boundary between characters of different charsets\n\ | |
653 if they have categories matching some element of this list.\n\ | |
654 \n\ | |
655 More precisely, if an element of this list is a cons of category CAT1\n\ | |
656 and CAT2, and a multibyte character C1 which has CAT1 is followed by\n\ | |
657 C2 which has CAT2, there's no word boundary between C1 and C2.\n\ | |
658 \n\ | |
659 For instance, to tell that ASCII characters and Latin-1 characters can\n\ | |
660 form a single word, the element `(?l . ?l)' should be in this list\n\ | |
661 because both characters have the category `l' (Latin characters).\n\ | |
662 \n\ | |
23543
6f3b920860e5
(syms_of_category): Doc-string modified.
Kenichi Handa <handa@m17n.org>
parents:
21514
diff
changeset
|
663 \(2) The case that character are in the same charset is controlled by\n\ |
17052 | 664 the variable `word-separating-categories'.\n\ |
665 \n\ | |
666 Emacs find a word boundary between characters of the same charset\n\ | |
667 if they have categories matching some element of this list.\n\ | |
668 \n\ | |
669 More precisely, if an element of this list is a cons of category CAT1\n\ | |
670 and CAT2, and a multibyte character C1 which has CAT1 is followed by\n\ | |
671 C2 which has CAT2, there's a word boundary between C1 and C2.\n\ | |
672 \n\ | |
673 For instance, to tell that there's a word boundary between Japanese\n\ | |
674 Hiragana and Japanese Kanji (both are in the same charset), the\n\ | |
675 element `(?H . ?C) should be in this list."); | |
676 | |
677 Vword_combining_categories = Qnil; | |
678 | |
679 DEFVAR_LISP ("word-separating-categories", &Vword_separating_categories, | |
680 "List of pair (cons) of categories to determine word boundary.\n\ | |
681 See the documentation of the variable `word-combining-categories'."); | |
682 | |
683 Vword_separating_categories = Qnil; | |
684 | |
685 defsubr (&Smake_category_set); | |
686 defsubr (&Sdefine_category); | |
687 defsubr (&Scategory_docstring); | |
688 defsubr (&Sget_unused_category); | |
689 defsubr (&Scategory_table_p); | |
690 defsubr (&Scategory_table); | |
691 defsubr (&Sstandard_category_table); | |
692 defsubr (&Scopy_category_table); | |
693 defsubr (&Sset_category_table); | |
694 defsubr (&Schar_category_set); | |
695 defsubr (&Scategory_set_mnemonics); | |
696 defsubr (&Smodify_category_entry); | |
20825
1b98a0ab1bee
(Fmodify_category_entry): Doc fix.
Richard M. Stallman <rms@gnu.org>
parents:
20612
diff
changeset
|
697 defsubr (&Sdescribe_categories); |
17052 | 698 |
699 category_table_version = 0; | |
700 } |