Mercurial > emacs
annotate src/charset.h @ 88769:9714c10f165d
(set-locale-environment): Use
locale-codeset.
author | Dave Love <fx@gnu.org> |
---|---|
date | Sun, 16 Jun 2002 11:43:54 +0000 |
parents | 5b9a72e491d4 |
children | 0a02d452fece |
rev | line source |
---|---|
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
1 /* Header for charset handler. |
20708 | 2 Copyright (C) 1995, 1997, 1998 Electrotechnical Laboratory, JAPAN. |
18341
33e78cc7f058
Change copyright notices.
Richard M. Stallman <rms@gnu.org>
parents:
17833
diff
changeset
|
3 Licensed to the Free Software Foundation. |
38395
b7a9187751b2
(CHAR_STRING_NO_SIGNAL): New macro.
Gerd Moellmann <gerd@gnu.org>
parents:
35949
diff
changeset
|
4 Copyright (C) 2001 Free Software Foundation, Inc. |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
5 Copyright (C) 2001, 2002 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
6 National Institute of Advanced Industrial Science and Technology (AIST) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
7 Registration Number H13PRO009 |
17052 | 8 |
17071 | 9 This file is part of GNU Emacs. |
10 | |
11 GNU Emacs is free software; you can redistribute it and/or modify | |
12 it under the terms of the GNU General Public License as published by | |
13 the Free Software Foundation; either version 2, or (at your option) | |
14 any later version. | |
17052 | 15 |
17071 | 16 GNU Emacs is distributed in the hope that it will be useful, |
17 but WITHOUT ANY WARRANTY; without even the implied warranty of | |
18 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
19 GNU General Public License for more details. | |
17052 | 20 |
17071 | 21 You should have received a copy of the GNU General Public License |
22 along with GNU Emacs; see the file COPYING. If not, write to | |
23 the Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
24 Boston, MA 02111-1307, USA. */ | |
17052 | 25 |
29570
825505ff211e
(EMACS_CHARSET_H): Renamed from _CHARSET_H.
Kenichi Handa <handa@m17n.org>
parents:
29539
diff
changeset
|
26 #ifndef EMACS_CHARSET_H |
825505ff211e
(EMACS_CHARSET_H): Renamed from _CHARSET_H.
Kenichi Handa <handa@m17n.org>
parents:
29539
diff
changeset
|
27 #define EMACS_CHARSET_H |
17052 | 28 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
29 /* Index to arguments of Fdefine_charset_internal. */ |
17052 | 30 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
31 enum define_charset_arg_index |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
32 { |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
33 charset_arg_name, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
34 charset_arg_dimension, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
35 charset_arg_code_space, |
88677
61f981fb213a
(sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents:
88476
diff
changeset
|
36 charset_arg_min_code, |
61f981fb213a
(sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents:
88476
diff
changeset
|
37 charset_arg_max_code, |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
38 charset_arg_iso_final, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
39 charset_arg_iso_revision, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
40 charset_arg_emacs_mule_id, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
41 charset_arg_ascii_compatible_p, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
42 charset_arg_supplementary_p, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
43 charset_arg_invalid_code, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
44 charset_arg_code_offset, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
45 charset_arg_map, |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
46 charset_arg_subset, |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
47 charset_arg_superset, |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
48 charset_arg_unify_map, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
49 charset_arg_plist, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
50 charset_arg_max |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
51 }; |
17052 | 52 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
53 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
54 /* Indices to charset attributes vector. */ |
17052 | 55 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
56 enum charset_attr_index |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
57 { |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
58 /* ID number of the charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
59 charset_id, |
17052 | 60 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
61 /* Name of the charset (symbol). */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
62 charset_name, |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
63 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
64 /* Property list of the charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
65 charset_plist, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
66 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
67 /* If the method of the charset is `MAP_DEFERRED', the value is a |
88436 | 68 mapping vector or a file name that contains mapping vector. |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
69 Otherwise, nil. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
70 charset_map, |
17052 | 71 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
72 /* If the method of the charset is `MAP', the value is a vector |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
73 that maps code points of the charset to characters. The vector |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
74 is indexed by a character index. A character index is |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
75 calculated from a code point and the code-space table of the |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
76 charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
77 charset_decoder, |
17052 | 78 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
79 /* If the method of the charset is `MAP', the value is a |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
80 char-table that maps characters of the charset to code |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
81 points. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
82 charset_encoder, |
17052 | 83 |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
84 /* If the method of the charset is `SUBSET', the value is a vector |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
85 that has this form: |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
86 |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
87 [ CHARSET-ID MIN-CODE MAX-CODE OFFSET ] |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
88 |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
89 CHARSET-ID is an ID number of a parent charset. MIN-CODE and |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
90 MAX-CODE specify the range of characters inherited from the |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
91 parent. OFFSET is an integer value to add to a code point of |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
92 the parent charset to get the corresponding code point of this |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
93 charset. */ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
94 charset_subset, |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
95 |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
96 /* If the method of the charset is `SUPERSET', the value is a list |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
97 whose elements have this form: |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
98 |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
99 (CHARSET-ID . OFFSET) |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
100 |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
101 CHARSET-IDs are ID numbers of parent charsets. OFFSET is an |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
102 integer value to add to a code point of the parent charset to |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
103 get the corresponding code point of this charset. */ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
104 charset_superset, |
17052 | 105 |
88436 | 106 /* The value is a mapping vector or a file name that contains |
107 mapping vector. This provide how characters in the charset | |
108 should be unified with Unicode. The value of the member | |
109 `charset_deunifier' is created from this information. */ | |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
110 charset_unify_map, |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
111 |
88436 | 112 /* If characters in the charset must be unified Unicode, the value |
113 is a char table that maps a character code in the charset to | |
114 the corresponding Unicode character. */ | |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
115 charset_deunifier, |
17052 | 116 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
117 /* The length of charset attribute vector. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
118 charset_attr_max |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
119 }; |
17052 | 120 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
121 /* Methods for converting code points and characters of charsets. */ |
17052 | 122 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
123 enum charset_method |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
124 { |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
125 /* For a charset of this method, a character code is calculated |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
126 from a character index (which is calculated from a code point) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
127 simply by adding an offset value. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
128 CHARSET_METHOD_OFFSET, |
17052 | 129 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
130 /* For a charset of this method, a decoder vector and an encoder |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
131 char-table is used for code point <-> character code |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
132 conversion. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
133 CHARSET_METHOD_MAP, |
17052 | 134 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
135 /* Same as above but decoder and encoder are loaded from a file on |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
136 demand. Once loaded, the method is changed to |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
137 CHARSET_METHOD_MAP. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
138 CHARSET_METHOD_MAP_DEFERRED, |
17052 | 139 |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
140 /* A charset of this method is a subset of the other charset. */ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
141 CHARSET_METHOD_SUBSET, |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
142 |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
143 /* A charset of this method is a superset of the other charsets. */ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
144 CHARSET_METHOD_SUPERSET |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
145 }; |
17052 | 146 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
147 struct charset |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
148 { |
88436 | 149 /* Index to charset_table. */ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
150 int id; |
17052 | 151 |
88436 | 152 /* Index to Vcharset_hash_table. */ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
153 int hash_index; |
17052 | 154 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
155 /* Dimension of the charset: 1, 2, 3, or 4. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
156 int dimension; |
17052 | 157 |
88476
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
158 /* Byte code range of each dimension. <code_space>[4N] is a mininum |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
159 byte code of the (N+1)th dimension, <code_space>[4N+1] is a |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
160 maximum byte code of the (N+1)th dimension, <code_space>[4N+2] is |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
161 (<code_space>[4N+1] - <code_space>[4N] + 1), <code_space>[4N+3] |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
162 is a number of characters containd in the first to (N+1)th |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
163 dismesions. We get `char-index' of a `code-point' from this |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
164 information. */ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
165 int code_space[16]; |
17052 | 166 |
88476
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
167 /* If B is a byte of Nth dimension of a code-point, the (N-1)th bit |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
168 of code_space_mask[B] is set. This array is used to quickly |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
169 check if a code-point is in a valid range. */ |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
170 unsigned char *code_space_mask; |
47c2e6825a1e
(struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents:
88436
diff
changeset
|
171 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
172 /* 1 if there's no gap in code-points. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
173 int code_linear_p; |
17052 | 174 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
175 /* If the charset is treated as 94-chars in ISO-2022, the value is 0. |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
176 If the charset is treated as 96-chars in ISO-2022, the value is 1. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
177 int iso_chars_96; |
17052 | 178 |
88436 | 179 /* ISO final byte of the charset: 48..127. It may be -1 if the |
180 charset doesn't conform to ISO-2022. */ | |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
181 int iso_final; |
17052 | 182 |
88436 | 183 /* ISO revision number of the charset. */ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
184 int iso_revision; |
17052 | 185 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
186 /* If the charset is identical to what supported by Emacs 21 and the |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
187 priors, the identification number of the charset used in those |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
188 version. Otherwise, -1. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
189 int emacs_mule_id; |
17052 | 190 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
191 /* Nonzero iff the charset is compatible with ASCII. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
192 int ascii_compatible_p; |
35478 | 193 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
194 /* Nonzero iff the charset is supplementary. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
195 int supplementary_p; |
17052 | 196 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
197 /* Nonzero iff all the code points are representable by Lisp_Int. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
198 int compact_codes_p; |
17052 | 199 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
200 /* The method for encoding/decoding characters of the charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
201 enum charset_method method; |
17052 | 202 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
203 /* Mininum and Maximum code points of the charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
204 unsigned min_code, max_code; |
17052 | 205 |
88677
61f981fb213a
(sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents:
88476
diff
changeset
|
206 /* Offset value used by macros CODE_POINT_TO_INDEX and |
61f981fb213a
(sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents:
88476
diff
changeset
|
207 INDEX_TO_CODE_POINT. . */ |
61f981fb213a
(sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents:
88476
diff
changeset
|
208 unsigned char_index_offset; |
61f981fb213a
(sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents:
88476
diff
changeset
|
209 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
210 /* Mininum and Maximum character codes of the charset. If the |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
211 charset is compatible with ASCII, min_char is a minimum non-ASCII |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
212 character of the charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
213 int min_char, max_char; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
214 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
215 /* The code returned by ENCODE_CHAR if a character is not encodable |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
216 by the charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
217 unsigned invalid_code; |
17052 | 218 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
219 /* If the method of the charset is CHARSET_METHOD_MAP, this is a |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
220 table of bits used to quickly and roughly guess if a character |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
221 belongs to the charset. |
17052 | 222 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
223 The first 64 elements are 512 bits for characters less than |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
224 0x10000. Each bit corresponds to 128-character block. The last |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
225 126 elements are 1008 bits for the greater characters |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
226 (0x10000..0x3FFFFF). Each bit corresponds to 4096-character |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
227 block. |
17052 | 228 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
229 If a bit is 1, at least one character in the corresponds block is |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
230 in this charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
231 unsigned char fast_map[190]; |
17052 | 232 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
233 /* Offset value to calculate a character code from code-point, and |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
234 visa versa. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
235 int code_offset; |
17052 | 236 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
237 int unified_p; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
238 }; |
17052 | 239 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
240 /* Hash table of charset symbols vs. the correponding attribute |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
241 vectors. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
242 extern Lisp_Object Vcharset_hash_table; |
17052 | 243 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
244 /* Table of struct charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
245 extern struct charset *charset_table; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
246 extern int charset_table_used; |
17052 | 247 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
248 #define CHARSET_FROM_ID(id) (charset_table + (id)) |
17052 | 249 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
250 extern Lisp_Object Vcharset_list; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
251 extern Lisp_Object Viso_2022_charset_list; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
252 extern Lisp_Object Vemacs_mule_charset_list; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
253 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
254 extern struct charset *emacs_mule_charset[256]; |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
255 |
17052 | 256 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
257 /* Macros to access information about charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
258 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
259 /* Return the attribute vector of charset whose symbol is SYMBOL. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
260 #define CHARSET_SYMBOL_ATTRIBUTES(symbol) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
261 Fgethash ((symbol), Vcharset_hash_table, Qnil) |
17833
59aa4a0772f6
(VALID_CHAR_P): New macro.
Kenichi Handa <handa@m17n.org>
parents:
17726
diff
changeset
|
262 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
263 #define CHARSET_ATTR_ID(attrs) AREF ((attrs), charset_id) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
264 #define CHARSET_ATTR_NAME(attrs) AREF ((attrs), charset_name) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
265 #define CHARSET_ATTR_PLIST(attrs) AREF ((attrs), charset_plist) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
266 #define CHARSET_ATTR_MAP(attrs) AREF ((attrs), charset_map) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
267 #define CHARSET_ATTR_DECODER(attrs) AREF ((attrs), charset_decoder) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
268 #define CHARSET_ATTR_ENCODER(attrs) AREF ((attrs), charset_encoder) |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
269 #define CHARSET_ATTR_SUBSET(attrs) AREF ((attrs), charset_subset) |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
270 #define CHARSET_ATTR_SUPERSET(attrs) AREF ((attrs), charset_superset) |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
271 #define CHARSET_ATTR_UNIFY_MAP(attrs) AREF ((attrs), charset_unify_map) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
272 #define CHARSET_ATTR_DEUNIFIER(attrs) AREF ((attrs), charset_deunifier) |
21033
9f32198e0d9f
(NONASCII_INSERT_OFFSET): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20932
diff
changeset
|
273 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
274 #define CHARSET_SYMBOL_ID(symbol) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
275 CHARSET_ATTR_ID (CHARSET_SYMBOL_ATTRIBUTES (symbol)) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
276 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
277 /* Return an index to Vcharset_hash_table of the charset whose symbol |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
278 is SYMBOL. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
279 #define CHARSET_SYMBOL_HASH_INDEX(symbol) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
280 hash_lookup (XHASH_TABLE (Vcharset_hash_table), symbol, NULL) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
281 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
282 /* Return the attribute vector of CHARSET. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
283 #define CHARSET_ATTRIBUTES(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
284 (HASH_VALUE (XHASH_TABLE (Vcharset_hash_table), (charset)->hash_index)) |
21033
9f32198e0d9f
(NONASCII_INSERT_OFFSET): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20932
diff
changeset
|
285 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
286 #define CHARSET_ID(charset) ((charset)->id) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
287 #define CHARSET_HASH_INDEX(charset) ((charset)->hash_index) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
288 #define CHARSET_DIMENSION(charset) ((charset)->dimension) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
289 #define CHARSET_CODE_SPACE(charset) ((charset)->code_space) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
290 #define CHARSET_CODE_LINEAR_P(charset) ((charset)->code_linear_p) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
291 #define CHARSET_ISO_CHARS_96(charset) ((charset)->iso_chars_96) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
292 #define CHARSET_ISO_FINAL(charset) ((charset)->iso_final) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
293 #define CHARSET_ISO_PLANE(charset) ((charset)->iso_plane) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
294 #define CHARSET_ISO_REVISION(charset) ((charset)->iso_revision) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
295 #define CHARSET_EMACS_MULE_ID(charset) ((charset)->emacs_mule_id) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
296 #define CHARSET_ASCII_COMPATIBLE_P(charset) ((charset)->ascii_compatible_p) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
297 #define CHARSET_COMPACT_CODES_P(charset) ((charset)->compact_codes_p) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
298 #define CHARSET_METHOD(charset) ((charset)->method) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
299 #define CHARSET_MIN_CODE(charset) ((charset)->min_code) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
300 #define CHARSET_MAX_CODE(charset) ((charset)->max_code) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
301 #define CHARSET_INVALID_CODE(charset) ((charset)->invalid_code) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
302 #define CHARSET_MIN_CHAR(charset) ((charset)->min_char) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
303 #define CHARSET_MAX_CHAR(charset) ((charset)->max_char) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
304 #define CHARSET_CODE_OFFSET(charset) ((charset)->code_offset) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
305 #define CHARSET_UNIFIED_P(charset) ((charset)->unified_p) |
25505
4d5f87073d63
(MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents:
25234
diff
changeset
|
306 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
307 #define CHARSET_NAME(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
308 (CHARSET_ATTR_NAME (CHARSET_ATTRIBUTES (charset))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
309 #define CHARSET_MAP(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
310 (CHARSET_ATTR_MAP (CHARSET_ATTRIBUTES (charset))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
311 #define CHARSET_DECODER(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
312 (CHARSET_ATTR_DECODER (CHARSET_ATTRIBUTES (charset))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
313 #define CHARSET_ENCODER(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
314 (CHARSET_ATTR_ENCODER (CHARSET_ATTRIBUTES (charset))) |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
315 #define CHARSET_SUBSET(charset) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
316 (CHARSET_ATTR_SUBSET (CHARSET_ATTRIBUTES (charset))) |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
317 #define CHARSET_SUPERSET(charset) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
318 (CHARSET_ATTR_SUPERSET (CHARSET_ATTRIBUTES (charset))) |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
319 #define CHARSET_UNIFY_MAP(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
320 (CHARSET_ATTR_UNIFY_MAP (CHARSET_ATTRIBUTES (charset))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
321 #define CHARSET_DEUNIFIER(charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
322 (CHARSET_ATTR_DEUNIFIER (CHARSET_ATTRIBUTES (charset))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
323 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
324 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
325 /* Nonzero iff OBJ is a valid charset symbol. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
326 #define CHARSETP(obj) (CHARSET_SYMBOL_HASH_INDEX (obj) >= 0) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
327 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
328 /* Check if X is a valid charset symbol. If not, signal an error. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
329 #define CHECK_CHARSET(x) \ |
25505
4d5f87073d63
(MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents:
25234
diff
changeset
|
330 do { \ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
331 if (! SYMBOLP (x) || CHARSET_SYMBOL_HASH_INDEX (x) < 0) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
332 x = wrong_type_argument (Qcharsetp, (x)); \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
333 } while (0) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
334 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
335 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
336 /* Check if X is a valid charset symbol. If valid, set ID to the id |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
337 number of the charset. Otherwise, signal an error. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
338 #define CHECK_CHARSET_GET_ID(x, id) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
339 do { \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
340 int idx; \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
341 \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
342 if (! SYMBOLP (x) || (idx = CHARSET_SYMBOL_HASH_INDEX (x)) < 0) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
343 x = wrong_type_argument (Qcharsetp, (x)); \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
344 id = AREF (HASH_VALUE (XHASH_TABLE (Vcharset_hash_table), idx), \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
345 charset_id); \ |
25505
4d5f87073d63
(MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents:
25234
diff
changeset
|
346 } while (0) |
21033
9f32198e0d9f
(NONASCII_INSERT_OFFSET): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20932
diff
changeset
|
347 |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
348 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
349 /* Check if X is a valid charset symbol. If valid, set ATTR to the |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
350 attr vector of the charset. Otherwise, signal an error. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
351 #define CHECK_CHARSET_GET_ATTR(x, attr) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
352 do { \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
353 if (!SYMBOLP (x) || NILP (attr = CHARSET_SYMBOL_ATTRIBUTES (x))) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
354 x = wrong_type_argument (Qcharsetp, (x)); \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
355 } while (0) |
19319 | 356 |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
357 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
358 #define CHECK_CHARSET_GET_CHARSET(x, charset) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
359 do { \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
360 int id; \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
361 CHECK_CHARSET_GET_ID (x, id); \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
362 charset = CHARSET_FROM_ID (id); \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
363 } while (0) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
364 |
19319 | 365 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
366 /* Lookup Vcharset_order_list and return the first charset that |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
367 contains the character C. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
368 #define CHAR_CHARSET(c) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
369 char_charset ((c), Qnil, NULL) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
370 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
371 #if 0 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
372 /* Char-table of charset-sets. Each element is a bool vector indexed |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
373 by a charset ID. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
374 extern Lisp_Object Vchar_charset_set; |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
375 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
376 /* Charset-bag of character C. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
377 #define CHAR_CHARSET_SET(c) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
378 CHAR_TABLE_REF (Vchar_charset_set, c) |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
379 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
380 /* Check if two characters C1 and C2 belong to the same charset. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
381 #define SAME_CHARSET_P(c1, c2) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
382 intersection_p (CHAR_CHARSET_SET (c1), CHAR_CHARSET_SET (c2)) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
383 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
384 #endif |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
385 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
386 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
387 /* Return a character correponding to the code-point CODE of CHARSET. |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
388 Try some optimization before calling decode_char. */ |
17052 | 389 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
390 #define DECODE_CHAR(charset, code) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
391 ((ASCII_BYTE_P (code) && (charset)->ascii_compatible_p) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
392 ? (code) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
393 : ((code) < (charset)->min_code || (code) > (charset)->max_code) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
394 ? -1 \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
395 : (charset)->unified_p \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
396 ? decode_char ((charset), (code)) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
397 : (charset)->method == CHARSET_METHOD_OFFSET \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
398 ? ((charset)->code_linear_p \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
399 ? (code) - (charset)->min_code + (charset)->code_offset \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
400 : decode_char ((charset), (code))) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
401 : (charset)->method == CHARSET_METHOD_MAP \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
402 ? ((charset)->code_linear_p \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
403 ? XINT (AREF (CHARSET_DECODER (charset), \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
404 (code) - (charset)->min_code)) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
405 : decode_char ((charset), (code))) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
406 : decode_char ((charset), (code))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
407 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
408 |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
409 extern Lisp_Object charset_work; |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
410 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
411 /* Return a code point of CHAR in CHARSET. |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
412 Try some optimization before calling encode_char. */ |
19319 | 413 |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
414 #define ENCODE_CHAR(charset, c) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
415 ((ASCII_CHAR_P (c) && (charset)->ascii_compatible_p) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
416 ? (c) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
417 : (charset)->unified_p \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
418 ? encode_char ((charset), (c)) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
419 : ((c) < (charset)->min_char || (c) > (charset)->max_char) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
420 ? (charset)->invalid_code \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
421 : (charset)->method == CHARSET_METHOD_OFFSET \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
422 ? ((charset)->code_linear_p \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
423 ? (c) - (charset)->code_offset + (charset)->min_code \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
424 : encode_char ((charset), (c))) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
425 : (charset)->method == CHARSET_METHOD_MAP \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
426 ? ((charset)->compact_codes_p \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
427 ? (charset_work = CHAR_TABLE_REF (CHARSET_ENCODER (charset), (c)), \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
428 (NILP (charset_work) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
429 ? (charset)->invalid_code \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
430 : XFASTINT (charset_work))) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
431 : encode_char ((charset), (c))) \ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
432 : encode_char ((charset), (c))) |
17052 | 433 |
25505
4d5f87073d63
(MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents:
25234
diff
changeset
|
434 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
435 /* Set to 1 when a charset map is loaded to warn that a buffer text |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
436 and a string data may be relocated. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
437 extern int charset_map_loaded; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
438 |
19319 | 439 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
440 /* Set CHARSET to the charset highest priority of C, CODE to the |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
441 code-point of C in CHARSET. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
442 #define SPLIT_CHAR(c, charset, code) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
443 ((charset) = char_charset ((c), Qnil, &(code))) |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
444 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
445 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
446 #define ISO_MAX_DIMENSION 3 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
447 #define ISO_MAX_CHARS 2 |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
448 #define ISO_MAX_FINAL 0x80 /* only 0x30..0xFF are used */ |
17052 | 449 |
450 /* Mapping table from ISO2022's charset (specified by DIMENSION, | |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
451 CHARS, and FINAL_CHAR) to Emacs' charset ID. Should be accessed by |
17052 | 452 macro ISO_CHARSET_TABLE (DIMENSION, CHARS, FINAL_CHAR). */ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
453 extern int iso_charset_table[ISO_MAX_DIMENSION][ISO_MAX_CHARS][ISO_MAX_FINAL]; |
17052 | 454 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
455 /* A charset of type iso2022 who has DIMENSION, CHARS, and FINAL |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
456 (final character). */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
457 #define ISO_CHARSET_TABLE(dimension, chars_96, final) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
458 iso_charset_table[(dimension) - 1][(chars_96)][(final)] |
20589
3acb053e757e
(FETCH_STRING_CHAR_ADVANCE): New macro.
Richard M. Stallman <rms@gnu.org>
parents:
20531
diff
changeset
|
459 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
460 /* Nonzero iff the charset who has FAST_MAP may contain C. */ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
461 #define CHARSET_FAST_MAP_REF(c, fast_map) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
462 ((c) < 0x10000 \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
463 ? fast_map[(c) >> 10] & (1 << (((c) >> 7) & 7)) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
464 : fast_map[((c) >> 15) + 62] & (1 << (((c) >> 12) & 7))) |
26843
0aadeca4a4a7
In this entry, just `Modified' means that codes for a
Kenichi Handa <handa@m17n.org>
parents:
25637
diff
changeset
|
465 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
466 #define CHARSET_FAST_MAP_SET(c, fast_map) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
467 do { \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
468 if ((c) < 0x10000) \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
469 (fast_map)[(c) >> 10] |= 1 << (((c) >> 7) & 7); \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
470 else \ |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
471 (fast_map)[((c) >> 15) + 62] |= 1 << (((c) >> 12) & 7); \ |
17052 | 472 } while (0) |
473 | |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
474 |
20531
f019e056ad9a
(CHAR_HEAD_P): Take char, not pointer, as arg.
Richard M. Stallman <rms@gnu.org>
parents:
20352
diff
changeset
|
475 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
476 /* 1 iff CHARSET may contain the character C. */ |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
477 #define CHAR_CHARSET_P(c, charset) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
478 ((ASCII_CHAR_P (c) && (charset)->ascii_compatible_p) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
479 || (CHARSET_UNIFIED_P (charset) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
480 ? encode_char ((charset), (c)) != (charset)->invalid_code \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
481 : (CHARSET_FAST_MAP_REF ((c), (charset)->fast_map) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
482 && ((charset)->method == CHARSET_METHOD_OFFSET \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
483 ? (c) >= (charset)->min_char && (c) <= (charset)->max_char \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
484 : ((charset)->method == CHARSET_METHOD_MAP \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
485 && (charset)->compact_codes_p) \ |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
486 ? ! NILP (CHAR_TABLE_REF (CHARSET_ENCODER (charset), (c))) \ |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
487 : encode_char ((charset), (c)) != (charset)->invalid_code)))) |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
488 |
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
489 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
490 extern Lisp_Object Qcharsetp; |
29004
383e4e21306a
(LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents:
28513
diff
changeset
|
491 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
492 extern Lisp_Object Qascii, Qunicode; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
493 extern int charset_ascii, charset_8_bit_control, charset_8_bit_graphic; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
494 extern int charset_iso_8859_1; |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
495 extern int charset_primary; |
88682
e2170fdb6abc
(charset_jisx0201_roman, charset_jisx0208_1978,
Kenichi Handa <handa@m17n.org>
parents:
88677
diff
changeset
|
496 extern int charset_jisx0201_roman; |
e2170fdb6abc
(charset_jisx0201_roman, charset_jisx0208_1978,
Kenichi Handa <handa@m17n.org>
parents:
88677
diff
changeset
|
497 extern int charset_jisx0208_1978; |
e2170fdb6abc
(charset_jisx0201_roman, charset_jisx0208_1978,
Kenichi Handa <handa@m17n.org>
parents:
88677
diff
changeset
|
498 extern int charset_jisx0208; |
20932
3c2c8431c51d
(INC_POS): Use macro BASE_LEADING_CODE_P.
Kenichi Handa <handa@m17n.org>
parents:
20904
diff
changeset
|
499 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
500 extern struct charset *char_charset P_ ((int, Lisp_Object, unsigned *)); |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
501 extern Lisp_Object charset_attributes P_ ((int)); |
17726 | 502 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
503 extern int decode_char P_ ((struct charset *, unsigned)); |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
504 extern unsigned encode_char P_ ((struct charset *, int)); |
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
505 extern int string_xstring_p P_ ((Lisp_Object)); |
23488
958ab288116d
(Vauto_fill_chars): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
23202
diff
changeset
|
506 |
88744
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
507 extern void map_charset_chars P_ ((void (*) (Lisp_Object, Lisp_Object), |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
508 Lisp_Object, Lisp_Object, |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
509 struct charset *, unsigned, unsigned)); |
5b9a72e491d4
(enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents:
88682
diff
changeset
|
510 |
88364
f6557aebe110
Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents:
42473
diff
changeset
|
511 EXFUN (Funify_charset, 2); |
20719 | 512 |
29570
825505ff211e
(EMACS_CHARSET_H): Renamed from _CHARSET_H.
Kenichi Handa <handa@m17n.org>
parents:
29539
diff
changeset
|
513 #endif /* EMACS_CHARSET_H */ |