annotate src/charset.h @ 89795:d117367b6d18

*** empty log message ***
author Kenichi Handa <handa@m17n.org>
date Tue, 03 Feb 2004 04:39:27 +0000
parents 0747ef3c747c
children 109e674576b8
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
1 /* Header for charset handler.
20708
ed9ed828415e Update copyright year.
Richard M. Stallman <rms@gnu.org>
parents: 20589
diff changeset
2 Copyright (C) 1995, 1997, 1998 Electrotechnical Laboratory, JAPAN.
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89366
diff changeset
3 Licensed to the Free Software Foundation.
38395
b7a9187751b2 (CHAR_STRING_NO_SIGNAL): New macro.
Gerd Moellmann <gerd@gnu.org>
parents: 35949
diff changeset
4 Copyright (C) 2001 Free Software Foundation, Inc.
89483
2f877ed80fa6 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88123 89366
diff changeset
5 Copyright (C) 2003
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
6 National Institute of Advanced Industrial Science and Technology (AIST)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
7 Registration Number H13PRO009
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
8
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
9 This file is part of GNU Emacs.
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
10
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
11 GNU Emacs is free software; you can redistribute it and/or modify
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
12 it under the terms of the GNU General Public License as published by
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
13 the Free Software Foundation; either version 2, or (at your option)
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
14 any later version.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
15
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
16 GNU Emacs is distributed in the hope that it will be useful,
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
17 but WITHOUT ANY WARRANTY; without even the implied warranty of
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
18 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
19 GNU General Public License for more details.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
20
17071
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
21 You should have received a copy of the GNU General Public License
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
22 along with GNU Emacs; see the file COPYING. If not, write to
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
23 the Free Software Foundation, Inc., 59 Temple Place - Suite 330,
70194012fb3a Fix FSF address in comment.
Karl Heuer <kwzh@gnu.org>
parents: 17052
diff changeset
24 Boston, MA 02111-1307, USA. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
25
29570
825505ff211e (EMACS_CHARSET_H): Renamed from _CHARSET_H.
Kenichi Handa <handa@m17n.org>
parents: 29539
diff changeset
26 #ifndef EMACS_CHARSET_H
825505ff211e (EMACS_CHARSET_H): Renamed from _CHARSET_H.
Kenichi Handa <handa@m17n.org>
parents: 29539
diff changeset
27 #define EMACS_CHARSET_H
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
28
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
29 /* Index to arguments of Fdefine_charset_internal. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
30
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
31 enum define_charset_arg_index
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
32 {
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
33 charset_arg_name,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
34 charset_arg_dimension,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
35 charset_arg_code_space,
88677
61f981fb213a (sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents: 88476
diff changeset
36 charset_arg_min_code,
61f981fb213a (sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents: 88476
diff changeset
37 charset_arg_max_code,
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
38 charset_arg_iso_final,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
39 charset_arg_iso_revision,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
40 charset_arg_emacs_mule_id,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
41 charset_arg_ascii_compatible_p,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
42 charset_arg_supplementary_p,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
43 charset_arg_invalid_code,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
44 charset_arg_code_offset,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
45 charset_arg_map,
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
46 charset_arg_subset,
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
47 charset_arg_superset,
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
48 charset_arg_unify_map,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
49 charset_arg_plist,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
50 charset_arg_max
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
51 };
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
52
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
53
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
54 /* Indices to charset attributes vector. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
55
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
56 enum charset_attr_index
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
57 {
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
58 /* ID number of the charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
59 charset_id,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
60
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
61 /* Name of the charset (symbol). */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
62 charset_name,
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
63
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
64 /* Property list of the charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
65 charset_plist,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
66
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
67 /* If the method of the charset is `MAP_DEFERRED', the value is a
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
68 mapping vector or a file name that contains mapping vector.
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
69 Otherwise, nil. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
70 charset_map,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
71
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
72 /* If the method of the charset is `MAP', the value is a vector
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
73 that maps code points of the charset to characters. The vector
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
74 is indexed by a character index. A character index is
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
75 calculated from a code point and the code-space table of the
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
76 charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
77 charset_decoder,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
78
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
79 /* If the method of the charset is `MAP', the value is a
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
80 char-table that maps characters of the charset to code
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
81 points. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
82 charset_encoder,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
83
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
84 /* If the method of the charset is `SUBSET', the value is a vector
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
85 that has this form:
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
86
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
87 [ CHARSET-ID MIN-CODE MAX-CODE OFFSET ]
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
88
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
89 CHARSET-ID is an ID number of a parent charset. MIN-CODE and
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
90 MAX-CODE specify the range of characters inherited from the
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
91 parent. OFFSET is an integer value to add to a code point of
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
92 the parent charset to get the corresponding code point of this
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
93 charset. */
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
94 charset_subset,
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
95
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
96 /* If the method of the charset is `SUPERSET', the value is a list
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
97 whose elements have this form:
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
98
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
99 (CHARSET-ID . OFFSET)
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
100
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
101 CHARSET-IDs are ID numbers of parent charsets. OFFSET is an
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
102 integer value to add to a code point of the parent charset to
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
103 get the corresponding code point of this charset. */
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
104 charset_superset,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
105
88839
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
106 /* The value is a mapping vector or a file name that contains the
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
107 mapping. This defines how characters in the charset should be
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
108 unified with Unicode. The value of the member
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
109 `charset_deunifier' is created from this information. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
110 charset_unify_map,
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
111
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
112 /* If characters in the charset must be unified Unicode, the value
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
113 is a char table that maps a character code in the charset to
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
114 the corresponding Unicode character. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
115 charset_deunifier,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
116
88839
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
117 /* The length of the charset attribute vector. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
118 charset_attr_max
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
119 };
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
120
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
121 /* Methods for converting code points and characters of charsets. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
122
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
123 enum charset_method
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
124 {
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
125 /* For a charset of this method, a character code is calculated
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
126 from a character index (which is calculated from a code point)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
127 simply by adding an offset value. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
128 CHARSET_METHOD_OFFSET,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
129
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
130 /* For a charset of this method, a decoder vector and an encoder
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
131 char-table is used for code point <-> character code
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
132 conversion. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
133 CHARSET_METHOD_MAP,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
134
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
135 /* Same as above but decoder and encoder are loaded from a file on
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
136 demand. Once loaded, the method is changed to
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
137 CHARSET_METHOD_MAP. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
138 CHARSET_METHOD_MAP_DEFERRED,
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
139
88839
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
140 /* A charset of this method is a subset of another charset. */
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
141 CHARSET_METHOD_SUBSET,
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
142
88839
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
143 /* A charset of this method is a superset of other charsets. */
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
144 CHARSET_METHOD_SUPERSET
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
145 };
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
146
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
147 struct charset
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
148 {
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
149 /* Index to charset_table. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
150 int id;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
151
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
152 /* Index to Vcharset_hash_table. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
153 int hash_index;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
154
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
155 /* Dimension of the charset: 1, 2, 3, or 4. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
156 int dimension;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
157
88476
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
158 /* Byte code range of each dimension. <code_space>[4N] is a mininum
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
159 byte code of the (N+1)th dimension, <code_space>[4N+1] is a
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
160 maximum byte code of the (N+1)th dimension, <code_space>[4N+2] is
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
161 (<code_space>[4N+1] - <code_space>[4N] + 1), <code_space>[4N+3]
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
162 is a number of characters containd in the first to (N+1)th
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
163 dismesions. We get `char-index' of a `code-point' from this
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
164 information. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
165 int code_space[16];
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
166
88476
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
167 /* If B is a byte of Nth dimension of a code-point, the (N-1)th bit
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
168 of code_space_mask[B] is set. This array is used to quickly
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
169 check if a code-point is in a valid range. */
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
170 unsigned char *code_space_mask;
47c2e6825a1e (struct charset): New member `code_space_mask'.
Kenichi Handa <handa@m17n.org>
parents: 88436
diff changeset
171
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
172 /* 1 if there's no gap in code-points. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
173 int code_linear_p;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
174
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
175 /* If the charset is treated as 94-chars in ISO-2022, the value is 0.
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
176 If the charset is treated as 96-chars in ISO-2022, the value is 1. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
177 int iso_chars_96;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
178
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
179 /* ISO final byte of the charset: 48..127. It may be -1 if the
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
180 charset doesn't conform to ISO-2022. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
181 int iso_final;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
182
88436
29c4241b5418 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88364
diff changeset
183 /* ISO revision number of the charset. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
184 int iso_revision;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
185
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
186 /* If the charset is identical to what supported by Emacs 21 and the
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
187 priors, the identification number of the charset used in those
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
188 version. Otherwise, -1. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
189 int emacs_mule_id;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
190
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
191 /* Nonzero iff the charset is compatible with ASCII. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
192 int ascii_compatible_p;
35478
340a9e4aeb29 comment fixes
Dave Love <fx@gnu.org>
parents: 35408
diff changeset
193
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
194 /* Nonzero iff the charset is supplementary. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
195 int supplementary_p;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
196
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
197 /* Nonzero iff all the code points are representable by Lisp_Int. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
198 int compact_codes_p;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
199
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
200 /* The method for encoding/decoding characters of the charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
201 enum charset_method method;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
202
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
203 /* Mininum and Maximum code points of the charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
204 unsigned min_code, max_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
205
88677
61f981fb213a (sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents: 88476
diff changeset
206 /* Offset value used by macros CODE_POINT_TO_INDEX and
61f981fb213a (sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents: 88476
diff changeset
207 INDEX_TO_CODE_POINT. . */
61f981fb213a (sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents: 88476
diff changeset
208 unsigned char_index_offset;
61f981fb213a (sturct define_charset_arg_index): New enums charset_arg_min_code and
Kenichi Handa <handa@m17n.org>
parents: 88476
diff changeset
209
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
210 /* Mininum and Maximum character codes of the charset. If the
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
211 charset is compatible with ASCII, min_char is a minimum non-ASCII
88875
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
212 character of the charset. If the method of charset is
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
213 CHARSET_METHOD_OFFSET, even if the charset is unified, min_char
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
214 and max_char doesn't change. */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
215 int min_char, max_char;
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
216
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
217 /* The code returned by ENCODE_CHAR if a character is not encodable
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
218 by the charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
219 unsigned invalid_code;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
220
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
221 /* If the method of the charset is CHARSET_METHOD_MAP, this is a
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
222 table of bits used to quickly and roughly guess if a character
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
223 belongs to the charset.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
224
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
225 The first 64 elements are 512 bits for characters less than
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
226 0x10000. Each bit corresponds to 128-character block. The last
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
227 126 elements are 1008 bits for the greater characters
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
228 (0x10000..0x3FFFFF). Each bit corresponds to 4096-character
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
229 block.
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
230
88839
0a02d452fece Comments.
Dave Love <fx@gnu.org>
parents: 88744
diff changeset
231 If a bit is 1, at least one character in the corresponding block is
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
232 in this charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
233 unsigned char fast_map[190];
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
234
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
235 /* Offset value to calculate a character code from code-point, and
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
236 visa versa. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
237 int code_offset;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
238
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
239 int unified_p;
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
240 };
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
241
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
242 /* Hash table of charset symbols vs. the correponding attribute
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
243 vectors. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
244 extern Lisp_Object Vcharset_hash_table;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
245
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
246 /* Table of struct charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
247 extern struct charset *charset_table;
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
248
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
249 #define CHARSET_FROM_ID(id) (charset_table + (id))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
250
88875
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
251 extern Lisp_Object Vcharset_ordered_list;
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
252
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
253 /* Incremented everytime we change the priority of charsets. */
89065
62aa2d4f3773 (charset_ordered_list_tick): Declare extern.
Dave Love <fx@gnu.org>
parents: 89064
diff changeset
254 extern unsigned short charset_ordered_list_tick;
88875
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
255
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
256 extern Lisp_Object Vcharset_list;
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
257 extern Lisp_Object Viso_2022_charset_list;
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
258 extern Lisp_Object Vemacs_mule_charset_list;
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
259
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
260 extern struct charset *emacs_mule_charset[256];
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
261
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
262
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
263 /* Macros to access information about charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
264
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
265 /* Return the attribute vector of charset whose symbol is SYMBOL. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
266 #define CHARSET_SYMBOL_ATTRIBUTES(symbol) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
267 Fgethash ((symbol), Vcharset_hash_table, Qnil)
17833
59aa4a0772f6 (VALID_CHAR_P): New macro.
Kenichi Handa <handa@m17n.org>
parents: 17726
diff changeset
268
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
269 #define CHARSET_ATTR_ID(attrs) AREF ((attrs), charset_id)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
270 #define CHARSET_ATTR_NAME(attrs) AREF ((attrs), charset_name)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
271 #define CHARSET_ATTR_PLIST(attrs) AREF ((attrs), charset_plist)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
272 #define CHARSET_ATTR_MAP(attrs) AREF ((attrs), charset_map)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
273 #define CHARSET_ATTR_DECODER(attrs) AREF ((attrs), charset_decoder)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
274 #define CHARSET_ATTR_ENCODER(attrs) AREF ((attrs), charset_encoder)
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
275 #define CHARSET_ATTR_SUBSET(attrs) AREF ((attrs), charset_subset)
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
276 #define CHARSET_ATTR_SUPERSET(attrs) AREF ((attrs), charset_superset)
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
277 #define CHARSET_ATTR_UNIFY_MAP(attrs) AREF ((attrs), charset_unify_map)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
278 #define CHARSET_ATTR_DEUNIFIER(attrs) AREF ((attrs), charset_deunifier)
21033
9f32198e0d9f (NONASCII_INSERT_OFFSET): New macro.
Kenichi Handa <handa@m17n.org>
parents: 20932
diff changeset
279
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
280 #define CHARSET_SYMBOL_ID(symbol) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
281 CHARSET_ATTR_ID (CHARSET_SYMBOL_ATTRIBUTES (symbol))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
282
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
283 /* Return an index to Vcharset_hash_table of the charset whose symbol
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
284 is SYMBOL. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
285 #define CHARSET_SYMBOL_HASH_INDEX(symbol) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
286 hash_lookup (XHASH_TABLE (Vcharset_hash_table), symbol, NULL)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
287
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
288 /* Return the attribute vector of CHARSET. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
289 #define CHARSET_ATTRIBUTES(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
290 (HASH_VALUE (XHASH_TABLE (Vcharset_hash_table), (charset)->hash_index))
21033
9f32198e0d9f (NONASCII_INSERT_OFFSET): New macro.
Kenichi Handa <handa@m17n.org>
parents: 20932
diff changeset
291
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
292 #define CHARSET_ID(charset) ((charset)->id)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
293 #define CHARSET_HASH_INDEX(charset) ((charset)->hash_index)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
294 #define CHARSET_DIMENSION(charset) ((charset)->dimension)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
295 #define CHARSET_CODE_SPACE(charset) ((charset)->code_space)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
296 #define CHARSET_CODE_LINEAR_P(charset) ((charset)->code_linear_p)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
297 #define CHARSET_ISO_CHARS_96(charset) ((charset)->iso_chars_96)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
298 #define CHARSET_ISO_FINAL(charset) ((charset)->iso_final)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
299 #define CHARSET_ISO_PLANE(charset) ((charset)->iso_plane)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
300 #define CHARSET_ISO_REVISION(charset) ((charset)->iso_revision)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
301 #define CHARSET_EMACS_MULE_ID(charset) ((charset)->emacs_mule_id)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
302 #define CHARSET_ASCII_COMPATIBLE_P(charset) ((charset)->ascii_compatible_p)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
303 #define CHARSET_COMPACT_CODES_P(charset) ((charset)->compact_codes_p)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
304 #define CHARSET_METHOD(charset) ((charset)->method)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
305 #define CHARSET_MIN_CODE(charset) ((charset)->min_code)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
306 #define CHARSET_MAX_CODE(charset) ((charset)->max_code)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
307 #define CHARSET_INVALID_CODE(charset) ((charset)->invalid_code)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
308 #define CHARSET_MIN_CHAR(charset) ((charset)->min_char)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
309 #define CHARSET_MAX_CHAR(charset) ((charset)->max_char)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
310 #define CHARSET_CODE_OFFSET(charset) ((charset)->code_offset)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
311 #define CHARSET_UNIFIED_P(charset) ((charset)->unified_p)
25505
4d5f87073d63 (MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents: 25234
diff changeset
312
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
313 #define CHARSET_NAME(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
314 (CHARSET_ATTR_NAME (CHARSET_ATTRIBUTES (charset)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
315 #define CHARSET_MAP(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
316 (CHARSET_ATTR_MAP (CHARSET_ATTRIBUTES (charset)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
317 #define CHARSET_DECODER(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
318 (CHARSET_ATTR_DECODER (CHARSET_ATTRIBUTES (charset)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
319 #define CHARSET_ENCODER(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
320 (CHARSET_ATTR_ENCODER (CHARSET_ATTRIBUTES (charset)))
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
321 #define CHARSET_SUBSET(charset) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
322 (CHARSET_ATTR_SUBSET (CHARSET_ATTRIBUTES (charset)))
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
323 #define CHARSET_SUPERSET(charset) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
324 (CHARSET_ATTR_SUPERSET (CHARSET_ATTRIBUTES (charset)))
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
325 #define CHARSET_UNIFY_MAP(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
326 (CHARSET_ATTR_UNIFY_MAP (CHARSET_ATTRIBUTES (charset)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
327 #define CHARSET_DEUNIFIER(charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
328 (CHARSET_ATTR_DEUNIFIER (CHARSET_ATTRIBUTES (charset)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
329
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
330
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
331 /* Nonzero iff OBJ is a valid charset symbol. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
332 #define CHARSETP(obj) (CHARSET_SYMBOL_HASH_INDEX (obj) >= 0)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
333
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
334 /* Check if X is a valid charset symbol. If not, signal an error. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
335 #define CHECK_CHARSET(x) \
25505
4d5f87073d63 (MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents: 25234
diff changeset
336 do { \
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
337 if (! SYMBOLP (x) || CHARSET_SYMBOL_HASH_INDEX (x) < 0) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
338 x = wrong_type_argument (Qcharsetp, (x)); \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
339 } while (0)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
340
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
341
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
342 /* Check if X is a valid charset symbol. If valid, set ID to the id
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
343 number of the charset. Otherwise, signal an error. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
344 #define CHECK_CHARSET_GET_ID(x, id) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
345 do { \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
346 int idx; \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
347 \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
348 if (! SYMBOLP (x) || (idx = CHARSET_SYMBOL_HASH_INDEX (x)) < 0) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
349 x = wrong_type_argument (Qcharsetp, (x)); \
88854
8b5248397330 (CHECK_CHARSET_GET_ID): Use XINT on AREF result.
Dave Love <fx@gnu.org>
parents: 88839
diff changeset
350 id = XINT (AREF (HASH_VALUE (XHASH_TABLE (Vcharset_hash_table), idx), \
8b5248397330 (CHECK_CHARSET_GET_ID): Use XINT on AREF result.
Dave Love <fx@gnu.org>
parents: 88839
diff changeset
351 charset_id)); \
25505
4d5f87073d63 (MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents: 25234
diff changeset
352 } while (0)
21033
9f32198e0d9f (NONASCII_INSERT_OFFSET): New macro.
Kenichi Handa <handa@m17n.org>
parents: 20932
diff changeset
353
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
354
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
355 /* Check if X is a valid charset symbol. If valid, set ATTR to the
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
356 attr vector of the charset. Otherwise, signal an error. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
357 #define CHECK_CHARSET_GET_ATTR(x, attr) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
358 do { \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
359 if (!SYMBOLP (x) || NILP (attr = CHARSET_SYMBOL_ATTRIBUTES (x))) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
360 x = wrong_type_argument (Qcharsetp, (x)); \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
361 } while (0)
19319
9ea3c87ea61d Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18341
diff changeset
362
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
363
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
364 #define CHECK_CHARSET_GET_CHARSET(x, charset) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
365 do { \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
366 int id; \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
367 CHECK_CHARSET_GET_ID (x, id); \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
368 charset = CHARSET_FROM_ID (id); \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
369 } while (0)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
370
19319
9ea3c87ea61d Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18341
diff changeset
371
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
372 /* Lookup Vcharset_order_list and return the first charset that
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
373 contains the character C. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
374 #define CHAR_CHARSET(c) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
375 char_charset ((c), Qnil, NULL)
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
376
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
377 #if 0
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
378 /* Char-table of charset-sets. Each element is a bool vector indexed
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
379 by a charset ID. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
380 extern Lisp_Object Vchar_charset_set;
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
381
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
382 /* Charset-bag of character C. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
383 #define CHAR_CHARSET_SET(c) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
384 CHAR_TABLE_REF (Vchar_charset_set, c)
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
385
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
386 /* Check if two characters C1 and C2 belong to the same charset. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
387 #define SAME_CHARSET_P(c1, c2) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
388 intersection_p (CHAR_CHARSET_SET (c1), CHAR_CHARSET_SET (c2))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
389
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
390 #endif
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
391
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
392
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
393 /* Return a character correponding to the code-point CODE of CHARSET.
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
394 Try some optimization before calling decode_char. */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
395
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
396 #define DECODE_CHAR(charset, code) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
397 ((ASCII_BYTE_P (code) && (charset)->ascii_compatible_p) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
398 ? (code) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
399 : ((code) < (charset)->min_code || (code) > (charset)->max_code) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
400 ? -1 \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
401 : (charset)->unified_p \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
402 ? decode_char ((charset), (code)) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
403 : (charset)->method == CHARSET_METHOD_OFFSET \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
404 ? ((charset)->code_linear_p \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
405 ? (code) - (charset)->min_code + (charset)->code_offset \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
406 : decode_char ((charset), (code))) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
407 : (charset)->method == CHARSET_METHOD_MAP \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
408 ? ((charset)->code_linear_p \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
409 ? XINT (AREF (CHARSET_DECODER (charset), \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
410 (code) - (charset)->min_code)) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
411 : decode_char ((charset), (code))) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
412 : decode_char ((charset), (code)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
413
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
414
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
415 extern Lisp_Object charset_work;
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
416
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
417 /* Return a code point of CHAR in CHARSET.
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
418 Try some optimization before calling encode_char. */
19319
9ea3c87ea61d Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18341
diff changeset
419
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
420 #define ENCODE_CHAR(charset, c) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
421 ((ASCII_CHAR_P (c) && (charset)->ascii_compatible_p) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
422 ? (c) \
89366
0c9b64b6b6af (ENCODE_CHAR): If the method is SUBSET or SUPERSET, call encode_char.
Kenichi Handa <handa@m17n.org>
parents: 89065
diff changeset
423 : ((charset)->unified_p \
0c9b64b6b6af (ENCODE_CHAR): If the method is SUBSET or SUPERSET, call encode_char.
Kenichi Handa <handa@m17n.org>
parents: 89065
diff changeset
424 || (charset)->method == CHARSET_METHOD_SUBSET \
0c9b64b6b6af (ENCODE_CHAR): If the method is SUBSET or SUPERSET, call encode_char.
Kenichi Handa <handa@m17n.org>
parents: 89065
diff changeset
425 || (charset)->method == CHARSET_METHOD_SUPERSET) \
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
426 ? encode_char ((charset), (c)) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
427 : ((c) < (charset)->min_char || (c) > (charset)->max_char) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
428 ? (charset)->invalid_code \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
429 : (charset)->method == CHARSET_METHOD_OFFSET \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
430 ? ((charset)->code_linear_p \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
431 ? (c) - (charset)->code_offset + (charset)->min_code \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
432 : encode_char ((charset), (c))) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
433 : (charset)->method == CHARSET_METHOD_MAP \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
434 ? ((charset)->compact_codes_p \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
435 ? (charset_work = CHAR_TABLE_REF (CHARSET_ENCODER (charset), (c)), \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
436 (NILP (charset_work) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
437 ? (charset)->invalid_code \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
438 : XFASTINT (charset_work))) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
439 : encode_char ((charset), (c))) \
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
440 : encode_char ((charset), (c)))
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
441
25505
4d5f87073d63 (MAKE_NON_ASCII_CHAR): Handle the case that C1 or C2
Kenichi Handa <handa@m17n.org>
parents: 25234
diff changeset
442
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
443 /* Set to 1 when a charset map is loaded to warn that a buffer text
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
444 and a string data may be relocated. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
445 extern int charset_map_loaded;
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
446
19319
9ea3c87ea61d Comment changes.
Richard M. Stallman <rms@gnu.org>
parents: 18341
diff changeset
447
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
448 /* Set CHARSET to the charset highest priority of C, CODE to the
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
449 code-point of C in CHARSET. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
450 #define SPLIT_CHAR(c, charset, code) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
451 ((charset) = char_charset ((c), Qnil, &(code)))
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
452
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
453
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
454 #define ISO_MAX_DIMENSION 3
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
455 #define ISO_MAX_CHARS 2
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
456 #define ISO_MAX_FINAL 0x80 /* only 0x30..0xFF are used */
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
457
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
458 /* Mapping table from ISO2022's charset (specified by DIMENSION,
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
459 CHARS, and FINAL_CHAR) to Emacs' charset ID. Should be accessed by
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
460 macro ISO_CHARSET_TABLE (DIMENSION, CHARS, FINAL_CHAR). */
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
461 extern int iso_charset_table[ISO_MAX_DIMENSION][ISO_MAX_CHARS][ISO_MAX_FINAL];
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
462
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
463 /* A charset of type iso2022 who has DIMENSION, CHARS, and FINAL
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
464 (final character). */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
465 #define ISO_CHARSET_TABLE(dimension, chars_96, final) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
466 iso_charset_table[(dimension) - 1][(chars_96)][(final)]
20589
3acb053e757e (FETCH_STRING_CHAR_ADVANCE): New macro.
Richard M. Stallman <rms@gnu.org>
parents: 20531
diff changeset
467
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
468 /* Nonzero iff the charset who has FAST_MAP may contain C. */
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
469 #define CHARSET_FAST_MAP_REF(c, fast_map) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
470 ((c) < 0x10000 \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
471 ? fast_map[(c) >> 10] & (1 << (((c) >> 7) & 7)) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
472 : fast_map[((c) >> 15) + 62] & (1 << (((c) >> 12) & 7)))
26843
0aadeca4a4a7 In this entry, just `Modified' means that codes for a
Kenichi Handa <handa@m17n.org>
parents: 25637
diff changeset
473
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
474 #define CHARSET_FAST_MAP_SET(c, fast_map) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
475 do { \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
476 if ((c) < 0x10000) \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
477 (fast_map)[(c) >> 10] |= 1 << (((c) >> 7) & 7); \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
478 else \
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
479 (fast_map)[((c) >> 15) + 62] |= 1 << (((c) >> 12) & 7); \
17052
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
480 } while (0)
d0d7b244b1d0 Initial revision
Karl Heuer <kwzh@gnu.org>
parents:
diff changeset
481
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
482
20531
f019e056ad9a (CHAR_HEAD_P): Take char, not pointer, as arg.
Richard M. Stallman <rms@gnu.org>
parents: 20352
diff changeset
483
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
484 /* 1 iff CHARSET may contain the character C. */
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
485 #define CHAR_CHARSET_P(c, charset) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
486 ((ASCII_CHAR_P (c) && (charset)->ascii_compatible_p) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
487 || (CHARSET_UNIFIED_P (charset) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
488 ? encode_char ((charset), (c)) != (charset)->invalid_code \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
489 : (CHARSET_FAST_MAP_REF ((c), (charset)->fast_map) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
490 && ((charset)->method == CHARSET_METHOD_OFFSET \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
491 ? (c) >= (charset)->min_char && (c) <= (charset)->max_char \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
492 : ((charset)->method == CHARSET_METHOD_MAP \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
493 && (charset)->compact_codes_p) \
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
494 ? ! NILP (CHAR_TABLE_REF (CHARSET_ENCODER (charset), (c))) \
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
495 : encode_char ((charset), (c)) != (charset)->invalid_code))))
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
496
88875
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
497
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
498 /* Special macros for emacs-mule encoding. */
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
499
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
500 /* Leading-code followed by extended leading-code. DIMENSION/COLUMN */
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
501 #define EMACS_MULE_LEADING_CODE_PRIVATE_11 0x9A /* 1/1 */
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
502 #define EMACS_MULE_LEADING_CODE_PRIVATE_12 0x9B /* 1/2 */
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
503 #define EMACS_MULE_LEADING_CODE_PRIVATE_21 0x9C /* 2/2 */
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
504 #define EMACS_MULE_LEADING_CODE_PRIVATE_22 0x9D /* 2/2 */
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
505
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
506 extern struct charset *emacs_mule_charset[256];
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
507
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
508
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
509
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
510 extern Lisp_Object Qcharsetp;
29004
383e4e21306a (LEADING_CODE_8_BIT_CONTROL, CHARSET_8_BIT_CONTROL,
Kenichi Handa <handa@m17n.org>
parents: 28513
diff changeset
511
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
512 extern Lisp_Object Qascii, Qunicode;
88949
57ca0c34b3be (charset_8_bit): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88875
diff changeset
513 extern int charset_ascii, charset_eight_bit;
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
514 extern int charset_iso_8859_1;
89569
111c03888806 (charset_unicode): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 89483
diff changeset
515 extern int charset_unicode;
88682
e2170fdb6abc (charset_jisx0201_roman, charset_jisx0208_1978,
Kenichi Handa <handa@m17n.org>
parents: 88677
diff changeset
516 extern int charset_jisx0201_roman;
e2170fdb6abc (charset_jisx0201_roman, charset_jisx0208_1978,
Kenichi Handa <handa@m17n.org>
parents: 88677
diff changeset
517 extern int charset_jisx0208_1978;
e2170fdb6abc (charset_jisx0201_roman, charset_jisx0208_1978,
Kenichi Handa <handa@m17n.org>
parents: 88677
diff changeset
518 extern int charset_jisx0208;
20932
3c2c8431c51d (INC_POS): Use macro BASE_LEADING_CODE_P.
Kenichi Handa <handa@m17n.org>
parents: 20904
diff changeset
519
89064
2ac5108292b2 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88984
diff changeset
520 extern int charset_unibyte;
2ac5108292b2 *** empty log message ***
Kenichi Handa <handa@m17n.org>
parents: 88984
diff changeset
521
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
522 extern struct charset *char_charset P_ ((int, Lisp_Object, unsigned *));
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
523 extern Lisp_Object charset_attributes P_ ((int));
17726
b5f2a7d6a2d0 (unify_char): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 17321
diff changeset
524
88364
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
525 extern int decode_char P_ ((struct charset *, unsigned));
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
526 extern unsigned encode_char P_ ((struct charset *, int));
f6557aebe110 Completely re-written. Character and multibyte
Kenichi Handa <handa@m17n.org>
parents: 42473
diff changeset
527 extern int string_xstring_p P_ ((Lisp_Object));
23488
958ab288116d (Vauto_fill_chars): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 23202
diff changeset
528
88744
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
529 extern void map_charset_chars P_ ((void (*) (Lisp_Object, Lisp_Object),
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
530 Lisp_Object, Lisp_Object,
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
531 struct charset *, unsigned, unsigned));
5b9a72e491d4 (enum define_charset_arg_index): Delete
Kenichi Handa <handa@m17n.org>
parents: 88682
diff changeset
532
88875
1a232a6d79fc (Vcharset_ordered_list): Extern it.
Kenichi Handa <handa@m17n.org>
parents: 88854
diff changeset
533 EXFUN (Funify_charset, 3);
20719
78d95f2a9d92 (BCOPY_SHORT): New macro.
Kenichi Handa <handa@m17n.org>
parents: 20708
diff changeset
534
29570
825505ff211e (EMACS_CHARSET_H): Renamed from _CHARSET_H.
Kenichi Handa <handa@m17n.org>
parents: 29539
diff changeset
535 #endif /* EMACS_CHARSET_H */