Mercurial > emacs
annotate src/coding.h @ 89942:9cb747ae49af emacs-unicode-2-pre-sync
*** empty log message ***
author | Kenichi Handa <handa@m17n.org> |
---|---|
date | Sat, 29 May 2004 02:17:09 +0000 |
parents | 67cdf4445614 |
children | f2ebccfa87d4 |
rev | line source |
---|---|
17052 | 1 /* Header for coding system handler. |
18341
33e78cc7f058
Change copyright notices.
Richard M. Stallman <rms@gnu.org>
parents:
18181
diff
changeset
|
2 Copyright (C) 1995, 1997 Electrotechnical Laboratory, JAPAN. |
89483 | 3 Licensed to the Free Software Foundation. |
4 Copyright (C) 2003 | |
88365 | 5 National Institute of Advanced Industrial Science and Technology (AIST) |
6 Registration Number H13PRO009 | |
17052 | 7 |
17071 | 8 This file is part of GNU Emacs. |
9 | |
10 GNU Emacs is free software; you can redistribute it and/or modify | |
11 it under the terms of the GNU General Public License as published by | |
12 the Free Software Foundation; either version 2, or (at your option) | |
13 any later version. | |
17052 | 14 |
17071 | 15 GNU Emacs is distributed in the hope that it will be useful, |
16 but WITHOUT ANY WARRANTY; without even the implied warranty of | |
17 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the | |
18 GNU General Public License for more details. | |
17052 | 19 |
17071 | 20 You should have received a copy of the GNU General Public License |
21 along with GNU Emacs; see the file COPYING. If not, write to | |
22 the Free Software Foundation, Inc., 59 Temple Place - Suite 330, | |
23 Boston, MA 02111-1307, USA. */ | |
17052 | 24 |
29571
951ead33c624
(EMASC_CODING_H): Renamed from _CODING_H.
Kenichi Handa <handa@m17n.org>
parents:
29438
diff
changeset
|
25 #ifndef EMACS_CODING_H |
951ead33c624
(EMASC_CODING_H): Renamed from _CODING_H.
Kenichi Handa <handa@m17n.org>
parents:
29438
diff
changeset
|
26 #define EMACS_CODING_H |
17052 | 27 |
88365 | 28 /* Index to arguments of Fdefine_coding_system_internal. */ |
17052 | 29 |
88365 | 30 enum define_coding_system_arg_index |
17052 | 31 { |
88365 | 32 coding_arg_name, |
33 coding_arg_mnemonic, | |
34 coding_arg_coding_type, | |
35 coding_arg_charset_list, | |
36 coding_arg_ascii_compatible_p, | |
37 coding_arg_decode_translation_table, | |
38 coding_arg_encode_translation_table, | |
39 coding_arg_post_read_conversion, | |
40 coding_arg_pre_write_conversion, | |
41 coding_arg_default_char, | |
89483 | 42 coding_arg_for_unibyte, |
88365 | 43 coding_arg_plist, |
44 coding_arg_eol_type, | |
45 coding_arg_max | |
46 }; | |
47 | |
48 enum define_coding_iso2022_arg_index | |
49 { | |
50 coding_arg_iso2022_initial = coding_arg_max, | |
51 coding_arg_iso2022_reg_usage, | |
52 coding_arg_iso2022_request, | |
53 coding_arg_iso2022_flags, | |
54 coding_arg_iso2022_max | |
55 }; | |
56 | |
57 enum define_coding_utf16_arg_index | |
58 { | |
59 coding_arg_utf16_bom = coding_arg_max, | |
60 coding_arg_utf16_endian, | |
61 coding_arg_utf16_max | |
17052 | 62 }; |
63 | |
88365 | 64 enum define_coding_ccl_arg_index |
65 { | |
89372
95c081cdbd5f
(enum define_coding_ccl_arg_index): Set the first
Kenichi Handa <handa@m17n.org>
parents:
89330
diff
changeset
|
66 coding_arg_ccl_decoder = coding_arg_max, |
88365 | 67 coding_arg_ccl_encoder, |
68 coding_arg_ccl_valids, | |
69 coding_arg_ccl_max | |
70 }; | |
17052 | 71 |
89886 | 72 /* Hash table for all coding systems. Keys are coding system symbols |
73 and values are spec vectors of the corresponding coding system. A | |
74 spec vector has the form [ ATTRS ALIASES EOL-TYPE ]. ATTRS is a | |
75 vector of attributes of the coding system. ALIASES is a list of | |
76 aliases (symbols) of the coding system. EOL-TYPE is `unix', `dos', | |
77 `mac' or a vector of coding systems (symbols). */ | |
78 | |
88365 | 79 extern Lisp_Object Vcoding_system_hash_table; |
80 | |
89886 | 81 |
88365 | 82 /* Enumeration of coding system type. */ |
17052 | 83 |
88365 | 84 enum coding_system_type |
17052 | 85 { |
88365 | 86 coding_type_charset, |
87 coding_type_utf_8, | |
88 coding_type_utf_16, | |
89 coding_type_iso_2022, | |
90 coding_type_emacs_mule, | |
91 coding_type_sjis, | |
92 coding_type_ccl, | |
93 coding_type_raw_text, | |
94 coding_type_undecided, | |
95 coding_type_max | |
96 }; | |
97 | |
98 | |
99 /* Enumeration of end-of-line format type. */ | |
100 | |
101 enum end_of_line_type | |
102 { | |
103 eol_lf, /* Line-feed only, same as Emacs' internal | |
104 format. */ | |
105 eol_crlf, /* Sequence of carriage-return and | |
106 line-feed. */ | |
107 eol_cr, /* Carriage-return only. */ | |
108 eol_any, /* Accept any of above. Produce line-feed | |
109 only. */ | |
110 eol_undecided, /* This value is used to denote that the | |
111 eol-type is not yet decided. */ | |
112 eol_type_max | |
17052 | 113 }; |
114 | |
88365 | 115 /* Enumeration of index to an attribute vector of a coding system. */ |
17052 | 116 |
88365 | 117 enum coding_attr_index |
118 { | |
119 coding_attr_base_name, | |
120 coding_attr_docstring, | |
121 coding_attr_mnemonic, | |
122 coding_attr_type, | |
123 coding_attr_charset_list, | |
124 coding_attr_ascii_compat, | |
125 coding_attr_decode_tbl, | |
126 coding_attr_encode_tbl, | |
89733
d001bbbe12ce
(enum coding_attr_index): New member coding_attr_trans_tbl.
Kenichi Handa <handa@m17n.org>
parents:
89685
diff
changeset
|
127 coding_attr_trans_tbl, |
88365 | 128 coding_attr_post_read, |
129 coding_attr_pre_write, | |
130 coding_attr_default_char, | |
89483 | 131 coding_attr_for_unibyte, |
88365 | 132 coding_attr_plist, |
17052 | 133 |
88365 | 134 coding_attr_category, |
135 coding_attr_safe_charsets, | |
17052 | 136 |
88365 | 137 /* The following are extra attributes for each type. */ |
138 coding_attr_charset_valids, | |
17052 | 139 |
88365 | 140 coding_attr_ccl_decoder, |
141 coding_attr_ccl_encoder, | |
142 coding_attr_ccl_valids, | |
19279
3217a3ba8ef7
(CODING_FLAG_ISO_SAFE): New macro.
Kenichi Handa <handa@m17n.org>
parents:
19096
diff
changeset
|
143 |
88365 | 144 coding_attr_iso_initial, |
145 coding_attr_iso_usage, | |
146 coding_attr_iso_request, | |
147 coding_attr_iso_flags, | |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
148 |
88365 | 149 coding_attr_utf_16_bom, |
150 coding_attr_utf_16_endian, | |
19279
3217a3ba8ef7
(CODING_FLAG_ISO_SAFE): New macro.
Kenichi Handa <handa@m17n.org>
parents:
19096
diff
changeset
|
151 |
88365 | 152 coding_attr_emacs_mule_full, |
153 | |
154 coding_attr_last_index | |
155 }; | |
156 | |
17052 | 157 |
89886 | 158 /* Macros to access an element of an attribute vector. */ |
159 | |
88365 | 160 #define CODING_ATTR_BASE_NAME(attrs) AREF (attrs, coding_attr_base_name) |
161 #define CODING_ATTR_TYPE(attrs) AREF (attrs, coding_attr_type) | |
162 #define CODING_ATTR_CHARSET_LIST(attrs) AREF (attrs, coding_attr_charset_list) | |
163 #define CODING_ATTR_MNEMONIC(attrs) AREF (attrs, coding_attr_mnemonic) | |
164 #define CODING_ATTR_DOCSTRING(attrs) AREF (attrs, coding_attr_docstring) | |
165 #define CODING_ATTR_ASCII_COMPAT(attrs) AREF (attrs, coding_attr_ascii_compat) | |
166 #define CODING_ATTR_DECODE_TBL(attrs) AREF (attrs, coding_attr_decode_tbl) | |
167 #define CODING_ATTR_ENCODE_TBL(attrs) AREF (attrs, coding_attr_encode_tbl) | |
89733
d001bbbe12ce
(enum coding_attr_index): New member coding_attr_trans_tbl.
Kenichi Handa <handa@m17n.org>
parents:
89685
diff
changeset
|
168 #define CODING_ATTR_TRANS_TBL(attrs) AREF (attrs, coding_attr_trans_tbl) |
88365 | 169 #define CODING_ATTR_POST_READ(attrs) AREF (attrs, coding_attr_post_read) |
170 #define CODING_ATTR_PRE_WRITE(attrs) AREF (attrs, coding_attr_pre_write) | |
171 #define CODING_ATTR_DEFAULT_CHAR(attrs) AREF (attrs, coding_attr_default_char) | |
89483 | 172 #define CODING_ATTR_FOR_UNIBYTE(attrs) AREF (attrs, coding_attr_for_unibyte) |
88365 | 173 #define CODING_ATTR_FLUSHING(attrs) AREF (attrs, coding_attr_flushing) |
174 #define CODING_ATTR_PLIST(attrs) AREF (attrs, coding_attr_plist) | |
175 #define CODING_ATTR_CATEGORY(attrs) AREF (attrs, coding_attr_category) | |
176 #define CODING_ATTR_SAFE_CHARSETS(attrs)AREF (attrs, coding_attr_safe_charsets) | |
17052 | 177 |
88365 | 178 |
89886 | 179 /* Return the name of a coding system specified by ID. */ |
180 #define CODING_ID_NAME(id) \ | |
181 (HASH_KEY (XHASH_TABLE (Vcoding_system_hash_table), id)) | |
182 | |
183 /* Return the attribute vector of a coding system specified by ID. */ | |
184 | |
88365 | 185 #define CODING_ID_ATTRS(id) \ |
186 (AREF (HASH_VALUE (XHASH_TABLE (Vcoding_system_hash_table), id), 0)) | |
19284
dd1d7096f59d
(struct iso2022_spec): New member expected_charsets.
Kenichi Handa <handa@m17n.org>
parents:
19279
diff
changeset
|
187 |
89886 | 188 /* Return the list of aliases of a coding system specified by ID. */ |
189 | |
88365 | 190 #define CODING_ID_ALIASES(id) \ |
191 (AREF (HASH_VALUE (XHASH_TABLE (Vcoding_system_hash_table), id), 1)) | |
17118
dcfb481ee914
(struct iso2022_spec): Member requested_designation is
Kenichi Handa <handa@m17n.org>
parents:
17071
diff
changeset
|
192 |
89886 | 193 /* Return the eol-type of a coding system specified by ID. */ |
194 | |
88365 | 195 #define CODING_ID_EOL_TYPE(id) \ |
196 (AREF (HASH_VALUE (XHASH_TABLE (Vcoding_system_hash_table), id), 2)) | |
197 | |
89886 | 198 |
199 /* Return the spec vector of CODING_SYSTEM_SYMBOL. */ | |
17052 | 200 |
88365 | 201 #define CODING_SYSTEM_SPEC(coding_system_symbol) \ |
202 (Fgethash (coding_system_symbol, Vcoding_system_hash_table, Qnil)) | |
203 | |
89886 | 204 |
205 /* Return the ID of CODING_SYSTEM_SYMBOL. */ | |
206 | |
88365 | 207 #define CODING_SYSTEM_ID(coding_system_symbol) \ |
208 hash_lookup (XHASH_TABLE (Vcoding_system_hash_table), \ | |
209 coding_system_symbol, NULL) | |
210 | |
89886 | 211 /* Return 1 iff CODING_SYSTEM_SYMBOL is a coding system. */ |
212 | |
88365 | 213 #define CODING_SYSTEM_P(coding_system_symbol) \ |
214 (! NILP (CODING_SYSTEM_SPEC (coding_system_symbol))) | |
215 | |
89886 | 216 /* Check if X is a coding system or not. */ |
217 | |
89483 | 218 #define CHECK_CODING_SYSTEM(x) \ |
88365 | 219 do { \ |
220 if (!CODING_SYSTEM_P (x)) \ | |
89483 | 221 wrong_type_argument (Qcoding_system_p, (x)); \ |
88365 | 222 } while (0) |
223 | |
17052 | 224 |
89886 | 225 /* Check if X is a coding system or not. If it is, set SPEC to the |
226 spec vector of the coding system. */ | |
227 | |
88365 | 228 #define CHECK_CODING_SYSTEM_GET_SPEC(x, spec) \ |
229 do { \ | |
230 spec = CODING_SYSTEM_SPEC (x); \ | |
231 if (NILP (spec)) \ | |
232 x = wrong_type_argument (Qcoding_system_p, (x)); \ | |
233 } while (0) | |
234 | |
18001
9846609c4fd5
(struct iso2022_spec): Member requested_designation is
Kenichi Handa <handa@m17n.org>
parents:
17879
diff
changeset
|
235 |
89886 | 236 /* Check if X is a coding system or not. If it is, set ID to the |
237 ID of the coding system. */ | |
238 | |
88365 | 239 #define CHECK_CODING_SYSTEM_GET_ID(x, id) \ |
240 do \ | |
241 { \ | |
242 id = CODING_SYSTEM_ID (x); \ | |
243 if (id < 0) \ | |
244 x = wrong_type_argument (Qcoding_system_p, (x)); \ | |
245 } while (0) | |
17052 | 246 |
247 | |
248 /*** GENERAL section ***/ | |
249 | |
88365 | 250 /* Enumeration of result code of code conversion. */ |
251 enum coding_result_code | |
17052 | 252 { |
88365 | 253 CODING_RESULT_SUCCESS, |
254 CODING_RESULT_INSUFFICIENT_SRC, | |
255 CODING_RESULT_INSUFFICIENT_DST, | |
256 CODING_RESULT_INCONSISTENT_EOL, | |
89685
8970a5ea5efc
(enum coding_result_code): Delete
Kenichi Handa <handa@m17n.org>
parents:
89666
diff
changeset
|
257 CODING_RESULT_INVALID_SRC, |
88365 | 258 CODING_RESULT_INTERRUPT, |
259 CODING_RESULT_INSUFFICIENT_MEM | |
17052 | 260 }; |
261 | |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
262 |
21031 | 263 /* Macros used for the member `mode' of the struct coding_system. */ |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
264 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
265 /* If set, recover the original CR or LF of the already decoded text |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
266 when the decoding routine encounters an inconsistent eol format. */ |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
267 #define CODING_MODE_INHIBIT_INCONSISTENT_EOL 0x01 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
268 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
269 /* If set, the decoding/encoding routines treat the current data as |
89172 | 270 the last block of the whole text to be converted, and do the |
271 appropriate finishing job. */ | |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
272 #define CODING_MODE_LAST_BLOCK 0x02 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
273 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
274 /* If set, it means that the current source text is in a buffer which |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
275 enables selective display. */ |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
276 #define CODING_MODE_SELECTIVE_DISPLAY 0x04 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
277 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
278 /* This flag is used by the decoding/encoding routines on the fly. If |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
279 set, it means that right-to-left text is being processed. */ |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
280 #define CODING_MODE_DIRECTION 0x08 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
281 |
88365 | 282 #define CODING_MODE_FIXED_DESTINATION 0x10 |
283 | |
89886 | 284 /* If set, it means that the encoding routines produce some safe |
285 ASCII characters (usually '?') for unsupported characters. */ | |
88365 | 286 #define CODING_MODE_SAFE_ENCODING 0x20 |
287 | |
288 /* Structure of the field `spec.iso_2022' in the structure | |
289 `coding_system'. */ | |
290 struct iso_2022_spec | |
291 { | |
88688 | 292 /* Bit-wise-or of CODING_ISO_FLAG_XXX. */ |
88365 | 293 unsigned flags; |
294 | |
295 /* The current graphic register invoked to each graphic plane. */ | |
296 int current_invocation[2]; | |
297 | |
298 /* The current charset designated to each graphic register. The | |
299 value -1 means that no charset is designated, -2 means that | |
300 there was an invalid designation previously. */ | |
301 int current_designation[4]; | |
302 | |
303 /* Set to 1 temporarily only when graphic register 2 or 3 is invoked | |
304 by single-shift while encoding. */ | |
305 int single_shifting; | |
306 | |
307 /* Set to 1 temporarily only when processing at beginning of line. */ | |
308 int bol; | |
309 }; | |
310 | |
311 struct ccl_spec; | |
312 | |
313 enum utf_16_bom_type | |
314 { | |
315 utf_16_detect_bom, | |
316 utf_16_without_bom, | |
317 utf_16_with_bom | |
318 }; | |
319 | |
320 enum utf_16_endian_type | |
321 { | |
322 utf_16_big_endian, | |
323 utf_16_little_endian | |
324 }; | |
325 | |
326 struct utf_16_spec | |
327 { | |
328 enum utf_16_bom_type bom; | |
329 enum utf_16_endian_type endian; | |
330 int surrogate; | |
331 }; | |
332 | |
89330
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
333 struct coding_detection_info |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
334 { |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
335 /* Values of these members are bitwise-OR of CATEGORY_MASK_XXXs. */ |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
336 /* Which categories are already checked. */ |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
337 int checked; |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
338 /* Which categories are strongly found. */ |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
339 int found; |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
340 /* Which categories are rejected. */ |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
341 int rejected; |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
342 }; |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
343 |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
344 |
17052 | 345 struct coding_system |
346 { | |
88365 | 347 /* ID number of the coding system. This is an index to |
348 Vcoding_system_hash_table. This value is set by | |
349 setup_coding_system. At the early stage of building time, this | |
350 value is -1 in the array coding_categories to indicate that no | |
351 coding-system of that category is yet defined. */ | |
352 int id; | |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
353 |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
354 /* Flag bits of the coding system. The meaning of each bit is common |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
355 to all types of coding systems. */ |
88365 | 356 int common_flags; |
17052 | 357 |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
358 /* Mode bits of the coding system. See the comments of the macros |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
359 CODING_MODE_XXX. */ |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
360 unsigned int mode; |
17052 | 361 |
362 /* Detailed information specific to each type of coding system. */ | |
88365 | 363 union |
17052 | 364 { |
88365 | 365 struct iso_2022_spec iso_2022; |
366 struct ccl_spec *ccl; /* Defined in ccl.h. */ | |
367 struct utf_16_spec utf_16; | |
368 int emacs_mule_full_support; | |
17052 | 369 } spec; |
370 | |
88365 | 371 int max_charset_id; |
372 char *safe_charsets; | |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
373 |
88365 | 374 /* The following two members specify how binary 8-bit code 128..255 |
375 are represented in source and destination text respectively. 1 | |
376 means they are represented by 2-byte sequence, 0 means they are | |
377 represented by 1-byte as is (see the comment in character.h). */ | |
29006
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
378 unsigned src_multibyte : 1; |
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
379 unsigned dst_multibyte : 1; |
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
380 |
21320
278c256defc6
(struct coding_system): Comment for the member
Kenichi Handa <handa@m17n.org>
parents:
21051
diff
changeset
|
381 /* How many heading bytes we can skip for decoding. This is set to |
278c256defc6
(struct coding_system): Comment for the member
Kenichi Handa <handa@m17n.org>
parents:
21051
diff
changeset
|
382 -1 in setup_coding_system, and updated by detect_coding. So, |
278c256defc6
(struct coding_system): Comment for the member
Kenichi Handa <handa@m17n.org>
parents:
21051
diff
changeset
|
383 when this is equal to the byte length of the text being |
278c256defc6
(struct coding_system): Comment for the member
Kenichi Handa <handa@m17n.org>
parents:
21051
diff
changeset
|
384 converted, we can skip the actual conversion process. */ |
88365 | 385 int head_ascii; |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
386 |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
387 /* The following members are set by encoding/decoding routine. */ |
88365 | 388 EMACS_INT produced, produced_char, consumed, consumed_char; |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
389 |
29006
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
390 /* Number of error source data found in a decoding routine. */ |
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
391 int errors; |
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
392 |
88365 | 393 /* Store the positions of error source data. */ |
394 EMACS_INT *error_positions; | |
20930
1331679fe704
(struct coding_system): New member fake_multibyte.
Kenichi Handa <handa@m17n.org>
parents:
20717
diff
changeset
|
395 |
88365 | 396 /* Finish status of code conversion. */ |
397 enum coding_result_code result; | |
35530
cb627d09f8c3
(struct coding_system): New member suppress_error.
Kenichi Handa <handa@m17n.org>
parents:
34152
diff
changeset
|
398 |
88365 | 399 EMACS_INT src_pos, src_pos_byte, src_chars, src_bytes; |
400 Lisp_Object src_object; | |
89483 | 401 const unsigned char *source; |
17052 | 402 |
88365 | 403 EMACS_INT dst_pos, dst_pos_byte, dst_bytes; |
404 Lisp_Object dst_object; | |
405 unsigned char *destination; | |
406 | |
89886 | 407 /* Set to 1 iff the source of conversion is not in the member |
408 `charbuf', but at `src_object'. */ | |
88365 | 409 int chars_at_source; |
410 | |
411 /* If an element is non-negative, it is a character code. | |
412 | |
413 If it is in the range -128..-1, it is a 8-bit character code | |
414 minus 256. | |
17052 | 415 |
88365 | 416 If it is less than -128, it specifies the start of an annotation |
417 chunk. The length of the chunk is -128 minus the value of the | |
418 element. The following elements are OFFSET, ANNOTATION-TYPE, and | |
419 a sequence of actual data for the annotation. OFFSET is a | |
420 character position offset from dst_pos or src_pos, | |
421 ANNOTATION-TYPE specifies the meaning of the annotation and how to | |
422 handle the following data. */ | |
423 int *charbuf; | |
424 int charbuf_size, charbuf_used; | |
17052 | 425 |
88365 | 426 /* Set to 1 if charbuf contains an annotation. */ |
427 int annotated; | |
428 | |
429 unsigned char carryover[64]; | |
430 int carryover_bytes; | |
431 | |
432 int default_char; | |
433 | |
89330
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
434 int (*detector) P_ ((struct coding_system *, |
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
435 struct coding_detection_info *)); |
88365 | 436 void (*decoder) P_ ((struct coding_system *)); |
437 int (*encoder) P_ ((struct coding_system *)); | |
17052 | 438 }; |
439 | |
88365 | 440 /* Meanings of bits in the member `common_flags' of the structure |
441 coding_system. The lowest 8 bits are reserved for various kinds of | |
442 annotations (currently two of them are used). */ | |
443 #define CODING_ANNOTATION_MASK 0x00FF | |
444 #define CODING_ANNOTATE_COMPOSITION_MASK 0x0001 | |
445 #define CODING_ANNOTATE_DIRECTION_MASK 0x0002 | |
89330
ee0338e83a2b
(struct coding_detection_info): New structure.
Kenichi Handa <handa@m17n.org>
parents:
89172
diff
changeset
|
446 #define CODING_ANNOTATE_CHARSET_MASK 0x0003 |
88365 | 447 #define CODING_FOR_UNIBYTE_MASK 0x0100 |
448 #define CODING_REQUIRE_FLUSHING_MASK 0x0200 | |
449 #define CODING_REQUIRE_DECODING_MASK 0x0400 | |
450 #define CODING_REQUIRE_ENCODING_MASK 0x0800 | |
451 #define CODING_REQUIRE_DETECTION_MASK 0x1000 | |
452 #define CODING_RESET_AT_BOL_MASK 0x2000 | |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
453 |
88365 | 454 /* Return 1 if the coding context CODING requires annotation |
455 handling. */ | |
456 #define CODING_REQUIRE_ANNOTATION(coding) \ | |
457 ((coding)->common_flags & CODING_ANNOTATION_MASK) | |
458 | |
459 /* Return 1 if the coding context CODING prefers decoding into unibyte. */ | |
460 #define CODING_FOR_UNIBYTE(coding) \ | |
461 ((coding)->common_flags & CODING_FOR_UNIBYTE_MASK) | |
462 | |
463 /* Return 1 if the coding context CODING requires specific code to be | |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
464 attached at the tail of converted text. */ |
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
465 #define CODING_REQUIRE_FLUSHING(coding) \ |
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
466 ((coding)->common_flags & CODING_REQUIRE_FLUSHING_MASK) |
17052 | 467 |
88365 | 468 /* Return 1 if the coding context CODING requires code conversion on |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
469 decoding. */ |
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
470 #define CODING_REQUIRE_DECODING(coding) \ |
29006
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
471 ((coding)->dst_multibyte \ |
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
472 || (coding)->common_flags & CODING_REQUIRE_DECODING_MASK) |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
473 |
88365 | 474 |
475 /* Return 1 if the coding context CODING requires code conversion on | |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
476 encoding. */ |
88365 | 477 #define CODING_REQUIRE_ENCODING(coding) \ |
478 ((coding)->src_multibyte \ | |
479 || (coding)->common_flags & CODING_REQUIRE_ENCODING_MASK \ | |
480 || (coding)->mode & CODING_MODE_SELECTIVE_DISPLAY) | |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
481 |
88365 | 482 |
483 /* Return 1 if the coding context CODING requires some kind of code | |
20226
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
484 detection. */ |
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
485 #define CODING_REQUIRE_DETECTION(coding) \ |
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
486 ((coding)->common_flags & CODING_REQUIRE_DETECTION_MASK) |
549826cf2952
(struct coding_system): Add member common_flags, delete
Kenichi Handa <handa@m17n.org>
parents:
20149
diff
changeset
|
487 |
88365 | 488 /* Return 1 if the coding context CODING requires code conversion on |
29006
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
489 decoding or some kind of code detection. */ |
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
490 #define CODING_MAY_REQUIRE_DECODING(coding) \ |
29006
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
491 (CODING_REQUIRE_DECODING (coding) \ |
bf92db6e609a
(enum iso_code_class_type): Member ISO_control_code is
Kenichi Handa <handa@m17n.org>
parents:
28512
diff
changeset
|
492 || CODING_REQUIRE_DETECTION (coding)) |
17052 | 493 |
494 /* Macros to decode or encode a character of JISX0208 in SJIS. S1 and | |
495 S2 are the 1st and 2nd position-codes of JISX0208 in SJIS coding | |
496 system. C1 and C2 are the 1st and 2nd position codes of Emacs' | |
497 internal format. */ | |
498 | |
88365 | 499 #define SJIS_TO_JIS(code) \ |
500 do { \ | |
501 int s1, s2, j1, j2; \ | |
502 \ | |
503 s1 = (code) >> 8, s2 = (code) & 0xFF; \ | |
504 \ | |
505 if (s2 >= 0x9F) \ | |
506 (j1 = s1 * 2 - (s1 >= 0xE0 ? 0x160 : 0xE0), \ | |
507 j2 = s2 - 0x7E); \ | |
508 else \ | |
509 (j1 = s1 * 2 - ((s1 >= 0xE0) ? 0x161 : 0xE1), \ | |
510 j2 = s2 - ((s2 >= 0x7F) ? 0x20 : 0x1F)); \ | |
511 (code) = (j1 << 8) | j2; \ | |
17052 | 512 } while (0) |
513 | |
89765
b06a8c2162e5
(SJIS_TO_JIS2, JIS_TO_SJIS2): New macros.
Kenichi Handa <handa@m17n.org>
parents:
89733
diff
changeset
|
/* Replace the SJIS code held in CODE, packed as
   (first byte << 8) | second byte, with a JIS-style code packed the
   same way.  Unlike SJIS_TO_JIS, first bytes 0xF0..0xF4 are mapped
   through an explicit table and larger ones linearly from 0x6E/0x6F.
   NOTE(review): presumably this targets the second plane of
   JIS X 0213 -- confirm against the callers.
   CODE is read twice and then assigned, so it must be an lvalue.  */
#define SJIS_TO_JIS2(code) \
  do { \
    int sjis_hi_ = (code) >> 8; \
    int sjis_lo_ = (code) & 0xFF; \
    int jis_hi_, jis_lo_; \
 \
    if (sjis_lo_ >= 0x9F) \
      { \
        /* Upper half of the second-byte range.  */ \
        switch (sjis_hi_) \
          { \
          case 0xF0: jis_hi_ = 0x28; break; \
          case 0xF1: jis_hi_ = 0x24; break; \
          case 0xF2: jis_hi_ = 0x2C; break; \
          case 0xF3: jis_hi_ = 0x2E; break; \
          default: jis_hi_ = 0x6E + (sjis_hi_ - 0xF4) * 2; break; \
          } \
        jis_lo_ = sjis_lo_ - 0x7E; \
      } \
    else \
      { \
        /* Lower half of the second-byte range.  */ \
        if (sjis_hi_ <= 0xF2) \
          jis_hi_ = 0x21 + (sjis_hi_ - 0xF0) * 2; \
        else if (sjis_hi_ <= 0xF4) \
          jis_hi_ = 0x2D + (sjis_hi_ - 0xF3) * 2; \
        else \
          jis_hi_ = 0x6F + (sjis_hi_ - 0xF5) * 2; \
        jis_lo_ = sjis_lo_ - (sjis_lo_ < 0x7F ? 0x1F : 0x20); \
      } \
    (code) = (jis_hi_ << 8) | jis_lo_; \
  } while (0)
b06a8c2162e5
(SJIS_TO_JIS2, JIS_TO_SJIS2): New macros.
Kenichi Handa <handa@m17n.org>
parents:
89733
diff
changeset
|
538 |
88365 | 539 |
/* Replace the JIS code held in CODE, packed as
   (first byte << 8) | second byte, with the corresponding SJIS code
   packed the same way.  This is the inverse of SJIS_TO_JIS.
   CODE is read twice and then assigned, so it must be an lvalue.  */
#define JIS_TO_SJIS(code) \
  do { \
    int jis_hi_ = (code) >> 8; \
    int jis_lo_ = (code) & 0xFF; \
    /* 1 when the first JIS byte is odd, else 0.  */ \
    int odd_row_ = jis_hi_ & 1; \
    /* Two JIS rows share one SJIS first byte; an odd row lands one \
       above the base used for even rows.  */ \
    int sjis_hi_ = (jis_hi_ / 2 \
                    + (jis_hi_ < 0x5F ? 0x70 : 0xB0) \
                    + odd_row_); \
    /* Odd rows use the low second-byte range (skipping 0x7F), even \
       rows the range starting at 0x9F.  */ \
    int sjis_lo_ = (jis_lo_ \
                    + (!odd_row_ ? 0x7E \
                       : jis_lo_ < 0x60 ? 0x1F \
                       : 0x20)); \
 \
    (code) = (sjis_hi_ << 8) | sjis_lo_; \
  } while (0)
553 | |
89765
b06a8c2162e5
(SJIS_TO_JIS2, JIS_TO_SJIS2): New macros.
Kenichi Handa <handa@m17n.org>
parents:
89733
diff
changeset
|
/* Replace the JIS-style code held in CODE, packed as
   (first byte << 8) | second byte, with the SJIS code that
   SJIS_TO_JIS2 would map back to it.  CODE is read twice and then
   assigned, so it must be an lvalue.  */
#define JIS_TO_SJIS2(code) \
  do { \
    int s1, s2, j1, j2; \
 \
    j1 = (code) >> 8, j2 = (code) & 0xFF; \
    if (j1 & 1) \
      { \
        /* Odd first bytes.  SJIS_TO_JIS2 yields 0x21, 0x23, 0x25 \
           for 0xF0..0xF2, then 0x2D, 0x2F for 0xF3..0xF4, then \
           0x6F and up for 0xF5 and up; the middle range therefore \
           has to reach 0x2F.  */ \
        s1 = (j1 <= 0x25 ? 0xF0 + (j1 - 0x21) / 2 \
              : j1 <= 0x2F ? 0xF3 + (j1 - 0x2D) / 2 \
              : 0xF5 + (j1 - 0x6F) / 2); \
        /* Low second-byte range, skipping 0x7F.  */ \
        s2 = j2 + ((j2 >= 0x60) ? 0x20 : 0x1F); \
      } \
    else \
      { \
        /* Even first bytes: four irregular values, then a linear \
           run starting at 0x6E.  */ \
        s1 = (j1 == 0x28 ? 0xF0 \
              : j1 == 0x24 ? 0xF1 \
              : j1 == 0x2C ? 0xF2 \
              : j1 == 0x2E ? 0xF3 \
              : 0xF4 + (j1 - 0x6E) / 2); \
        s2 = j2 + 0x7E; \
      } \
    (code) = (s1 << 8) | s2; \
  } while (0)
88365 | 577 |
21051
b5844e2bf088
(ENCODE_FILE): Moved from fileio.c. Use
Kenichi Handa <handa@m17n.org>
parents:
21031
diff
changeset
|
/* Encode the file name NAME using the coding system for file names,
   if any.  Vfile_name_coding_system is tried first, then
   Vdefault_file_name_coding_system; a coding system is used only when
   it is non-nil and its XFASTINT value is nonzero.  When neither
   qualifies the expansion is NAME itself.  NAME appears in several
   branches, but only one of them is evaluated.  */
#define ENCODE_FILE(name) \
  ((NILP (Vfile_name_coding_system) \
    || XFASTINT (Vfile_name_coding_system) == 0) \
   ? ((NILP (Vdefault_file_name_coding_system) \
       || XFASTINT (Vdefault_file_name_coding_system) == 0) \
      ? name \
      : code_convert_string_norecord (name, \
                                      Vdefault_file_name_coding_system, \
                                      1)) \
   : code_convert_string_norecord (name, Vfile_name_coding_system, 1))
b5844e2bf088
(ENCODE_FILE): Moved from fileio.c. Use
Kenichi Handa <handa@m17n.org>
parents:
21031
diff
changeset
|
588 |
88365 | 589 |
21051
b5844e2bf088
(ENCODE_FILE): Moved from fileio.c. Use
Kenichi Handa <handa@m17n.org>
parents:
21031
diff
changeset
|
/* Decode the file name NAME using the coding system for file names,
   if any.  Vfile_name_coding_system is tried first, then
   Vdefault_file_name_coding_system; a coding system is used only when
   it is non-nil and its XFASTINT value is nonzero.  When neither
   qualifies the expansion is NAME itself.  NAME appears in several
   branches, but only one of them is evaluated.  */
#define DECODE_FILE(name) \
  ((NILP (Vfile_name_coding_system) \
    || XFASTINT (Vfile_name_coding_system) == 0) \
   ? ((NILP (Vdefault_file_name_coding_system) \
       || XFASTINT (Vdefault_file_name_coding_system) == 0) \
      ? name \
      : code_convert_string_norecord (name, \
                                      Vdefault_file_name_coding_system, \
                                      0)) \
   : code_convert_string_norecord (name, Vfile_name_coding_system, 0))
b5844e2bf088
(ENCODE_FILE): Moved from fileio.c. Use
Kenichi Handa <handa@m17n.org>
parents:
21031
diff
changeset
|
600 |
88365 | 601 |
29310
2ffc1fff111a
(ENCODE_SYSTEM, DECODE_SYSTEM) [WINDOWSNT]: New macros.
Jason Rumney <jasonr@gnu.org>
parents:
29274
diff
changeset
|
602 #ifdef WINDOWSNT |
2ffc1fff111a
(ENCODE_SYSTEM, DECODE_SYSTEM) [WINDOWSNT]: New macros.
Jason Rumney <jasonr@gnu.org>
parents:
29274
diff
changeset
|
/* Encode the string STR using the specified coding system
   for w32 system functions, if any.  Vlocale_coding_system is used
   when it is non-nil and its XFASTINT value is nonzero; otherwise
   the expansion is STR itself.  */
#define ENCODE_SYSTEM(str) \
  ((NILP (Vlocale_coding_system) \
    || XFASTINT (Vlocale_coding_system) == 0) \
   ? str \
   : code_convert_string_norecord (str, Vlocale_coding_system, 1))
2ffc1fff111a
(ENCODE_SYSTEM, DECODE_SYSTEM) [WINDOWSNT]: New macros.
Jason Rumney <jasonr@gnu.org>
parents:
29274
diff
changeset
|
610 |
2ffc1fff111a
(ENCODE_SYSTEM, DECODE_SYSTEM) [WINDOWSNT]: New macros.
Jason Rumney <jasonr@gnu.org>
parents:
29274
diff
changeset
|
/* Decode the string STR using the specified coding system
   for w32 system functions, if any.  Vlocale_coding_system is used
   when it is non-nil and its XFASTINT value is nonzero; otherwise
   the expansion is STR itself.  */
#define DECODE_SYSTEM(str) \
  (! NILP (Vlocale_coding_system) \
   && XFASTINT (Vlocale_coding_system) != 0 \
   ? code_convert_string_norecord (str, Vlocale_coding_system, 0) \
   : (str))
39574
bdd381bc9eb0
(ENCODE_SYSTEM, DECODE_SYSTEM): Define also for non-NT.
Gerd Moellmann <gerd@gnu.org>
parents:
36088
diff
changeset
|
618 |
bdd381bc9eb0
(ENCODE_SYSTEM, DECODE_SYSTEM): Define also for non-NT.
Gerd Moellmann <gerd@gnu.org>
parents:
36088
diff
changeset
|
619 #else /* WINDOWSNT */ |
bdd381bc9eb0
(ENCODE_SYSTEM, DECODE_SYSTEM): Define also for non-NT.
Gerd Moellmann <gerd@gnu.org>
parents:
36088
diff
changeset
|
620 |
bdd381bc9eb0
(ENCODE_SYSTEM, DECODE_SYSTEM): Define also for non-NT.
Gerd Moellmann <gerd@gnu.org>
parents:
36088
diff
changeset
|
/* Without WINDOWSNT, ENCODE_SYSTEM passes STR through
   string_make_unibyte and DECODE_SYSTEM yields NAME unchanged.  The
   result of DECODE_SYSTEM is parenthesized so that an operator next
   to the macro call cannot bind to part of the argument.  */
#define ENCODE_SYSTEM(str) string_make_unibyte (str)
#define DECODE_SYSTEM(name) (name)
bdd381bc9eb0
(ENCODE_SYSTEM, DECODE_SYSTEM): Define also for non-NT.
Gerd Moellmann <gerd@gnu.org>
parents:
36088
diff
changeset
|
623 |
bdd381bc9eb0
(ENCODE_SYSTEM, DECODE_SYSTEM): Define also for non-NT.
Gerd Moellmann <gerd@gnu.org>
parents:
36088
diff
changeset
|
624 #endif /* !WINDOWSNT */ |
29310
2ffc1fff111a
(ENCODE_SYSTEM, DECODE_SYSTEM) [WINDOWSNT]: New macros.
Jason Rumney <jasonr@gnu.org>
parents:
29274
diff
changeset
|
625 |
89506 | 626 /* Used by the gtk menu code. Note that this encodes utf-8, not |
627 utf-8-emacs, so it's not a no-op. */ | |
628 #define ENCODE_UTF_8(str) code_convert_string_norecord (str, Qutf_8, 1) | |
629 | |
17052 | 630 /* Extern declarations. */ |
89666
7d38a63951c0
(make_conversion_work_buffer): Delete extern.
Kenichi Handa <handa@m17n.org>
parents:
89506
diff
changeset
|
631 extern Lisp_Object code_conversion_save P_ ((int, int)); |
20308
8d520e3dcb86
Add more prototypes and function declarations.
Andreas Schwab <schwab@suse.de>
parents:
20226
diff
changeset
|
632 extern int decoding_buffer_size P_ ((struct coding_system *, int)); |
8d520e3dcb86
Add more prototypes and function declarations.
Andreas Schwab <schwab@suse.de>
parents:
20226
diff
changeset
|
633 extern int encoding_buffer_size P_ ((struct coding_system *, int)); |
88365 | 634 extern void setup_coding_system P_ ((Lisp_Object, struct coding_system *)); |
635 extern void detect_coding P_ ((struct coding_system *)); | |
88848
a55219c46b8c
(code_convert_region): Fix prototype.
Dave Love <fx@gnu.org>
parents:
88688
diff
changeset
|
636 extern Lisp_Object code_convert_region P_ ((Lisp_Object, Lisp_Object, |
88365 | 637 Lisp_Object, Lisp_Object, |
638 int, int)); | |
639 extern Lisp_Object code_convert_string P_ ((Lisp_Object, Lisp_Object, | |
640 Lisp_Object, int, int, int)); | |
29438
8c825a8566f5
Declare code_convert_string_norecord.
Dave Love <fx@gnu.org>
parents:
29310
diff
changeset
|
641 extern Lisp_Object code_convert_string_norecord P_ ((Lisp_Object, Lisp_Object, |
8c825a8566f5
Declare code_convert_string_norecord.
Dave Love <fx@gnu.org>
parents:
29310
diff
changeset
|
642 int)); |
88365 | 643 extern Lisp_Object raw_text_coding_system P_ ((Lisp_Object)); |
644 extern Lisp_Object coding_inherit_eol_type P_ ((Lisp_Object, Lisp_Object)); | |
645 | |
646 extern int decode_coding_gap P_ ((struct coding_system *, | |
647 EMACS_INT, EMACS_INT)); | |
648 extern int encode_coding_gap P_ ((struct coding_system *, | |
649 EMACS_INT, EMACS_INT)); | |
650 extern void decode_coding_object P_ ((struct coding_system *, | |
651 Lisp_Object, EMACS_INT, EMACS_INT, | |
652 EMACS_INT, EMACS_INT, Lisp_Object)); | |
653 extern void encode_coding_object P_ ((struct coding_system *, | |
654 Lisp_Object, EMACS_INT, EMACS_INT, | |
655 EMACS_INT, EMACS_INT, Lisp_Object)); | |
656 | |
89886 | 657 /* Macros for backward compatibility. */ |
658 | |
/* Expand to a decode_coding_object call for CODING in which the
   current buffer (Fcurrent_buffer ()) is both the second and the
   last argument, and FROM and TO are each followed by their
   CHAR_TO_BYTE conversion.  FROM and TO are each expanded twice.  */
88365 | 659 #define decode_coding_region(coding, from, to) \ |
660 decode_coding_object (coding, Fcurrent_buffer (), \ | |
661 from, CHAR_TO_BYTE (from), \ | |
662 to, CHAR_TO_BYTE (to), Fcurrent_buffer ()) | |
663 | |
664 | |
/* Expand to an encode_coding_object call for CODING in which the
   current buffer (Fcurrent_buffer ()) is both the second and the
   last argument, and FROM and TO are each followed by their
   CHAR_TO_BYTE conversion.  FROM and TO are each expanded twice.  */
665 #define encode_coding_region(coding, from, to) \ | |
666 encode_coding_object (coding, Fcurrent_buffer (), \ | |
667 from, CHAR_TO_BYTE (from), \ | |
668 to, CHAR_TO_BYTE (to), Fcurrent_buffer ()) | |
669 | |
670 | |
/* Expand to a decode_coding_object call on STRING covering 0 up to
   XSTRING (string)->size, with STRING_BYTES (XSTRING (string)) as
   the matching byte count and Qt as the last argument.  NOCOPY is
   accepted but does not appear in the expansion.  STRING is expanded
   three times.  */
671 #define decode_coding_string(coding, string, nocopy) \ | |
672 decode_coding_object (coding, string, 0, 0, XSTRING (string)->size, \ | |
673 STRING_BYTES (XSTRING (string)), Qt) | |
674 | |
/* Expand to a comma expression: first an encode_coding_object call
   on STRING covering 0 up to XSTRING (string)->size, with
   STRING_BYTES (XSTRING (string)) as the matching byte count and Qt
   as the last argument, then (coding)->dst_object, which is the
   value of the whole expression.  NOCOPY is accepted but does not
   appear in the expansion.  CODING is expanded twice and STRING
   three times.  */
675 #define encode_coding_string(coding, string, nocopy) \ | |
676 (encode_coding_object (coding, string, 0, 0, XSTRING (string)->size, \ | |
677 STRING_BYTES (XSTRING (string)), Qt), \ | |
678 (coding)->dst_object) | |
679 | |
680 | |
/* Statement macro.  Store SRC in (coding)->source and BYTES in both
   (coding)->src_chars and (coding)->src_bytes, then call
   decode_coding_object with Qnil as the second argument, the range
   0 .. BYTES for both position pairs, and DST_OBJECT as the last
   argument.  CODING is expanded four times and BYTES three times,
   so neither should have side effects.  */
681 #define decode_coding_c_string(coding, src, bytes, dst_object) \ | |
682 do { \ | |
683 (coding)->source = (src); \ | |
684 (coding)->src_chars = (coding)->src_bytes = (bytes); \ | |
685 decode_coding_object ((coding), Qnil, 0, 0, (bytes), (bytes), \ | |
686 (dst_object)); \ | |
687 } while (0) | |
688 | |
689 | |
690 extern Lisp_Object preferred_coding_system P_ (()); | |
691 | |
692 | |
89483 | 693 extern Lisp_Object Qutf_8, Qutf_8_emacs; |
694 | |
17052 | 695 extern Lisp_Object Qcoding_system, Qeol_type, Qcoding_category_index; |
88365 | 696 extern Lisp_Object Qcoding_system_p; |
697 extern Lisp_Object Qraw_text, Qemacs_mule, Qno_conversion, Qundecided; | |
698 extern Lisp_Object Qiso_2022; | |
17052 | 699 extern Lisp_Object Qbuffer_file_coding_system; |
88365 | 700 |
701 extern Lisp_Object Qunix, Qdos, Qmac; | |
17052 | 702 |
22186
fc4aaf1b1772
Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents:
22118
diff
changeset
|
703 extern Lisp_Object Qtranslation_table; |
fc4aaf1b1772
Change term "character translation table" to "translation table".
Kenichi Handa <handa@m17n.org>
parents:
22118
diff
changeset
|
704 extern Lisp_Object Qtranslation_table_id; |
22118
42e2ffa98618
Change terms unify/unification to
Kenichi Handa <handa@m17n.org>
parents:
21901
diff
changeset
|
705 |
24201
d324ba7d0e40
eol-mnemonic-* variables are now strings, not characters.
Eli Zaretskii <eliz@gnu.org>
parents:
23324
diff
changeset
|
706 /* Mnemonic strings to indicate each type of end-of-line. */ |
d324ba7d0e40
eol-mnemonic-* variables are now strings, not characters.
Eli Zaretskii <eliz@gnu.org>
parents:
23324
diff
changeset
|
707 extern Lisp_Object eol_mnemonic_unix, eol_mnemonic_dos, eol_mnemonic_mac; |
d324ba7d0e40
eol-mnemonic-* variables are now strings, not characters.
Eli Zaretskii <eliz@gnu.org>
parents:
23324
diff
changeset
|
708 /* Mnemonic string to indicate type of end-of-line is not yet decided. */ |
d324ba7d0e40
eol-mnemonic-* variables are now strings, not characters.
Eli Zaretskii <eliz@gnu.org>
parents:
23324
diff
changeset
|
709 extern Lisp_Object eol_mnemonic_undecided; |
17052 | 710 |
711 #ifdef emacs | |
712 extern Lisp_Object Qfile_coding_system; | |
713 extern Lisp_Object Qcall_process, Qcall_process_region, Qprocess_argument; | |
714 extern Lisp_Object Qstart_process, Qopen_network_stream; | |
34107
46e0ec24a961
(Qwrite_region, Qcoding_system_error): Declare extern.
Gerd Moellmann <gerd@gnu.org>
parents:
30832
diff
changeset
|
715 extern Lisp_Object Qwrite_region; |
17052 | 716 |
26088
b7aa6ac26872
Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents:
25378
diff
changeset
|
717 extern char *emacs_strerror P_ ((int)); |
b7aa6ac26872
Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents:
25378
diff
changeset
|
718 |
17052 | 719 /* Coding-system for reading files and receiving data from process. */ |
720 extern Lisp_Object Vcoding_system_for_read; | |
721 /* Coding-system for writing files and sending data to process. */ | |
722 extern Lisp_Object Vcoding_system_for_write; | |
723 /* Coding-system actually used in the latest I/O. */ | |
724 extern Lisp_Object Vlast_coding_system_used; | |
26088
b7aa6ac26872
Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents:
25378
diff
changeset
|
725 /* Coding-system to use with system messages (e.g. strerror). */ |
b7aa6ac26872
Add support for large files, 64-bit Solaris, system locale codings.
Paul Eggert <eggert@twinsun.com>
parents:
25378
diff
changeset
|
726 extern Lisp_Object Vlocale_coding_system; |
17052 | 727 |
21573
92b33933ceeb
Declare inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents:
21515
diff
changeset
|
728 /* If non-zero, process buffer inherits the coding system used to decode |
92b33933ceeb
Declare inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents:
21515
diff
changeset
|
729 the subprocess output. */ |
92b33933ceeb
Declare inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents:
21515
diff
changeset
|
730 extern int inherit_process_coding_system; |
92b33933ceeb
Declare inherit-process-coding-system.
Eli Zaretskii <eliz@gnu.org>
parents:
21515
diff
changeset
|
731 |
17052 | 732 /* Coding-system to be used for encoding terminal output. This |
733 structure contains information of a coding-system specified by the | |
734 function `set-terminal-coding-system'. */ | |
735 extern struct coding_system terminal_coding; | |
736 | |
19279
3217a3ba8ef7
(CODING_FLAG_ISO_SAFE): New macro.
Kenichi Handa <handa@m17n.org>
parents:
19096
diff
changeset
|
737 /* Coding system to be used to encode text for terminal display when |
3217a3ba8ef7
(CODING_FLAG_ISO_SAFE): New macro.
Kenichi Handa <handa@m17n.org>
parents:
19096
diff
changeset
|
738 terminal coding system is nil. */ |
3217a3ba8ef7
(CODING_FLAG_ISO_SAFE): New macro.
Kenichi Handa <handa@m17n.org>
parents:
19096
diff
changeset
|
739 extern struct coding_system safe_terminal_coding; |
3217a3ba8ef7
(CODING_FLAG_ISO_SAFE): New macro.
Kenichi Handa <handa@m17n.org>
parents:
19096
diff
changeset
|
740 |
17052 | 741 /* Coding-system of what is sent from terminal keyboard. This |
742 structure contains information of a coding-system specified by the | |
743 function `set-keyboard-coding-system'. */ | |
744 extern struct coding_system keyboard_coding; | |
745 | |
18181
1d91f0e4ff7d
(Vdefault_process_coding_system): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
18001
diff
changeset
|
746 /* Default coding systems used for process I/O. */ |
1d91f0e4ff7d
(Vdefault_process_coding_system): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
18001
diff
changeset
|
747 extern Lisp_Object Vdefault_process_coding_system; |
17052 | 748 |
88365 | 749 /* Function to call to force a user to select a proper coding
20717
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
750 system. */ |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
751 extern Lisp_Object Vselect_safe_coding_system_function; |
19463997fbc6
(CODING_FLAG_ISO_DESIGNATION): New macro.
Kenichi Handa <handa@m17n.org>
parents:
20308
diff
changeset
|
752 |
48875
e79464fe61d7
(coding_system_require_warning): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
46549
diff
changeset
|
753 /* If nonzero, on writing a file, Vselect_safe_coding_system_function |
e79464fe61d7
(coding_system_require_warning): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
46549
diff
changeset
|
754 is called even if Vcoding_system_for_write is non-nil. */ |
e79464fe61d7
(coding_system_require_warning): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
46549
diff
changeset
|
755 extern int coding_system_require_warning; |
e79464fe61d7
(coding_system_require_warning): Extern it.
Kenichi Handa <handa@m17n.org>
parents:
46549
diff
changeset
|
756 |
21901
1b46a79d86e3
(Vfile_name_coding_system)
Richard M. Stallman <rms@gnu.org>
parents:
21573
diff
changeset
|
757 /* Coding system for file names, or nil if none. */ |
1b46a79d86e3
(Vfile_name_coding_system)
Richard M. Stallman <rms@gnu.org>
parents:
21573
diff
changeset
|
758 extern Lisp_Object Vfile_name_coding_system; |
1b46a79d86e3
(Vfile_name_coding_system)
Richard M. Stallman <rms@gnu.org>
parents:
21573
diff
changeset
|
759 |
1b46a79d86e3
(Vfile_name_coding_system)
Richard M. Stallman <rms@gnu.org>
parents:
21573
diff
changeset
|
760 /* Coding system for file names used only when |
1b46a79d86e3
(Vfile_name_coding_system)
Richard M. Stallman <rms@gnu.org>
parents:
21573
diff
changeset
|
761 Vfile_name_coding_system is nil. */ |
1b46a79d86e3
(Vfile_name_coding_system)
Richard M. Stallman <rms@gnu.org>
parents:
21573
diff
changeset
|
762 extern Lisp_Object Vdefault_file_name_coding_system; |
29310
2ffc1fff111a
(ENCODE_SYSTEM, DECODE_SYSTEM) [WINDOWSNT]: New macros.
Jason Rumney <jasonr@gnu.org>
parents:
29274
diff
changeset
|
763 |
17052 | 764 #endif |
765 | |
34107
46e0ec24a961
(Qwrite_region, Qcoding_system_error): Declare extern.
Gerd Moellmann <gerd@gnu.org>
parents:
30832
diff
changeset
|
766 /* Error signaled when there's a problem with detecting a coding system.  */ |
46e0ec24a961
(Qwrite_region, Qcoding_system_error): Declare extern.
Gerd Moellmann <gerd@gnu.org>
parents:
30832
diff
changeset
|
767 extern Lisp_Object Qcoding_system_error; |
46e0ec24a961
(Qwrite_region, Qcoding_system_error): Declare extern.
Gerd Moellmann <gerd@gnu.org>
parents:
30832
diff
changeset
|
768 |
88365 | 769 extern char emacs_mule_bytes[256]; |
770 extern int emacs_mule_string_char P_ ((unsigned char *)); | |
771 | |
29571
951ead33c624
(EMASC_CODING_H): Renamed from _CODING_H.
Kenichi Handa <handa@m17n.org>
parents:
29438
diff
changeset
|
772 #endif /* EMACS_CODING_H */ |
89889 | 773 |
774 /* arch-tag: 2bc3b4fa-6870-4f64-8135-b962b2d290e4 | |
775 (do not change this comment) */ |